David Pomerenke
committed on
Commit
·
eaf2d97
1
Parent(s):
7cdde63
spBLEU tokenizer, run on more languages
Browse files
- bibliography.bib +16 -0
- data/INFO +1 -1
- evals/main.py +1 -1
- evals/tasks.py +3 -3
- frontend/public/{LICENSE → INFO} +0 -0
- frontend/public/results.json +371 -371
- results.json +1720 -280
bibliography.bib
CHANGED
|
@@ -209,6 +209,22 @@
|
|
| 209 |
keywords = {dataset,n=200}
|
| 210 |
}
|
| 211 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 212 |
@inproceedings{robinsonChatGPTMTCompetitive2023,
|
| 213 |
title = {{{ChatGPT MT}}: {{Competitive}} for {{High-}} (but {{Not Low-}}) {{Resource Languages}}},
|
| 214 |
shorttitle = {{{ChatGPT MT}}},
|
|
|
|
| 209 |
keywords = {dataset,n=200}
|
| 210 |
}
|
| 211 |
|
| 212 |
+
@misc{petrovLanguageModelTokenizers2023,
|
| 213 |
+
title = {Language {{Model Tokenizers Introduce Unfairness Between Languages}}},
|
| 214 |
+
author = {Petrov, Aleksandar and Malfa, Emanuele La and Torr, Philip H. S. and Bibi, Adel},
|
| 215 |
+
year = {2023},
|
| 216 |
+
month = oct,
|
| 217 |
+
number = {arXiv:2305.15425},
|
| 218 |
+
eprint = {2305.15425},
|
| 219 |
+
primaryclass = {cs},
|
| 220 |
+
publisher = {arXiv},
|
| 221 |
+
doi = {10.48550/arXiv.2305.15425},
|
| 222 |
+
urldate = {2025-03-24},
|
| 223 |
+
abstract = {Recent language models have shown impressive multilingual performance, even when not explicitly trained for it. Despite this, there are concerns about the quality of their outputs across different languages. In this paper, we show how disparity in the treatment of different languages arises at the tokenization stage, well before a model is even invoked. The same text translated into different languages can have drastically different tokenization lengths, with differences up to 15 times in some cases. These disparities persist even for tokenizers that are intentionally trained for multilingual support. Character-level and byte-level models also exhibit over 4 times the difference in the encoding length for some language pairs. This induces unfair treatment for some language communities in regard to the cost of accessing commercial language services, the processing time and latency, as well as the amount of content that can be provided as context to the models. Therefore, we make the case that we should train future language models using multilingually fair subword tokenizers.},
|
| 224 |
+
archiveprefix = {arXiv},
|
| 225 |
+
file = {/Users/david/Zotero/storage/NX3DT98Z/Petrov et al. - 2023 - Language Model Tokenizers Introduce Unfairness Between Languages.pdf;/Users/david/Zotero/storage/FKJQP22D/2305.html}
|
| 226 |
+
}
|
| 227 |
+
|
| 228 |
@inproceedings{robinsonChatGPTMTCompetitive2023,
|
| 229 |
title = {{{ChatGPT MT}}: {{Competitive}} for {{High-}} (but {{Not Low-}}) {{Resource Languages}}},
|
| 230 |
shorttitle = {{{ChatGPT MT}}},
|
data/INFO
CHANGED
|
@@ -2,4 +2,4 @@ fleurs: https://huggingface.co/datasets/google/fleurs via eval.py
|
|
| 2 |
floresp-v2.0-rc.3: https://github.com/openlanguagedata/flores
|
| 3 |
glottolog_languoid.csv: https://glottolog.org/meta/downloads
|
| 4 |
ScriptCodes.csv: https://www.unicode.org/iso15924/iso15924-codes.html
|
| 5 |
-
spbleu: https://github.com/facebookresearch/flores/tree/main
|
|
|
|
| 2 |
floresp-v2.0-rc.3: https://github.com/openlanguagedata/flores
|
| 3 |
glottolog_languoid.csv: https://glottolog.org/meta/downloads
|
| 4 |
ScriptCodes.csv: https://www.unicode.org/iso15924/iso15924-codes.html
|
| 5 |
+
spbleu: https://github.com/facebookresearch/flores/tree/main/flores200#spm-and-dictionary
|
evals/main.py
CHANGED
|
@@ -13,7 +13,7 @@ from tqdm.asyncio import tqdm_asyncio
|
|
| 13 |
# ===== config =====
|
| 14 |
|
| 15 |
n_sentences = 30
|
| 16 |
-
langs_eval = languages.iloc[:
|
| 17 |
langs_eval_detailed = languages.iloc[:2]
|
| 18 |
transcription_langs_eval = languages.iloc[:10]
|
| 19 |
transcription_langs_eval_detailed = languages.iloc[:5]
|
|
|
|
| 13 |
# ===== config =====
|
| 14 |
|
| 15 |
n_sentences = 30
|
| 16 |
+
langs_eval = languages.iloc[:30]
|
| 17 |
langs_eval_detailed = languages.iloc[:2]
|
| 18 |
transcription_langs_eval = languages.iloc[:10]
|
| 19 |
transcription_langs_eval_detailed = languages.iloc[:5]
|
evals/tasks.py
CHANGED
|
@@ -3,16 +3,16 @@ import random
|
|
| 3 |
import evaluate
|
| 4 |
import pandas as pd
|
| 5 |
from joblib.memory import Memory
|
| 6 |
-
from transformers import NllbTokenizer
|
| 7 |
from languages import languages, script_name
|
| 8 |
from datasets_.flores import flores_sentences
|
| 9 |
from models import complete, transcribe
|
|
|
|
|
|
|
| 10 |
cache = Memory(location=".cache", verbose=0).cache
|
| 11 |
bleu = evaluate.load("bleu")
|
| 12 |
chrf = evaluate.load("chrf")
|
| 13 |
wer = evaluate.load("wer")
|
| 14 |
-
tokenizer =
|
| 15 |
-
|
| 16 |
|
| 17 |
# sample languages to translate to
|
| 18 |
target_languages = languages[languages["in_benchmark"]].sample(
|
|
|
|
| 3 |
import evaluate
|
| 4 |
import pandas as pd
|
| 5 |
from joblib.memory import Memory
|
|
|
|
| 6 |
from languages import languages, script_name
|
| 7 |
from datasets_.flores import flores_sentences
|
| 8 |
from models import complete, transcribe
|
| 9 |
+
import sentencepiece as spm
|
| 10 |
+
|
| 11 |
cache = Memory(location=".cache", verbose=0).cache
|
| 12 |
bleu = evaluate.load("bleu")
|
| 13 |
chrf = evaluate.load("chrf")
|
| 14 |
wer = evaluate.load("wer")
|
| 15 |
+
tokenizer = spm.SentencePieceProcessor(model_file="data/spbleu/flores200_sacrebleu_tokenizer_spm.model")
|
|
|
|
| 16 |
|
| 17 |
# sample languages to translate to
|
| 18 |
target_languages = languages[languages["in_benchmark"]].sample(
|
frontend/public/{LICENSE → INFO}
RENAMED
|
File without changes
|
frontend/public/results.json
CHANGED
|
@@ -26,7 +26,7 @@
|
|
| 26 |
"license": null,
|
| 27 |
"average": 0.66,
|
| 28 |
"classification_accuracy": 0.73,
|
| 29 |
-
"language_modeling_chrf": 0.
|
| 30 |
"translation_bleu": 0.4,
|
| 31 |
"translation_chrf": 0.54
|
| 32 |
},
|
|
@@ -39,9 +39,9 @@
|
|
| 39 |
"size": 27432406640.0,
|
| 40 |
"type": "Open",
|
| 41 |
"license": "Gemma",
|
| 42 |
-
"average": 0.
|
| 43 |
"classification_accuracy": 0.72,
|
| 44 |
-
"language_modeling_chrf": 0.
|
| 45 |
"translation_bleu": 0.37,
|
| 46 |
"translation_chrf": 0.54
|
| 47 |
},
|
|
@@ -54,41 +54,41 @@
|
|
| 54 |
"size": 70553706496.0,
|
| 55 |
"type": "Open",
|
| 56 |
"license": "Llama3.1",
|
| 57 |
-
"average": 0.
|
| 58 |
"classification_accuracy": 0.57,
|
| 59 |
-
"language_modeling_chrf": 0.
|
| 60 |
"translation_bleu": 0.43,
|
| 61 |
"translation_chrf": 0.57
|
| 62 |
},
|
| 63 |
{
|
| 64 |
"rank": 5,
|
| 65 |
-
"provider": "
|
| 66 |
-
"model": "
|
| 67 |
"hf_id": null,
|
| 68 |
"creation_date": null,
|
| 69 |
"size": null,
|
| 70 |
"type": "Commercial",
|
| 71 |
"license": null,
|
| 72 |
"average": 0.61,
|
| 73 |
-
"classification_accuracy": 0.
|
| 74 |
-
"language_modeling_chrf": 0.
|
| 75 |
-
"translation_bleu": 0.
|
| 76 |
-
"translation_chrf": 0.
|
| 77 |
},
|
| 78 |
{
|
| 79 |
"rank": 6,
|
| 80 |
-
"provider": "
|
| 81 |
-
"model": "
|
| 82 |
"hf_id": null,
|
| 83 |
"creation_date": null,
|
| 84 |
"size": null,
|
| 85 |
"type": "Commercial",
|
| 86 |
"license": null,
|
| 87 |
-
"average": 0.
|
| 88 |
-
"classification_accuracy": 0.
|
| 89 |
-
"language_modeling_chrf": 0.
|
| 90 |
-
"translation_bleu": 0.
|
| 91 |
-
"translation_chrf": 0.
|
| 92 |
},
|
| 93 |
{
|
| 94 |
"rank": 7,
|
|
@@ -101,7 +101,7 @@
|
|
| 101 |
"license": null,
|
| 102 |
"average": 0.6,
|
| 103 |
"classification_accuracy": 0.52,
|
| 104 |
-
"language_modeling_chrf": 0.
|
| 105 |
"translation_bleu": 0.39,
|
| 106 |
"translation_chrf": 0.55
|
| 107 |
},
|
|
@@ -116,7 +116,7 @@
|
|
| 116 |
"license": "Apache 2.0",
|
| 117 |
"average": 0.58,
|
| 118 |
"classification_accuracy": 0.55,
|
| 119 |
-
"language_modeling_chrf": 0.
|
| 120 |
"translation_bleu": 0.38,
|
| 121 |
"translation_chrf": 0.52
|
| 122 |
},
|
|
@@ -129,11 +129,11 @@
|
|
| 129 |
"size": 70553706496.0,
|
| 130 |
"type": "Open",
|
| 131 |
"license": "Llama3.3",
|
| 132 |
-
"average": 0.
|
| 133 |
-
"classification_accuracy": 0.
|
| 134 |
"language_modeling_chrf": 0.94,
|
| 135 |
-
"translation_bleu": 0.
|
| 136 |
-
"translation_chrf": 0.
|
| 137 |
},
|
| 138 |
{
|
| 139 |
"rank": 10,
|
|
@@ -144,9 +144,9 @@
|
|
| 144 |
"size": null,
|
| 145 |
"type": "Commercial",
|
| 146 |
"license": null,
|
| 147 |
-
"average": 0.
|
| 148 |
"classification_accuracy": 0.5,
|
| 149 |
-
"language_modeling_chrf": 0.
|
| 150 |
"translation_bleu": 0.32,
|
| 151 |
"translation_chrf": 0.49
|
| 152 |
},
|
|
@@ -161,7 +161,7 @@
|
|
| 161 |
"license": "Mit",
|
| 162 |
"average": 0.52,
|
| 163 |
"classification_accuracy": 0.42,
|
| 164 |
-
"language_modeling_chrf": 0.
|
| 165 |
"translation_bleu": 0.32,
|
| 166 |
"translation_chrf": 0.46
|
| 167 |
},
|
|
@@ -176,7 +176,7 @@
|
|
| 176 |
"license": "Apache 2.0",
|
| 177 |
"average": 0.25,
|
| 178 |
"classification_accuracy": 0.0,
|
| 179 |
-
"language_modeling_chrf": 0.
|
| 180 |
"translation_bleu": 0.21,
|
| 181 |
"translation_chrf": 0.3
|
| 182 |
}
|
|
@@ -220,7 +220,7 @@
|
|
| 220 |
"in_benchmark": true,
|
| 221 |
"NaN": 0.0,
|
| 222 |
"classification_accuracy": 0.53,
|
| 223 |
-
"language_modeling_chrf": 0.
|
| 224 |
"translation_bleu": 0.32,
|
| 225 |
"translation_chrf": 0.49
|
| 226 |
},
|
|
@@ -248,7 +248,7 @@
|
|
| 248 |
"in_benchmark": true,
|
| 249 |
"NaN": 0.0,
|
| 250 |
"classification_accuracy": 0.43,
|
| 251 |
-
"language_modeling_chrf": 0.
|
| 252 |
"translation_bleu": 0.28,
|
| 253 |
"translation_chrf": 0.47
|
| 254 |
},
|
|
@@ -262,7 +262,7 @@
|
|
| 262 |
"in_benchmark": true,
|
| 263 |
"NaN": 0.0,
|
| 264 |
"classification_accuracy": 0.5,
|
| 265 |
-
"language_modeling_chrf": 0.
|
| 266 |
"translation_bleu": 0.24,
|
| 267 |
"translation_chrf": 0.42
|
| 268 |
},
|
|
@@ -290,7 +290,7 @@
|
|
| 290 |
"in_benchmark": true,
|
| 291 |
"NaN": 0.0,
|
| 292 |
"classification_accuracy": 0.4,
|
| 293 |
-
"language_modeling_chrf": 0.
|
| 294 |
"translation_bleu": 0.2,
|
| 295 |
"translation_chrf": 0.41
|
| 296 |
},
|
|
@@ -300,11 +300,11 @@
|
|
| 300 |
"autonym": "Português",
|
| 301 |
"speakers": 237496885,
|
| 302 |
"family": "Indo-European",
|
| 303 |
-
"average": 0.
|
| 304 |
"in_benchmark": true,
|
| 305 |
"NaN": 0.0,
|
| 306 |
"classification_accuracy": 0.5,
|
| 307 |
-
"language_modeling_chrf": 0.
|
| 308 |
"translation_bleu": 0.31,
|
| 309 |
"translation_chrf": 0.49
|
| 310 |
},
|
|
@@ -314,11 +314,11 @@
|
|
| 314 |
"autonym": "ਪੰਜਾਬੀ",
|
| 315 |
"speakers": 203571210,
|
| 316 |
"family": "Indo-European",
|
| 317 |
-
"average": 0.
|
| 318 |
"in_benchmark": true,
|
| 319 |
"NaN": 0.0,
|
| 320 |
"classification_accuracy": 0.4,
|
| 321 |
-
"language_modeling_chrf": 0.
|
| 322 |
"translation_bleu": 0.34,
|
| 323 |
"translation_chrf": 0.49
|
| 324 |
},
|
|
@@ -328,13 +328,13 @@
|
|
| 328 |
"autonym": "Русский",
|
| 329 |
"speakers": 195841151,
|
| 330 |
"family": "Indo-European",
|
| 331 |
-
"average": 0.
|
| 332 |
"in_benchmark": true,
|
| 333 |
"NaN": 0.0,
|
| 334 |
-
"classification_accuracy": 0.
|
| 335 |
-
"language_modeling_chrf": 0.
|
| 336 |
-
"translation_bleu": 0.
|
| 337 |
-
"translation_chrf": 0.
|
| 338 |
},
|
| 339 |
{
|
| 340 |
"bcp_47": "sw",
|
|
@@ -342,13 +342,13 @@
|
|
| 342 |
"autonym": "Kiswahili",
|
| 343 |
"speakers": 171610296,
|
| 344 |
"family": "Atlantic-Congo",
|
| 345 |
-
"average": 0.
|
| 346 |
"in_benchmark": true,
|
| 347 |
"NaN": 0.0,
|
| 348 |
-
"classification_accuracy": 0.
|
| 349 |
-
"language_modeling_chrf": 0.
|
| 350 |
-
"translation_bleu": 0.
|
| 351 |
-
"translation_chrf": 0.
|
| 352 |
},
|
| 353 |
{
|
| 354 |
"bcp_47": "id",
|
|
@@ -356,13 +356,13 @@
|
|
| 356 |
"autonym": "Bahasa Indonesia",
|
| 357 |
"speakers": 171207687,
|
| 358 |
"family": "Austronesian",
|
| 359 |
-
"average": 0.
|
| 360 |
"in_benchmark": true,
|
| 361 |
"NaN": 0.0,
|
| 362 |
-
"classification_accuracy": 0.
|
| 363 |
-
"language_modeling_chrf": 0.
|
| 364 |
-
"translation_bleu": 0.
|
| 365 |
-
"translation_chrf": 0.
|
| 366 |
},
|
| 367 |
{
|
| 368 |
"bcp_47": "de",
|
|
@@ -370,13 +370,13 @@
|
|
| 370 |
"autonym": "Deutsch",
|
| 371 |
"speakers": 136350226,
|
| 372 |
"family": "Indo-European",
|
| 373 |
-
"average": 0.
|
| 374 |
"in_benchmark": true,
|
| 375 |
"NaN": 0.0,
|
| 376 |
-
"classification_accuracy": 0.
|
| 377 |
-
"language_modeling_chrf": 0.
|
| 378 |
-
"translation_bleu": 0.
|
| 379 |
-
"translation_chrf": 0.
|
| 380 |
},
|
| 381 |
{
|
| 382 |
"bcp_47": "ja",
|
|
@@ -384,13 +384,13 @@
|
|
| 384 |
"autonym": "日本語",
|
| 385 |
"speakers": 119729026,
|
| 386 |
"family": "Japonic",
|
| 387 |
-
"average": 0.
|
| 388 |
"in_benchmark": true,
|
| 389 |
"NaN": 0.0,
|
| 390 |
-
"classification_accuracy": 0.
|
| 391 |
-
"language_modeling_chrf": 0.
|
| 392 |
-
"translation_bleu": 0.
|
| 393 |
-
"translation_chrf": 0.
|
| 394 |
},
|
| 395 |
{
|
| 396 |
"bcp_47": "te",
|
|
@@ -398,13 +398,13 @@
|
|
| 398 |
"autonym": "తెలుగు",
|
| 399 |
"speakers": 95478480,
|
| 400 |
"family": "Dravidian",
|
| 401 |
-
"average": 0.
|
| 402 |
"in_benchmark": true,
|
| 403 |
"NaN": 0.0,
|
| 404 |
-
"classification_accuracy": 0.
|
| 405 |
-
"language_modeling_chrf": 0.
|
| 406 |
-
"translation_bleu": 0.
|
| 407 |
-
"translation_chrf": 0.
|
| 408 |
},
|
| 409 |
{
|
| 410 |
"bcp_47": "lah",
|
|
@@ -426,13 +426,13 @@
|
|
| 426 |
"autonym": "मराठी",
|
| 427 |
"speakers": 92826300,
|
| 428 |
"family": "Indo-European",
|
| 429 |
-
"average": 0.
|
| 430 |
"in_benchmark": true,
|
| 431 |
"NaN": 0.0,
|
| 432 |
-
"classification_accuracy": 0.
|
| 433 |
-
"language_modeling_chrf": 0.
|
| 434 |
-
"translation_bleu": 0.
|
| 435 |
-
"translation_chrf": 0.
|
| 436 |
},
|
| 437 |
{
|
| 438 |
"bcp_47": "jv",
|
|
@@ -440,13 +440,13 @@
|
|
| 440 |
"autonym": "Jawa",
|
| 441 |
"speakers": 91180665,
|
| 442 |
"family": "Austronesian",
|
| 443 |
-
"average": 0.
|
| 444 |
"in_benchmark": true,
|
| 445 |
"NaN": 0.0,
|
| 446 |
-
"classification_accuracy": 0.
|
| 447 |
-
"language_modeling_chrf": 0.
|
| 448 |
-
"translation_bleu": 0.
|
| 449 |
-
"translation_chrf": 0.
|
| 450 |
},
|
| 451 |
{
|
| 452 |
"bcp_47": "vi",
|
|
@@ -454,13 +454,13 @@
|
|
| 454 |
"autonym": "Tiếng Việt",
|
| 455 |
"speakers": 86222962,
|
| 456 |
"family": "Austroasiatic",
|
| 457 |
-
"average": 0.
|
| 458 |
"in_benchmark": true,
|
| 459 |
"NaN": 0.0,
|
| 460 |
-
"classification_accuracy": 0.
|
| 461 |
-
"language_modeling_chrf": 0.
|
| 462 |
-
"translation_bleu": 0.
|
| 463 |
-
"translation_chrf": 0.
|
| 464 |
},
|
| 465 |
{
|
| 466 |
"bcp_47": "ta",
|
|
@@ -468,13 +468,13 @@
|
|
| 468 |
"autonym": "தமிழ்",
|
| 469 |
"speakers": 85616159,
|
| 470 |
"family": "Dravidian",
|
| 471 |
-
"average": 0.
|
| 472 |
"in_benchmark": true,
|
| 473 |
"NaN": 0.0,
|
| 474 |
-
"classification_accuracy": 0.
|
| 475 |
-
"language_modeling_chrf": 0.
|
| 476 |
-
"translation_bleu": 0.
|
| 477 |
-
"translation_chrf": 0.
|
| 478 |
},
|
| 479 |
{
|
| 480 |
"bcp_47": "fa",
|
|
@@ -482,13 +482,13 @@
|
|
| 482 |
"autonym": "فارسی",
|
| 483 |
"speakers": 84710459,
|
| 484 |
"family": "Indo-European",
|
| 485 |
-
"average": 0.
|
| 486 |
"in_benchmark": true,
|
| 487 |
"NaN": 0.0,
|
| 488 |
-
"classification_accuracy": 0.
|
| 489 |
-
"language_modeling_chrf": 0.
|
| 490 |
-
"translation_bleu": 0.
|
| 491 |
-
"translation_chrf": 0.
|
| 492 |
},
|
| 493 |
{
|
| 494 |
"bcp_47": "wuu",
|
|
@@ -510,13 +510,13 @@
|
|
| 510 |
"autonym": "Türkçe",
|
| 511 |
"speakers": 80360704,
|
| 512 |
"family": "Turkic",
|
| 513 |
-
"average": 0.
|
| 514 |
"in_benchmark": true,
|
| 515 |
"NaN": 0.0,
|
| 516 |
-
"classification_accuracy": 0.
|
| 517 |
-
"language_modeling_chrf": 0.
|
| 518 |
-
"translation_bleu": 0.
|
| 519 |
-
"translation_chrf": 0.
|
| 520 |
},
|
| 521 |
{
|
| 522 |
"bcp_47": "yue",
|
|
@@ -524,13 +524,13 @@
|
|
| 524 |
"autonym": "粵語",
|
| 525 |
"speakers": 79654759,
|
| 526 |
"family": "Sino-Tibetan",
|
| 527 |
-
"average": 0.
|
| 528 |
"in_benchmark": true,
|
| 529 |
"NaN": 0.0,
|
| 530 |
-
"classification_accuracy": 0.
|
| 531 |
-
"language_modeling_chrf": 0.
|
| 532 |
-
"translation_bleu": 0.
|
| 533 |
-
"translation_chrf": 0.
|
| 534 |
},
|
| 535 |
{
|
| 536 |
"bcp_47": "ko",
|
|
@@ -538,13 +538,13 @@
|
|
| 538 |
"autonym": "한국어",
|
| 539 |
"speakers": 78357046,
|
| 540 |
"family": "Koreanic",
|
| 541 |
-
"average": 0.
|
| 542 |
"in_benchmark": true,
|
| 543 |
"NaN": 0.0,
|
| 544 |
-
"classification_accuracy": 0.
|
| 545 |
-
"language_modeling_chrf": 0.
|
| 546 |
-
"translation_bleu": 0.
|
| 547 |
-
"translation_chrf": 0.
|
| 548 |
},
|
| 549 |
{
|
| 550 |
"bcp_47": "it",
|
|
@@ -552,13 +552,13 @@
|
|
| 552 |
"autonym": "Italiano",
|
| 553 |
"speakers": 70247060,
|
| 554 |
"family": "Indo-European",
|
| 555 |
-
"average": 0.
|
| 556 |
"in_benchmark": true,
|
| 557 |
"NaN": 0.0,
|
| 558 |
-
"classification_accuracy": 0.
|
| 559 |
-
"language_modeling_chrf": 0.
|
| 560 |
-
"translation_bleu": 0.
|
| 561 |
-
"translation_chrf": 0.
|
| 562 |
},
|
| 563 |
{
|
| 564 |
"bcp_47": "fil",
|
|
@@ -566,13 +566,13 @@
|
|
| 566 |
"autonym": "Filipino",
|
| 567 |
"speakers": 67471096,
|
| 568 |
"family": "Austronesian",
|
| 569 |
-
"average": 0.
|
| 570 |
"in_benchmark": true,
|
| 571 |
"NaN": 0.0,
|
| 572 |
-
"classification_accuracy": 0.
|
| 573 |
-
"language_modeling_chrf": 0.
|
| 574 |
-
"translation_bleu": 0.
|
| 575 |
-
"translation_chrf": 0.
|
| 576 |
},
|
| 577 |
{
|
| 578 |
"bcp_47": "arz",
|
|
@@ -580,13 +580,13 @@
|
|
| 580 |
"autonym": "Egyptian Arabic",
|
| 581 |
"speakers": 66639360,
|
| 582 |
"family": "Afro-Asiatic",
|
| 583 |
-
"average": 0.
|
| 584 |
"in_benchmark": true,
|
| 585 |
"NaN": 0.0,
|
| 586 |
-
"classification_accuracy": 0.
|
| 587 |
-
"language_modeling_chrf": 0.
|
| 588 |
-
"translation_bleu": 0.
|
| 589 |
-
"translation_chrf": 0.
|
| 590 |
},
|
| 591 |
{
|
| 592 |
"bcp_47": "gu",
|
|
@@ -594,13 +594,13 @@
|
|
| 594 |
"autonym": "ગુજરાતી",
|
| 595 |
"speakers": 61721799,
|
| 596 |
"family": "Indo-European",
|
| 597 |
-
"average": 0.
|
| 598 |
"in_benchmark": true,
|
| 599 |
"NaN": 0.0,
|
| 600 |
-
"classification_accuracy": 0.
|
| 601 |
-
"language_modeling_chrf": 0.
|
| 602 |
-
"translation_bleu": 0.
|
| 603 |
-
"translation_chrf": 0.
|
| 604 |
},
|
| 605 |
{
|
| 606 |
"bcp_47": "th",
|
|
@@ -10164,7 +10164,7 @@
|
|
| 10164 |
]
|
| 10165 |
},
|
| 10166 |
"AE": {
|
| 10167 |
-
"score": 0.
|
| 10168 |
"languages": [
|
| 10169 |
{
|
| 10170 |
"name": "English",
|
|
@@ -10182,7 +10182,7 @@
|
|
| 10182 |
"name": "Persian",
|
| 10183 |
"bcp_47": "fa",
|
| 10184 |
"population": 189850,
|
| 10185 |
-
"score": 0.
|
| 10186 |
},
|
| 10187 |
{
|
| 10188 |
"name": "Pashto",
|
|
@@ -10205,7 +10205,7 @@
|
|
| 10205 |
]
|
| 10206 |
},
|
| 10207 |
"AG": {
|
| 10208 |
-
"score": 0.
|
| 10209 |
"languages": [
|
| 10210 |
{
|
| 10211 |
"name": "English",
|
|
@@ -10217,7 +10217,7 @@
|
|
| 10217 |
"name": "Portuguese",
|
| 10218 |
"bcp_47": "pt",
|
| 10219 |
"population": 1571,
|
| 10220 |
-
"score": 0.
|
| 10221 |
}
|
| 10222 |
]
|
| 10223 |
},
|
|
@@ -10290,7 +10290,7 @@
|
|
| 10290 |
]
|
| 10291 |
},
|
| 10292 |
"AT": {
|
| 10293 |
-
"score": 0.
|
| 10294 |
"languages": [
|
| 10295 |
{
|
| 10296 |
"name": "English",
|
|
@@ -10308,13 +10308,13 @@
|
|
| 10308 |
"name": "German",
|
| 10309 |
"bcp_47": "de",
|
| 10310 |
"population": 8593666,
|
| 10311 |
-
"score": 0.
|
| 10312 |
},
|
| 10313 |
{
|
| 10314 |
"name": "Italian",
|
| 10315 |
"bcp_47": "it",
|
| 10316 |
"population": 797350,
|
| 10317 |
-
"score": 0.
|
| 10318 |
},
|
| 10319 |
{
|
| 10320 |
"name": "Bavarian",
|
|
@@ -10343,7 +10343,7 @@
|
|
| 10343 |
]
|
| 10344 |
},
|
| 10345 |
"AU": {
|
| 10346 |
-
"score": 0.
|
| 10347 |
"languages": [
|
| 10348 |
{
|
| 10349 |
"name": "English",
|
|
@@ -10361,7 +10361,7 @@
|
|
| 10361 |
"name": "Italian",
|
| 10362 |
"bcp_47": "it",
|
| 10363 |
"population": 483864,
|
| 10364 |
-
"score": 0.
|
| 10365 |
},
|
| 10366 |
{
|
| 10367 |
"name": "Hmong Njua",
|
|
@@ -10506,7 +10506,7 @@
|
|
| 10506 |
]
|
| 10507 |
},
|
| 10508 |
"BE": {
|
| 10509 |
-
"score": 0.
|
| 10510 |
"languages": [
|
| 10511 |
{
|
| 10512 |
"name": "English",
|
|
@@ -10524,7 +10524,7 @@
|
|
| 10524 |
"name": "German",
|
| 10525 |
"bcp_47": "de",
|
| 10526 |
"population": 2578554,
|
| 10527 |
-
"score": 0.
|
| 10528 |
},
|
| 10529 |
{
|
| 10530 |
"name": "Dutch",
|
|
@@ -10547,7 +10547,7 @@
|
|
| 10547 |
]
|
| 10548 |
},
|
| 10549 |
"BG": {
|
| 10550 |
-
"score": 0.
|
| 10551 |
"languages": [
|
| 10552 |
{
|
| 10553 |
"name": "English",
|
|
@@ -10559,19 +10559,19 @@
|
|
| 10559 |
"name": "Russian",
|
| 10560 |
"bcp_47": "ru",
|
| 10561 |
"population": 1602387,
|
| 10562 |
-
"score": 0.
|
| 10563 |
},
|
| 10564 |
{
|
| 10565 |
"name": "German",
|
| 10566 |
"bcp_47": "de",
|
| 10567 |
"population": 557352,
|
| 10568 |
-
"score": 0.
|
| 10569 |
},
|
| 10570 |
{
|
| 10571 |
"name": "Turkish",
|
| 10572 |
"bcp_47": "tr",
|
| 10573 |
"population": 766359,
|
| 10574 |
-
"score": 0.
|
| 10575 |
},
|
| 10576 |
{
|
| 10577 |
"name": "Bulgarian",
|
|
@@ -10582,7 +10582,7 @@
|
|
| 10582 |
]
|
| 10583 |
},
|
| 10584 |
"BI": {
|
| 10585 |
-
"score": 0.
|
| 10586 |
"languages": [
|
| 10587 |
{
|
| 10588 |
"name": "English",
|
|
@@ -10600,7 +10600,7 @@
|
|
| 10600 |
"name": "Swahili",
|
| 10601 |
"bcp_47": "sw",
|
| 10602 |
"population": 6408,
|
| 10603 |
-
"score": 0.
|
| 10604 |
},
|
| 10605 |
{
|
| 10606 |
"name": "Rundi",
|
|
@@ -10645,7 +10645,7 @@
|
|
| 10645 |
]
|
| 10646 |
},
|
| 10647 |
"BR": {
|
| 10648 |
-
"score": 0.
|
| 10649 |
"languages": [
|
| 10650 |
{
|
| 10651 |
"name": "English",
|
|
@@ -10663,31 +10663,31 @@
|
|
| 10663 |
"name": "Portuguese",
|
| 10664 |
"bcp_47": "pt",
|
| 10665 |
"population": 192661560,
|
| 10666 |
-
"score": 0.
|
| 10667 |
},
|
| 10668 |
{
|
| 10669 |
"name": "German",
|
| 10670 |
"bcp_47": "de",
|
| 10671 |
"population": 1778414,
|
| 10672 |
-
"score": 0.
|
| 10673 |
},
|
| 10674 |
{
|
| 10675 |
"name": "Japanese",
|
| 10676 |
"bcp_47": "ja",
|
| 10677 |
"population": 444604,
|
| 10678 |
-
"score": 0.
|
| 10679 |
},
|
| 10680 |
{
|
| 10681 |
"name": "Korean",
|
| 10682 |
"bcp_47": "ko",
|
| 10683 |
"population": 44460,
|
| 10684 |
-
"score": 0.
|
| 10685 |
},
|
| 10686 |
{
|
| 10687 |
"name": "Italian",
|
| 10688 |
"bcp_47": "it",
|
| 10689 |
"population": 592805,
|
| 10690 |
-
"score": 0.
|
| 10691 |
},
|
| 10692 |
{
|
| 10693 |
"name": "Venetian",
|
|
@@ -10819,7 +10819,7 @@
|
|
| 10819 |
]
|
| 10820 |
},
|
| 10821 |
"CA": {
|
| 10822 |
-
"score": 0.
|
| 10823 |
"languages": [
|
| 10824 |
{
|
| 10825 |
"name": "English",
|
|
@@ -10873,85 +10873,85 @@
|
|
| 10873 |
"name": "Portuguese",
|
| 10874 |
"bcp_47": "pt",
|
| 10875 |
"population": 229934,
|
| 10876 |
-
"score": 0.
|
| 10877 |
},
|
| 10878 |
{
|
| 10879 |
"name": "Punjabi",
|
| 10880 |
"bcp_47": "pa",
|
| 10881 |
"population": 603106,
|
| 10882 |
-
"score": 0.
|
| 10883 |
},
|
| 10884 |
{
|
| 10885 |
"name": "Russian",
|
| 10886 |
"bcp_47": "ru",
|
| 10887 |
"population": 211087,
|
| 10888 |
-
"score": 0.
|
| 10889 |
},
|
| 10890 |
{
|
| 10891 |
"name": "German",
|
| 10892 |
"bcp_47": "de",
|
| 10893 |
"population": 294014,
|
| 10894 |
-
"score": 0.
|
| 10895 |
},
|
| 10896 |
{
|
| 10897 |
"name": "Japanese",
|
| 10898 |
"bcp_47": "ja",
|
| 10899 |
"population": 52772,
|
| 10900 |
-
"score": 0.
|
| 10901 |
},
|
| 10902 |
{
|
| 10903 |
"name": "Vietnamese",
|
| 10904 |
"bcp_47": "vi",
|
| 10905 |
"population": 184701,
|
| 10906 |
-
"score": 0.
|
| 10907 |
},
|
| 10908 |
{
|
| 10909 |
"name": "Tamil",
|
| 10910 |
"bcp_47": "ta",
|
| 10911 |
"population": 184701,
|
| 10912 |
-
"score": 0.
|
| 10913 |
},
|
| 10914 |
{
|
| 10915 |
"name": "Persian",
|
| 10916 |
"bcp_47": "fa",
|
| 10917 |
"population": 245012,
|
| 10918 |
-
"score": 0.
|
| 10919 |
},
|
| 10920 |
{
|
| 10921 |
"name": "Turkish",
|
| 10922 |
"bcp_47": "tr",
|
| 10923 |
"population": 37694,
|
| 10924 |
-
"score": 0.
|
| 10925 |
},
|
| 10926 |
{
|
| 10927 |
"name": "Cantonese",
|
| 10928 |
"bcp_47": "yue",
|
| 10929 |
"population": 640800,
|
| 10930 |
-
"score": 0.
|
| 10931 |
},
|
| 10932 |
{
|
| 10933 |
"name": "Korean",
|
| 10934 |
"bcp_47": "ko",
|
| 10935 |
"population": 169623,
|
| 10936 |
-
"score": 0.
|
| 10937 |
},
|
| 10938 |
{
|
| 10939 |
"name": "Italian",
|
| 10940 |
"bcp_47": "it",
|
| 10941 |
"population": 343016,
|
| 10942 |
-
"score": 0.
|
| 10943 |
},
|
| 10944 |
{
|
| 10945 |
"name": "Filipino",
|
| 10946 |
"bcp_47": "fil",
|
| 10947 |
"population": 565412,
|
| 10948 |
-
"score": 0.
|
| 10949 |
},
|
| 10950 |
{
|
| 10951 |
"name": "Gujarati",
|
| 10952 |
"bcp_47": "gu",
|
| 10953 |
"population": 135699,
|
| 10954 |
-
"score": 0.
|
| 10955 |
},
|
| 10956 |
{
|
| 10957 |
"name": "Polish",
|
|
@@ -11189,7 +11189,7 @@
|
|
| 11189 |
]
|
| 11190 |
},
|
| 11191 |
"CH": {
|
| 11192 |
-
"score": 0.
|
| 11193 |
"languages": [
|
| 11194 |
{
|
| 11195 |
"name": "English",
|
|
@@ -11207,19 +11207,19 @@
|
|
| 11207 |
"name": "Portuguese",
|
| 11208 |
"bcp_47": "pt",
|
| 11209 |
"population": 285736,
|
| 11210 |
-
"score": 0.
|
| 11211 |
},
|
| 11212 |
{
|
| 11213 |
"name": "German",
|
| 11214 |
"bcp_47": "de",
|
| 11215 |
"population": 6134913,
|
| 11216 |
-
"score": 0.
|
| 11217 |
},
|
| 11218 |
{
|
| 11219 |
"name": "Italian",
|
| 11220 |
"bcp_47": "it",
|
| 11221 |
"population": 361372,
|
| 11222 |
-
"score": 0.
|
| 11223 |
},
|
| 11224 |
{
|
| 11225 |
"name": "Swiss German",
|
|
@@ -11455,7 +11455,7 @@
|
|
| 11455 |
]
|
| 11456 |
},
|
| 11457 |
"CN": {
|
| 11458 |
-
"score": 0.
|
| 11459 |
"languages": [
|
| 11460 |
{
|
| 11461 |
"name": "English",
|
|
@@ -11473,13 +11473,13 @@
|
|
| 11473 |
"name": "Russian",
|
| 11474 |
"bcp_47": "ru",
|
| 11475 |
"population": 13940,
|
| 11476 |
-
"score": 0.
|
| 11477 |
},
|
| 11478 |
{
|
| 11479 |
"name": "Vietnamese",
|
| 11480 |
"bcp_47": "vi",
|
| 11481 |
"population": 6970,
|
| 11482 |
-
"score": 0.
|
| 11483 |
},
|
| 11484 |
{
|
| 11485 |
"name": "Wu Chinese",
|
|
@@ -11491,13 +11491,13 @@
|
|
| 11491 |
"name": "Cantonese",
|
| 11492 |
"bcp_47": "yue",
|
| 11493 |
"population": 72489040,
|
| 11494 |
-
"score": 0.
|
| 11495 |
},
|
| 11496 |
{
|
| 11497 |
"name": "Korean",
|
| 11498 |
"bcp_47": "ko",
|
| 11499 |
"population": 2091030,
|
| 11500 |
-
"score": 0.
|
| 11501 |
},
|
| 11502 |
{
|
| 11503 |
"name": "Xiang Chinese",
|
|
@@ -11649,7 +11649,7 @@
|
|
| 11649 |
]
|
| 11650 |
},
|
| 11651 |
"CY": {
|
| 11652 |
-
"score": 0.
|
| 11653 |
"languages": [
|
| 11654 |
{
|
| 11655 |
"name": "English",
|
|
@@ -11673,7 +11673,7 @@
|
|
| 11673 |
"name": "Turkish",
|
| 11674 |
"bcp_47": "tr",
|
| 11675 |
"population": 291336,
|
| 11676 |
-
"score": 0.
|
| 11677 |
},
|
| 11678 |
{
|
| 11679 |
"name": "Greek",
|
|
@@ -11690,7 +11690,7 @@
|
|
| 11690 |
]
|
| 11691 |
},
|
| 11692 |
"CZ": {
|
| 11693 |
-
"score": 0.
|
| 11694 |
"languages": [
|
| 11695 |
{
|
| 11696 |
"name": "English",
|
|
@@ -11702,7 +11702,7 @@
|
|
| 11702 |
"name": "German",
|
| 11703 |
"bcp_47": "de",
|
| 11704 |
"population": 1605375,
|
| 11705 |
-
"score": 0.
|
| 11706 |
},
|
| 11707 |
{
|
| 11708 |
"name": "Polish",
|
|
@@ -11725,7 +11725,7 @@
|
|
| 11725 |
]
|
| 11726 |
},
|
| 11727 |
"DE": {
|
| 11728 |
-
"score": 0.
|
| 11729 |
"languages": [
|
| 11730 |
{
|
| 11731 |
"name": "English",
|
|
@@ -11749,25 +11749,25 @@
|
|
| 11749 |
"name": "Russian",
|
| 11750 |
"bcp_47": "ru",
|
| 11751 |
"population": 4809582,
|
| 11752 |
-
"score": 0.
|
| 11753 |
},
|
| 11754 |
{
|
| 11755 |
"name": "German",
|
| 11756 |
"bcp_47": "de",
|
| 11757 |
"population": 72945327,
|
| 11758 |
-
"score": 0.
|
| 11759 |
},
|
| 11760 |
{
|
| 11761 |
"name": "Turkish",
|
| 11762 |
"bcp_47": "tr",
|
| 11763 |
"population": 2003992,
|
| 11764 |
-
"score": 0.
|
| 11765 |
},
|
| 11766 |
{
|
| 11767 |
"name": "Italian",
|
| 11768 |
"bcp_47": "it",
|
| 11769 |
"population": 5611179,
|
| 11770 |
-
"score": 0.
|
| 11771 |
},
|
| 11772 |
{
|
| 11773 |
"name": "Polish",
|
|
@@ -11891,7 +11891,7 @@
|
|
| 11891 |
]
|
| 11892 |
},
|
| 11893 |
"DK": {
|
| 11894 |
-
"score": 0.
|
| 11895 |
"languages": [
|
| 11896 |
{
|
| 11897 |
"name": "English",
|
|
@@ -11903,7 +11903,7 @@
|
|
| 11903 |
"name": "German",
|
| 11904 |
"bcp_47": "de",
|
| 11905 |
"population": 2758623,
|
| 11906 |
-
"score": 0.
|
| 11907 |
},
|
| 11908 |
{
|
| 11909 |
"name": "Swedish",
|
|
@@ -12001,7 +12001,7 @@
|
|
| 12001 |
]
|
| 12002 |
},
|
| 12003 |
"EE": {
|
| 12004 |
-
"score": 0.
|
| 12005 |
"languages": [
|
| 12006 |
{
|
| 12007 |
"name": "English",
|
|
@@ -12013,7 +12013,7 @@
|
|
| 12013 |
"name": "Russian",
|
| 12014 |
"bcp_47": "ru",
|
| 12015 |
"population": 688027,
|
| 12016 |
-
"score": 0.
|
| 12017 |
},
|
| 12018 |
{
|
| 12019 |
"name": "Finnish",
|
|
@@ -12042,7 +12042,7 @@
|
|
| 12042 |
]
|
| 12043 |
},
|
| 12044 |
"EG": {
|
| 12045 |
-
"score": 0.
|
| 12046 |
"languages": [
|
| 12047 |
{
|
| 12048 |
"name": "English",
|
|
@@ -12060,7 +12060,7 @@
|
|
| 12060 |
"name": "Egyptian Arabic",
|
| 12061 |
"bcp_47": "arz",
|
| 12062 |
"population": 66639360,
|
| 12063 |
-
"score": 0.
|
| 12064 |
},
|
| 12065 |
{
|
| 12066 |
"name": "Greek",
|
|
@@ -12236,7 +12236,7 @@
|
|
| 12236 |
]
|
| 12237 |
},
|
| 12238 |
"FI": {
|
| 12239 |
-
"score": 0.
|
| 12240 |
"languages": [
|
| 12241 |
{
|
| 12242 |
"name": "English",
|
|
@@ -12248,13 +12248,13 @@
|
|
| 12248 |
"name": "Russian",
|
| 12249 |
"bcp_47": "ru",
|
| 12250 |
"population": 45131,
|
| 12251 |
-
"score": 0.
|
| 12252 |
},
|
| 12253 |
{
|
| 12254 |
"name": "German",
|
| 12255 |
"bcp_47": "de",
|
| 12256 |
"population": 1002901,
|
| 12257 |
-
"score": 0.
|
| 12258 |
},
|
| 12259 |
{
|
| 12260 |
"name": "Swedish",
|
|
@@ -12388,7 +12388,7 @@
|
|
| 12388 |
]
|
| 12389 |
},
|
| 12390 |
"FR": {
|
| 12391 |
-
"score": 0.
|
| 12392 |
"languages": [
|
| 12393 |
{
|
| 12394 |
"name": "English",
|
|
@@ -12412,19 +12412,19 @@
|
|
| 12412 |
"name": "Portuguese",
|
| 12413 |
"bcp_47": "pt",
|
| 12414 |
"population": 882027,
|
| 12415 |
-
"score": 0.
|
| 12416 |
},
|
| 12417 |
{
|
| 12418 |
"name": "German",
|
| 12419 |
"bcp_47": "de",
|
| 12420 |
"population": 3392410,
|
| 12421 |
-
"score": 0.
|
| 12422 |
},
|
| 12423 |
{
|
| 12424 |
"name": "Italian",
|
| 12425 |
"bcp_47": "it",
|
| 12426 |
"population": 1153419,
|
| 12427 |
-
"score": 0.
|
| 12428 |
},
|
| 12429 |
{
|
| 12430 |
"name": "Dutch",
|
|
@@ -12495,7 +12495,7 @@
|
|
| 12495 |
]
|
| 12496 |
},
|
| 12497 |
"GB": {
|
| 12498 |
-
"score": 0.
|
| 12499 |
"languages": [
|
| 12500 |
{
|
| 12501 |
"name": "English",
|
|
@@ -12543,43 +12543,43 @@
|
|
| 12543 |
"name": "Portuguese",
|
| 12544 |
"bcp_47": "pt",
|
| 12545 |
"population": 131522,
|
| 12546 |
-
"score": 0.
|
| 12547 |
},
|
| 12548 |
{
|
| 12549 |
"name": "Punjabi",
|
| 12550 |
"bcp_47": "pa",
|
| 12551 |
"population": 2367400,
|
| 12552 |
-
"score": 0.
|
| 12553 |
},
|
| 12554 |
{
|
| 12555 |
"name": "German",
|
| 12556 |
"bcp_47": "de",
|
| 12557 |
"population": 5918499,
|
| 12558 |
-
"score": 0.
|
| 12559 |
},
|
| 12560 |
{
|
| 12561 |
"name": "Tamil",
|
| 12562 |
"bcp_47": "ta",
|
| 12563 |
"population": 2104355,
|
| 12564 |
-
"score": 0.
|
| 12565 |
},
|
| 12566 |
{
|
| 12567 |
"name": "Turkish",
|
| 12568 |
"bcp_47": "tr",
|
| 12569 |
"population": 131522,
|
| 12570 |
-
"score": 0.
|
| 12571 |
},
|
| 12572 |
{
|
| 12573 |
"name": "Italian",
|
| 12574 |
"bcp_47": "it",
|
| 12575 |
"population": 131522,
|
| 12576 |
-
"score": 0.
|
| 12577 |
},
|
| 12578 |
{
|
| 12579 |
"name": "Gujarati",
|
| 12580 |
"bcp_47": "gu",
|
| 12581 |
"population": 1907072,
|
| 12582 |
-
"score": 0.
|
| 12583 |
},
|
| 12584 |
{
|
| 12585 |
"name": "Polish",
|
|
@@ -12765,7 +12765,7 @@
|
|
| 12765 |
]
|
| 12766 |
},
|
| 12767 |
"GR": {
|
| 12768 |
-
"score": 0.
|
| 12769 |
"languages": [
|
| 12770 |
{
|
| 12771 |
"name": "English",
|
|
@@ -12783,13 +12783,13 @@
|
|
| 12783 |
"name": "German",
|
| 12784 |
"bcp_47": "de",
|
| 12785 |
"population": 530355,
|
| 12786 |
-
"score": 0.
|
| 12787 |
},
|
| 12788 |
{
|
| 12789 |
"name": "Turkish",
|
| 12790 |
"bcp_47": "tr",
|
| 12791 |
"population": 127285,
|
| 12792 |
-
"score": 0.
|
| 12793 |
},
|
| 12794 |
{
|
| 12795 |
"name": "Greek",
|
|
@@ -12869,7 +12869,7 @@
|
|
| 12869 |
]
|
| 12870 |
},
|
| 12871 |
"HK": {
|
| 12872 |
-
"score": 0.
|
| 12873 |
"languages": [
|
| 12874 |
{
|
| 12875 |
"name": "English",
|
|
@@ -12887,7 +12887,7 @@
|
|
| 12887 |
"name": "Cantonese",
|
| 12888 |
"bcp_47": "yue",
|
| 12889 |
"population": 6524919,
|
| 12890 |
-
"score": 0.
|
| 12891 |
}
|
| 12892 |
]
|
| 12893 |
},
|
|
@@ -12920,7 +12920,7 @@
|
|
| 12920 |
]
|
| 12921 |
},
|
| 12922 |
"HR": {
|
| 12923 |
-
"score": 0.
|
| 12924 |
"languages": [
|
| 12925 |
{
|
| 12926 |
"name": "English",
|
|
@@ -12932,7 +12932,7 @@
|
|
| 12932 |
"name": "Italian",
|
| 12933 |
"bcp_47": "it",
|
| 12934 |
"population": 67644,
|
| 12935 |
-
"score": 0.
|
| 12936 |
},
|
| 12937 |
{
|
| 12938 |
"name": "Croatian",
|
|
@@ -12949,7 +12949,7 @@
|
|
| 12949 |
]
|
| 12950 |
},
|
| 12951 |
"HU": {
|
| 12952 |
-
"score": 0.
|
| 12953 |
"languages": [
|
| 12954 |
{
|
| 12955 |
"name": "English",
|
|
@@ -12967,7 +12967,7 @@
|
|
| 12967 |
"name": "German",
|
| 12968 |
"bcp_47": "de",
|
| 12969 |
"population": 1758929,
|
| 12970 |
-
"score": 0.
|
| 12971 |
},
|
| 12972 |
{
|
| 12973 |
"name": "Romanian",
|
|
@@ -13025,7 +13025,7 @@
|
|
| 13025 |
]
|
| 13026 |
},
|
| 13027 |
"IL": {
|
| 13028 |
-
"score": 0.
|
| 13029 |
"languages": [
|
| 13030 |
{
|
| 13031 |
"name": "English",
|
|
@@ -13043,7 +13043,7 @@
|
|
| 13043 |
"name": "Russian",
|
| 13044 |
"bcp_47": "ru",
|
| 13045 |
"population": 954303,
|
| 13046 |
-
"score": 0.
|
| 13047 |
},
|
| 13048 |
{
|
| 13049 |
"name": "Malayalam",
|
|
@@ -13125,7 +13125,7 @@
|
|
| 13125 |
]
|
| 13126 |
},
|
| 13127 |
"IN": {
|
| 13128 |
-
"score": 0.
|
| 13129 |
"languages": [
|
| 13130 |
{
|
| 13131 |
"name": "English",
|
|
@@ -13155,13 +13155,13 @@
|
|
| 13155 |
"name": "Punjabi",
|
| 13156 |
"bcp_47": "pa",
|
| 13157 |
"population": 37130520,
|
| 13158 |
-
"score": 0.
|
| 13159 |
},
|
| 13160 |
{
|
| 13161 |
"name": "Telugu",
|
| 13162 |
"bcp_47": "te",
|
| 13163 |
"population": 95478480,
|
| 13164 |
-
"score": 0.
|
| 13165 |
},
|
| 13166 |
{
|
| 13167 |
"name": "Western Panjabi",
|
|
@@ -13173,19 +13173,19 @@
|
|
| 13173 |
"name": "Marathi",
|
| 13174 |
"bcp_47": "mr",
|
| 13175 |
"population": 92826300,
|
| 13176 |
-
"score": 0.
|
| 13177 |
},
|
| 13178 |
{
|
| 13179 |
"name": "Tamil",
|
| 13180 |
"bcp_47": "ta",
|
| 13181 |
"population": 78239310,
|
| 13182 |
-
"score": 0.
|
| 13183 |
},
|
| 13184 |
{
|
| 13185 |
"name": "Gujarati",
|
| 13186 |
"bcp_47": "gu",
|
| 13187 |
"population": 59674050,
|
| 13188 |
-
"score": 0.
|
| 13189 |
},
|
| 13190 |
{
|
| 13191 |
"name": "Kannada",
|
|
@@ -13603,7 +13603,7 @@
|
|
| 13603 |
]
|
| 13604 |
},
|
| 13605 |
"IQ": {
|
| 13606 |
-
"score": 0.
|
| 13607 |
"languages": [
|
| 13608 |
{
|
| 13609 |
"name": "English",
|
|
@@ -13621,7 +13621,7 @@
|
|
| 13621 |
"name": "Persian",
|
| 13622 |
"bcp_47": "fa",
|
| 13623 |
"population": 338192,
|
| 13624 |
-
"score": 0.
|
| 13625 |
},
|
| 13626 |
{
|
| 13627 |
"name": "Azerbaijani",
|
|
@@ -13650,7 +13650,7 @@
|
|
| 13650 |
]
|
| 13651 |
},
|
| 13652 |
"IT": {
|
| 13653 |
-
"score": 0.
|
| 13654 |
"languages": [
|
| 13655 |
{
|
| 13656 |
"name": "English",
|
|
@@ -13668,13 +13668,13 @@
|
|
| 13668 |
"name": "German",
|
| 13669 |
"bcp_47": "de",
|
| 13670 |
"population": 998443,
|
| 13671 |
-
"score": 0.
|
| 13672 |
},
|
| 13673 |
{
|
| 13674 |
"name": "Italian",
|
| 13675 |
"bcp_47": "it",
|
| 13676 |
"population": 59282565,
|
| 13677 |
-
"score": 0.
|
| 13678 |
},
|
| 13679 |
{
|
| 13680 |
"name": "Greek",
|
|
@@ -13820,7 +13820,7 @@
|
|
| 13820 |
]
|
| 13821 |
},
|
| 13822 |
"KE": {
|
| 13823 |
-
"score": 0.
|
| 13824 |
"languages": [
|
| 13825 |
{
|
| 13826 |
"name": "English",
|
|
@@ -13838,19 +13838,19 @@
|
|
| 13838 |
"name": "Punjabi",
|
| 13839 |
"bcp_47": "pa",
|
| 13840 |
"population": 10170,
|
| 13841 |
-
"score": 0.
|
| 13842 |
},
|
| 13843 |
{
|
| 13844 |
"name": "Swahili",
|
| 13845 |
"bcp_47": "sw",
|
| 13846 |
"population": 35328414,
|
| 13847 |
-
"score": 0.
|
| 13848 |
},
|
| 13849 |
{
|
| 13850 |
"name": "Gujarati",
|
| 13851 |
"bcp_47": "gu",
|
| 13852 |
"population": 4978,
|
| 13853 |
-
"score": 0.
|
| 13854 |
},
|
| 13855 |
{
|
| 13856 |
"name": "Oromo",
|
|
@@ -13984,7 +13984,7 @@
|
|
| 13984 |
]
|
| 13985 |
},
|
| 13986 |
"KZ": {
|
| 13987 |
-
"score": 0.
|
| 13988 |
"languages": [
|
| 13989 |
{
|
| 13990 |
"name": "English",
|
|
@@ -13996,13 +13996,13 @@
|
|
| 13996 |
"name": "Russian",
|
| 13997 |
"bcp_47": "ru",
|
| 13998 |
"population": 13746168,
|
| 13999 |
-
"score": 0.
|
| 14000 |
},
|
| 14001 |
{
|
| 14002 |
"name": "German",
|
| 14003 |
"bcp_47": "de",
|
| 14004 |
"population": 1221882,
|
| 14005 |
-
"score": 0.
|
| 14006 |
},
|
| 14007 |
{
|
| 14008 |
"name": "Kazakh",
|
|
@@ -14071,7 +14071,7 @@
|
|
| 14071 |
]
|
| 14072 |
},
|
| 14073 |
"LK": {
|
| 14074 |
-
"score": 0.
|
| 14075 |
"languages": [
|
| 14076 |
{
|
| 14077 |
"name": "English",
|
|
@@ -14083,7 +14083,7 @@
|
|
| 14083 |
"name": "Tamil",
|
| 14084 |
"bcp_47": "ta",
|
| 14085 |
"population": 3433380,
|
| 14086 |
-
"score": 0.
|
| 14087 |
},
|
| 14088 |
{
|
| 14089 |
"name": "Sinhala",
|
|
@@ -14164,7 +14164,7 @@
|
|
| 14164 |
]
|
| 14165 |
},
|
| 14166 |
"LT": {
|
| 14167 |
-
"score": 0.
|
| 14168 |
"languages": [
|
| 14169 |
{
|
| 14170 |
"name": "English",
|
|
@@ -14176,13 +14176,13 @@
|
|
| 14176 |
"name": "Russian",
|
| 14177 |
"bcp_47": "ru",
|
| 14178 |
"population": 2185168,
|
| 14179 |
-
"score": 0.
|
| 14180 |
},
|
| 14181 |
{
|
| 14182 |
"name": "German",
|
| 14183 |
"bcp_47": "de",
|
| 14184 |
"population": 382404,
|
| 14185 |
-
"score": 0.
|
| 14186 |
},
|
| 14187 |
{
|
| 14188 |
"name": "Lithuanian",
|
|
@@ -14199,7 +14199,7 @@
|
|
| 14199 |
]
|
| 14200 |
},
|
| 14201 |
"LU": {
|
| 14202 |
-
"score": 0.
|
| 14203 |
"languages": [
|
| 14204 |
{
|
| 14205 |
"name": "English",
|
|
@@ -14217,13 +14217,13 @@
|
|
| 14217 |
"name": "Portuguese",
|
| 14218 |
"bcp_47": "pt",
|
| 14219 |
"population": 100541,
|
| 14220 |
-
"score": 0.
|
| 14221 |
},
|
| 14222 |
{
|
| 14223 |
"name": "German",
|
| 14224 |
"bcp_47": "de",
|
| 14225 |
"population": 395880,
|
| 14226 |
-
"score": 0.
|
| 14227 |
},
|
| 14228 |
{
|
| 14229 |
"name": "Luxembourgish",
|
|
@@ -14234,7 +14234,7 @@
|
|
| 14234 |
]
|
| 14235 |
},
|
| 14236 |
"LV": {
|
| 14237 |
-
"score": 0.
|
| 14238 |
"languages": [
|
| 14239 |
{
|
| 14240 |
"name": "English",
|
|
@@ -14246,7 +14246,7 @@
|
|
| 14246 |
"name": "Russian",
|
| 14247 |
"bcp_47": "ru",
|
| 14248 |
"population": 714867,
|
| 14249 |
-
"score": 0.
|
| 14250 |
},
|
| 14251 |
{
|
| 14252 |
"name": "Latvian",
|
|
@@ -14362,7 +14362,7 @@
|
|
| 14362 |
]
|
| 14363 |
},
|
| 14364 |
"MO": {
|
| 14365 |
-
"score": 0.
|
| 14366 |
"languages": [
|
| 14367 |
{
|
| 14368 |
"name": "English",
|
|
@@ -14380,7 +14380,7 @@
|
|
| 14380 |
"name": "Portuguese",
|
| 14381 |
"bcp_47": "pt",
|
| 14382 |
"population": 30723,
|
| 14383 |
-
"score": 0.
|
| 14384 |
}
|
| 14385 |
]
|
| 14386 |
},
|
|
@@ -14413,7 +14413,7 @@
|
|
| 14413 |
]
|
| 14414 |
},
|
| 14415 |
"MT": {
|
| 14416 |
-
"score": 0.
|
| 14417 |
"languages": [
|
| 14418 |
{
|
| 14419 |
"name": "English",
|
|
@@ -14431,7 +14431,7 @@
|
|
| 14431 |
"name": "Italian",
|
| 14432 |
"bcp_47": "it",
|
| 14433 |
"population": 256070,
|
| 14434 |
-
"score": 0.
|
| 14435 |
},
|
| 14436 |
{
|
| 14437 |
"name": "Maltese",
|
|
@@ -14442,7 +14442,7 @@
|
|
| 14442 |
]
|
| 14443 |
},
|
| 14444 |
"MU": {
|
| 14445 |
-
"score": 0.
|
| 14446 |
"languages": [
|
| 14447 |
{
|
| 14448 |
"name": "English",
|
|
@@ -14466,7 +14466,7 @@
|
|
| 14466 |
"name": "Tamil",
|
| 14467 |
"bcp_47": "ta",
|
| 14468 |
"population": 34484,
|
| 14469 |
-
"score": 0.
|
| 14470 |
},
|
| 14471 |
{
|
| 14472 |
"name": "Bhojpuri",
|
|
@@ -14594,7 +14594,7 @@
|
|
| 14594 |
]
|
| 14595 |
},
|
| 14596 |
"MY": {
|
| 14597 |
-
"score": 0.
|
| 14598 |
"languages": [
|
| 14599 |
{
|
| 14600 |
"name": "English",
|
|
@@ -14612,13 +14612,13 @@
|
|
| 14612 |
"name": "Javanese",
|
| 14613 |
"bcp_47": "jv",
|
| 14614 |
"population": 391825,
|
| 14615 |
-
"score": 0.
|
| 14616 |
},
|
| 14617 |
{
|
| 14618 |
"name": "Tamil",
|
| 14619 |
"bcp_47": "ta",
|
| 14620 |
"population": 1371388,
|
| 14621 |
-
"score": 0.
|
| 14622 |
},
|
| 14623 |
{
|
| 14624 |
"name": "Malayalam",
|
|
@@ -14665,7 +14665,7 @@
|
|
| 14665 |
]
|
| 14666 |
},
|
| 14667 |
"NA": {
|
| 14668 |
-
"score": 0.
|
| 14669 |
"languages": [
|
| 14670 |
{
|
| 14671 |
"name": "English",
|
|
@@ -14677,7 +14677,7 @@
|
|
| 14677 |
"name": "German",
|
| 14678 |
"bcp_47": "de",
|
| 14679 |
"population": 23671,
|
| 14680 |
-
"score": 0.
|
| 14681 |
},
|
| 14682 |
{
|
| 14683 |
"name": "Afrikaans",
|
|
@@ -14836,7 +14836,7 @@
|
|
| 14836 |
]
|
| 14837 |
},
|
| 14838 |
"NL": {
|
| 14839 |
-
"score": 0.
|
| 14840 |
"languages": [
|
| 14841 |
{
|
| 14842 |
"name": "English",
|
|
@@ -14854,19 +14854,19 @@
|
|
| 14854 |
"name": "Indonesian",
|
| 14855 |
"bcp_47": "id",
|
| 14856 |
"population": 311047,
|
| 14857 |
-
"score": 0.
|
| 14858 |
},
|
| 14859 |
{
|
| 14860 |
"name": "German",
|
| 14861 |
"bcp_47": "de",
|
| 14862 |
"population": 12269084,
|
| 14863 |
-
"score": 0.
|
| 14864 |
},
|
| 14865 |
{
|
| 14866 |
"name": "Turkish",
|
| 14867 |
"bcp_47": "tr",
|
| 14868 |
"population": 207365,
|
| 14869 |
-
"score": 0.
|
| 14870 |
},
|
| 14871 |
{
|
| 14872 |
"name": "Dutch",
|
|
@@ -15183,7 +15183,7 @@
|
|
| 15183 |
]
|
| 15184 |
},
|
| 15185 |
"PH": {
|
| 15186 |
-
"score": 0.
|
| 15187 |
"languages": [
|
| 15188 |
{
|
| 15189 |
"name": "English",
|
|
@@ -15207,7 +15207,7 @@
|
|
| 15207 |
"name": "Filipino",
|
| 15208 |
"bcp_47": "fil",
|
| 15209 |
"population": 65508600,
|
| 15210 |
-
"score": 0.
|
| 15211 |
},
|
| 15212 |
{
|
| 15213 |
"name": "Cebuano",
|
|
@@ -15308,7 +15308,7 @@
|
|
| 15308 |
]
|
| 15309 |
},
|
| 15310 |
"PK": {
|
| 15311 |
-
"score": 0.
|
| 15312 |
"languages": [
|
| 15313 |
{
|
| 15314 |
"name": "English",
|
|
@@ -15326,7 +15326,7 @@
|
|
| 15326 |
"name": "Punjabi",
|
| 15327 |
"bcp_47": "pa",
|
| 15328 |
"population": 163450700,
|
| 15329 |
-
"score": 0.
|
| 15330 |
},
|
| 15331 |
{
|
| 15332 |
"name": "Western Panjabi",
|
|
@@ -15338,7 +15338,7 @@
|
|
| 15338 |
"name": "Persian",
|
| 15339 |
"bcp_47": "fa",
|
| 15340 |
"population": 1541107,
|
| 15341 |
-
"score": 0.
|
| 15342 |
},
|
| 15343 |
{
|
| 15344 |
"name": "Pashto",
|
|
@@ -15457,7 +15457,7 @@
|
|
| 15457 |
]
|
| 15458 |
},
|
| 15459 |
"PL": {
|
| 15460 |
-
"score": 0.
|
| 15461 |
"languages": [
|
| 15462 |
{
|
| 15463 |
"name": "English",
|
|
@@ -15469,13 +15469,13 @@
|
|
| 15469 |
"name": "Russian",
|
| 15470 |
"bcp_47": "ru",
|
| 15471 |
"population": 6890814,
|
| 15472 |
-
"score": 0.
|
| 15473 |
},
|
| 15474 |
{
|
| 15475 |
"name": "German",
|
| 15476 |
"bcp_47": "de",
|
| 15477 |
"population": 7273637,
|
| 15478 |
-
"score": 0.
|
| 15479 |
},
|
| 15480 |
{
|
| 15481 |
"name": "Polish",
|
|
@@ -15573,7 +15573,7 @@
|
|
| 15573 |
]
|
| 15574 |
},
|
| 15575 |
"PT": {
|
| 15576 |
-
"score": 0.
|
| 15577 |
"languages": [
|
| 15578 |
{
|
| 15579 |
"name": "English",
|
|
@@ -15597,7 +15597,7 @@
|
|
| 15597 |
"name": "Portuguese",
|
| 15598 |
"bcp_47": "pt",
|
| 15599 |
"population": 9890592,
|
| 15600 |
-
"score": 0.
|
| 15601 |
},
|
| 15602 |
{
|
| 15603 |
"name": "Galician",
|
|
@@ -15625,7 +15625,7 @@
|
|
| 15625 |
]
|
| 15626 |
},
|
| 15627 |
"RO": {
|
| 15628 |
-
"score": 0.
|
| 15629 |
"languages": [
|
| 15630 |
{
|
| 15631 |
"name": "English",
|
|
@@ -15649,13 +15649,13 @@
|
|
| 15649 |
"name": "German",
|
| 15650 |
"bcp_47": "de",
|
| 15651 |
"population": 44736,
|
| 15652 |
-
"score": 0.
|
| 15653 |
},
|
| 15654 |
{
|
| 15655 |
"name": "Turkish",
|
| 15656 |
"bcp_47": "tr",
|
| 15657 |
"population": 27694,
|
| 15658 |
-
"score": 0.
|
| 15659 |
},
|
| 15660 |
{
|
| 15661 |
"name": "Polish",
|
|
@@ -15883,7 +15883,7 @@
|
|
| 15883 |
]
|
| 15884 |
},
|
| 15885 |
"SG": {
|
| 15886 |
-
"score": 0.
|
| 15887 |
"languages": [
|
| 15888 |
{
|
| 15889 |
"name": "English",
|
|
@@ -15901,13 +15901,13 @@
|
|
| 15901 |
"name": "Punjabi",
|
| 15902 |
"bcp_47": "pa",
|
| 15903 |
"population": 9314,
|
| 15904 |
-
"score": 0.
|
| 15905 |
},
|
| 15906 |
{
|
| 15907 |
"name": "Tamil",
|
| 15908 |
"bcp_47": "ta",
|
| 15909 |
"population": 130403,
|
| 15910 |
-
"score": 0.
|
| 15911 |
},
|
| 15912 |
{
|
| 15913 |
"name": "Malayalam",
|
|
@@ -15935,7 +15935,7 @@
|
|
| 15935 |
]
|
| 15936 |
},
|
| 15937 |
"SI": {
|
| 15938 |
-
"score": 0.
|
| 15939 |
"languages": [
|
| 15940 |
{
|
| 15941 |
"name": "English",
|
|
@@ -15947,13 +15947,13 @@
|
|
| 15947 |
"name": "German",
|
| 15948 |
"bcp_47": "de",
|
| 15949 |
"population": 883126,
|
| 15950 |
-
"score": 0.
|
| 15951 |
},
|
| 15952 |
{
|
| 15953 |
"name": "Italian",
|
| 15954 |
"bcp_47": "it",
|
| 15955 |
"population": 3995,
|
| 15956 |
-
"score": 0.
|
| 15957 |
},
|
| 15958 |
{
|
| 15959 |
"name": "Hungarian",
|
|
@@ -15982,7 +15982,7 @@
|
|
| 15982 |
]
|
| 15983 |
},
|
| 15984 |
"SK": {
|
| 15985 |
-
"score": 0.
|
| 15986 |
"languages": [
|
| 15987 |
{
|
| 15988 |
"name": "English",
|
|
@@ -15994,7 +15994,7 @@
|
|
| 15994 |
"name": "German",
|
| 15995 |
"bcp_47": "de",
|
| 15996 |
"population": 1196932,
|
| 15997 |
-
"score": 0.
|
| 15998 |
},
|
| 15999 |
{
|
| 16000 |
"name": "Polish",
|
|
@@ -16290,7 +16290,7 @@
|
|
| 16290 |
]
|
| 16291 |
},
|
| 16292 |
"TR": {
|
| 16293 |
-
"score": 0.
|
| 16294 |
"languages": [
|
| 16295 |
{
|
| 16296 |
"name": "English",
|
|
@@ -16308,7 +16308,7 @@
|
|
| 16308 |
"name": "Turkish",
|
| 16309 |
"bcp_47": "tr",
|
| 16310 |
"population": 76276275,
|
| 16311 |
-
"score": 0.
|
| 16312 |
},
|
| 16313 |
{
|
| 16314 |
"name": "North Levantine Arabic",
|
|
@@ -16467,7 +16467,7 @@
|
|
| 16467 |
]
|
| 16468 |
},
|
| 16469 |
"TZ": {
|
| 16470 |
-
"score": 0.
|
| 16471 |
"languages": [
|
| 16472 |
{
|
| 16473 |
"name": "English",
|
|
@@ -16479,7 +16479,7 @@
|
|
| 16479 |
"name": "Swahili",
|
| 16480 |
"bcp_47": "sw",
|
| 16481 |
"population": 52697520,
|
| 16482 |
-
"score": 0.
|
| 16483 |
},
|
| 16484 |
{
|
| 16485 |
"name": "Sukuma",
|
|
@@ -16568,7 +16568,7 @@
|
|
| 16568 |
]
|
| 16569 |
},
|
| 16570 |
"UG": {
|
| 16571 |
-
"score": 0.
|
| 16572 |
"languages": [
|
| 16573 |
{
|
| 16574 |
"name": "English",
|
|
@@ -16586,7 +16586,7 @@
|
|
| 16586 |
"name": "Swahili",
|
| 16587 |
"bcp_47": "sw",
|
| 16588 |
"population": 32439750,
|
| 16589 |
-
"score": 0.
|
| 16590 |
},
|
| 16591 |
{
|
| 16592 |
"name": "Kinyarwanda",
|
|
@@ -16662,7 +16662,7 @@
|
|
| 16662 |
]
|
| 16663 |
},
|
| 16664 |
"US": {
|
| 16665 |
-
"score": 0.
|
| 16666 |
"languages": [
|
| 16667 |
{
|
| 16668 |
"name": "English",
|
|
@@ -16692,37 +16692,37 @@
|
|
| 16692 |
"name": "Russian",
|
| 16693 |
"bcp_47": "ru",
|
| 16694 |
"population": 798334,
|
| 16695 |
-
"score": 0.
|
| 16696 |
},
|
| 16697 |
{
|
| 16698 |
"name": "German",
|
| 16699 |
"bcp_47": "de",
|
| 16700 |
"population": 1563403,
|
| 16701 |
-
"score": 0.
|
| 16702 |
},
|
| 16703 |
{
|
| 16704 |
"name": "Vietnamese",
|
| 16705 |
"bcp_47": "vi",
|
| 16706 |
"population": 1130973,
|
| 16707 |
-
"score": 0.
|
| 16708 |
},
|
| 16709 |
{
|
| 16710 |
"name": "Korean",
|
| 16711 |
"bcp_47": "ko",
|
| 16712 |
"population": 997917,
|
| 16713 |
-
"score": 0.
|
| 16714 |
},
|
| 16715 |
{
|
| 16716 |
"name": "Italian",
|
| 16717 |
"bcp_47": "it",
|
| 16718 |
"population": 1130973,
|
| 16719 |
-
"score": 0.
|
| 16720 |
},
|
| 16721 |
{
|
| 16722 |
"name": "Filipino",
|
| 16723 |
"bcp_47": "fil",
|
| 16724 |
"population": 1397084,
|
| 16725 |
-
"score": 0.
|
| 16726 |
},
|
| 16727 |
{
|
| 16728 |
"name": "Yiddish",
|
|
@@ -16925,7 +16925,7 @@
|
|
| 16925 |
]
|
| 16926 |
},
|
| 16927 |
"ZA": {
|
| 16928 |
-
"score": 0.
|
| 16929 |
"languages": [
|
| 16930 |
{
|
| 16931 |
"name": "English",
|
|
@@ -16943,7 +16943,7 @@
|
|
| 16943 |
"name": "Swahili",
|
| 16944 |
"bcp_47": "sw",
|
| 16945 |
"population": 1016,
|
| 16946 |
-
"score": 0.
|
| 16947 |
},
|
| 16948 |
{
|
| 16949 |
"name": "Zulu",
|
|
@@ -17125,7 +17125,7 @@
|
|
| 17125 |
]
|
| 17126 |
},
|
| 17127 |
"ID": {
|
| 17128 |
-
"score": 0.
|
| 17129 |
"languages": [
|
| 17130 |
{
|
| 17131 |
"name": "Chinese",
|
|
@@ -17137,13 +17137,13 @@
|
|
| 17137 |
"name": "Indonesian",
|
| 17138 |
"bcp_47": "id",
|
| 17139 |
"population": 170896640,
|
| 17140 |
-
"score": 0.
|
| 17141 |
},
|
| 17142 |
{
|
| 17143 |
"name": "Javanese",
|
| 17144 |
"bcp_47": "jv",
|
| 17145 |
"population": 90788840,
|
| 17146 |
-
"score": 0.
|
| 17147 |
},
|
| 17148 |
{
|
| 17149 |
"name": "Malay",
|
|
@@ -17304,7 +17304,7 @@
|
|
| 17304 |
]
|
| 17305 |
},
|
| 17306 |
"MN": {
|
| 17307 |
-
"score": 0.
|
| 17308 |
"languages": [
|
| 17309 |
{
|
| 17310 |
"name": "Chinese",
|
|
@@ -17316,7 +17316,7 @@
|
|
| 17316 |
"name": "Russian",
|
| 17317 |
"bcp_47": "ru",
|
| 17318 |
"population": 4118,
|
| 17319 |
-
"score": 0.
|
| 17320 |
},
|
| 17321 |
{
|
| 17322 |
"name": "Kazakh",
|
|
@@ -17408,7 +17408,7 @@
|
|
| 17408 |
]
|
| 17409 |
},
|
| 17410 |
"VN": {
|
| 17411 |
-
"score": 0.
|
| 17412 |
"languages": [
|
| 17413 |
{
|
| 17414 |
"name": "Chinese",
|
|
@@ -17420,7 +17420,7 @@
|
|
| 17420 |
"name": "Vietnamese",
|
| 17421 |
"bcp_47": "vi",
|
| 17422 |
"population": 84900318,
|
| 17423 |
-
"score": 0.
|
| 17424 |
},
|
| 17425 |
{
|
| 17426 |
"name": "Hmong Njua",
|
|
@@ -17603,7 +17603,7 @@
|
|
| 17603 |
]
|
| 17604 |
},
|
| 17605 |
"GQ": {
|
| 17606 |
-
"score": 0.
|
| 17607 |
"languages": [
|
| 17608 |
{
|
| 17609 |
"name": "Spanish",
|
|
@@ -17621,7 +17621,7 @@
|
|
| 17621 |
"name": "Portuguese",
|
| 17622 |
"bcp_47": "pt",
|
| 17623 |
"population": 1,
|
| 17624 |
-
"score": 0.
|
| 17625 |
},
|
| 17626 |
{
|
| 17627 |
"name": "Fang",
|
|
@@ -17700,7 +17700,7 @@
|
|
| 17700 |
]
|
| 17701 |
},
|
| 17702 |
"PY": {
|
| 17703 |
-
"score": 0.
|
| 17704 |
"languages": [
|
| 17705 |
{
|
| 17706 |
"name": "Spanish",
|
|
@@ -17712,7 +17712,7 @@
|
|
| 17712 |
"name": "German",
|
| 17713 |
"bcp_47": "de",
|
| 17714 |
"population": 208559,
|
| 17715 |
-
"score": 0.
|
| 17716 |
},
|
| 17717 |
{
|
| 17718 |
"name": "Guarani",
|
|
@@ -17819,7 +17819,7 @@
|
|
| 17819 |
]
|
| 17820 |
},
|
| 17821 |
"IR": {
|
| 17822 |
-
"score": 0.
|
| 17823 |
"languages": [
|
| 17824 |
{
|
| 17825 |
"name": "Arabic",
|
|
@@ -17831,7 +17831,7 @@
|
|
| 17831 |
"name": "Persian",
|
| 17832 |
"bcp_47": "fa",
|
| 17833 |
"population": 63692475,
|
| 17834 |
-
"score": 0.
|
| 17835 |
},
|
| 17836 |
{
|
| 17837 |
"name": "Pashto",
|
|
@@ -18166,7 +18166,7 @@
|
|
| 18166 |
]
|
| 18167 |
},
|
| 18168 |
"OM": {
|
| 18169 |
-
"score": 0.
|
| 18170 |
"languages": [
|
| 18171 |
{
|
| 18172 |
"name": "Arabic",
|
|
@@ -18178,7 +18178,7 @@
|
|
| 18178 |
"name": "Persian",
|
| 18179 |
"bcp_47": "fa",
|
| 18180 |
"population": 43849,
|
| 18181 |
-
"score": 0.
|
| 18182 |
},
|
| 18183 |
{
|
| 18184 |
"name": "Baluchi",
|
|
@@ -18206,7 +18206,7 @@
|
|
| 18206 |
]
|
| 18207 |
},
|
| 18208 |
"QA": {
|
| 18209 |
-
"score": 0.
|
| 18210 |
"languages": [
|
| 18211 |
{
|
| 18212 |
"name": "Arabic",
|
|
@@ -18218,7 +18218,7 @@
|
|
| 18218 |
"name": "Persian",
|
| 18219 |
"bcp_47": "fa",
|
| 18220 |
"population": 268859,
|
| 18221 |
-
"score": 0.
|
| 18222 |
},
|
| 18223 |
{
|
| 18224 |
"name": "Malayalam",
|
|
@@ -18246,7 +18246,7 @@
|
|
| 18246 |
]
|
| 18247 |
},
|
| 18248 |
"SO": {
|
| 18249 |
-
"score": 0.
|
| 18250 |
"languages": [
|
| 18251 |
{
|
| 18252 |
"name": "Arabic",
|
|
@@ -18258,7 +18258,7 @@
|
|
| 18258 |
"name": "Swahili",
|
| 18259 |
"bcp_47": "sw",
|
| 18260 |
"population": 235142,
|
| 18261 |
-
"score": 0.
|
| 18262 |
},
|
| 18263 |
{
|
| 18264 |
"name": "Oromo",
|
|
@@ -18333,7 +18333,7 @@
|
|
| 18333 |
]
|
| 18334 |
},
|
| 18335 |
"TJ": {
|
| 18336 |
-
"score":
|
| 18337 |
"languages": [
|
| 18338 |
{
|
| 18339 |
"name": "Arabic",
|
|
@@ -18345,13 +18345,13 @@
|
|
| 18345 |
"name": "Russian",
|
| 18346 |
"bcp_47": "ru",
|
| 18347 |
"population": 1064840,
|
| 18348 |
-
"score": 0.
|
| 18349 |
},
|
| 18350 |
{
|
| 18351 |
"name": "Persian",
|
| 18352 |
"bcp_47": "fa",
|
| 18353 |
"population": 69215,
|
| 18354 |
-
"score": 0.
|
| 18355 |
},
|
| 18356 |
{
|
| 18357 |
"name": "Tajik",
|
|
@@ -18454,7 +18454,7 @@
|
|
| 18454 |
]
|
| 18455 |
},
|
| 18456 |
"CD": {
|
| 18457 |
-
"score": 0.
|
| 18458 |
"languages": [
|
| 18459 |
{
|
| 18460 |
"name": "French",
|
|
@@ -18466,7 +18466,7 @@
|
|
| 18466 |
"name": "Swahili",
|
| 18467 |
"bcp_47": "sw",
|
| 18468 |
"population": 50890000,
|
| 18469 |
-
"score": 0.
|
| 18470 |
},
|
| 18471 |
{
|
| 18472 |
"name": "Kinyarwanda",
|
|
@@ -18718,7 +18718,7 @@
|
|
| 18718 |
]
|
| 18719 |
},
|
| 18720 |
"RE": {
|
| 18721 |
-
"score": 0.
|
| 18722 |
"languages": [
|
| 18723 |
{
|
| 18724 |
"name": "French",
|
|
@@ -18730,7 +18730,7 @@
|
|
| 18730 |
"name": "Tamil",
|
| 18731 |
"bcp_47": "ta",
|
| 18732 |
"population": 118138,
|
| 18733 |
-
"score": 0.
|
| 18734 |
},
|
| 18735 |
{
|
| 18736 |
"name": "Réunion Creole French",
|
|
@@ -18887,7 +18887,7 @@
|
|
| 18887 |
]
|
| 18888 |
},
|
| 18889 |
"YT": {
|
| 18890 |
-
"score": 0.
|
| 18891 |
"languages": [
|
| 18892 |
{
|
| 18893 |
"name": "French",
|
|
@@ -18899,7 +18899,7 @@
|
|
| 18899 |
"name": "Swahili",
|
| 18900 |
"bcp_47": "sw",
|
| 18901 |
"population": 2716,
|
| 18902 |
-
"score": 0.
|
| 18903 |
},
|
| 18904 |
{
|
| 18905 |
"name": "Comorian",
|
|
@@ -18916,13 +18916,13 @@
|
|
| 18916 |
]
|
| 18917 |
},
|
| 18918 |
"AO": {
|
| 18919 |
-
"score": 0.
|
| 18920 |
"languages": [
|
| 18921 |
{
|
| 18922 |
"name": "Portuguese",
|
| 18923 |
"bcp_47": "pt",
|
| 18924 |
"population": 21789941,
|
| 18925 |
-
"score": 0.
|
| 18926 |
},
|
| 18927 |
{
|
| 18928 |
"name": "Umbundu",
|
|
@@ -18945,13 +18945,13 @@
|
|
| 18945 |
]
|
| 18946 |
},
|
| 18947 |
"CV": {
|
| 18948 |
-
"score": 0.
|
| 18949 |
"languages": [
|
| 18950 |
{
|
| 18951 |
"name": "Portuguese",
|
| 18952 |
"bcp_47": "pt",
|
| 18953 |
"population": 443274,
|
| 18954 |
-
"score": 0.
|
| 18955 |
},
|
| 18956 |
{
|
| 18957 |
"name": "Kabuverdianu",
|
|
@@ -18962,13 +18962,13 @@
|
|
| 18962 |
]
|
| 18963 |
},
|
| 18964 |
"GW": {
|
| 18965 |
-
"score": 0.
|
| 18966 |
"languages": [
|
| 18967 |
{
|
| 18968 |
"name": "Portuguese",
|
| 18969 |
"bcp_47": "pt",
|
| 18970 |
"population": 1927100,
|
| 18971 |
-
"score": 0.
|
| 18972 |
},
|
| 18973 |
{
|
| 18974 |
"name": "Fula",
|
|
@@ -18985,19 +18985,19 @@
|
|
| 18985 |
]
|
| 18986 |
},
|
| 18987 |
"MZ": {
|
| 18988 |
-
"score": 0.
|
| 18989 |
"languages": [
|
| 18990 |
{
|
| 18991 |
"name": "Portuguese",
|
| 18992 |
"bcp_47": "pt",
|
| 18993 |
"population": 8126514,
|
| 18994 |
-
"score": 0.
|
| 18995 |
},
|
| 18996 |
{
|
| 18997 |
"name": "Swahili",
|
| 18998 |
"bcp_47": "sw",
|
| 18999 |
"population": 9330,
|
| 19000 |
-
"score": 0.
|
| 19001 |
},
|
| 19002 |
{
|
| 19003 |
"name": "Nyanja",
|
|
@@ -19062,24 +19062,24 @@
|
|
| 19062 |
]
|
| 19063 |
},
|
| 19064 |
"ST": {
|
| 19065 |
-
"score": 0.
|
| 19066 |
"languages": [
|
| 19067 |
{
|
| 19068 |
"name": "Portuguese",
|
| 19069 |
"bcp_47": "pt",
|
| 19070 |
"population": 179454,
|
| 19071 |
-
"score": 0.
|
| 19072 |
}
|
| 19073 |
]
|
| 19074 |
},
|
| 19075 |
"TL": {
|
| 19076 |
-
"score": 0.
|
| 19077 |
"languages": [
|
| 19078 |
{
|
| 19079 |
"name": "Portuguese",
|
| 19080 |
"bcp_47": "pt",
|
| 19081 |
"population": 816395,
|
| 19082 |
-
"score": 0.
|
| 19083 |
},
|
| 19084 |
{
|
| 19085 |
"name": "Tetum",
|
|
@@ -19090,13 +19090,13 @@
|
|
| 19090 |
]
|
| 19091 |
},
|
| 19092 |
"BY": {
|
| 19093 |
-
"score": 0.
|
| 19094 |
"languages": [
|
| 19095 |
{
|
| 19096 |
"name": "Russian",
|
| 19097 |
"bcp_47": "ru",
|
| 19098 |
"population": 1137350,
|
| 19099 |
-
"score": 0.
|
| 19100 |
},
|
| 19101 |
{
|
| 19102 |
"name": "Belarusian",
|
|
@@ -19107,13 +19107,13 @@
|
|
| 19107 |
]
|
| 19108 |
},
|
| 19109 |
"GE": {
|
| 19110 |
-
"score": 0.
|
| 19111 |
"languages": [
|
| 19112 |
{
|
| 19113 |
"name": "Russian",
|
| 19114 |
"bcp_47": "ru",
|
| 19115 |
"population": 359730,
|
| 19116 |
-
"score": 0.
|
| 19117 |
},
|
| 19118 |
{
|
| 19119 |
"name": "Kurdish",
|
|
@@ -19154,13 +19154,13 @@
|
|
| 19154 |
]
|
| 19155 |
},
|
| 19156 |
"KG": {
|
| 19157 |
-
"score": 0.
|
| 19158 |
"languages": [
|
| 19159 |
{
|
| 19160 |
"name": "Russian",
|
| 19161 |
"bcp_47": "ru",
|
| 19162 |
"population": 2147364,
|
| 19163 |
-
"score": 0.
|
| 19164 |
},
|
| 19165 |
{
|
| 19166 |
"name": "Kyrgyz",
|
|
@@ -19171,13 +19171,13 @@
|
|
| 19171 |
]
|
| 19172 |
},
|
| 19173 |
"MD": {
|
| 19174 |
-
"score": 0.
|
| 19175 |
"languages": [
|
| 19176 |
{
|
| 19177 |
"name": "Russian",
|
| 19178 |
"bcp_47": "ru",
|
| 19179 |
"population": 100935,
|
| 19180 |
-
"score": 0.
|
| 19181 |
},
|
| 19182 |
{
|
| 19183 |
"name": "Ukrainian",
|
|
@@ -19206,13 +19206,13 @@
|
|
| 19206 |
]
|
| 19207 |
},
|
| 19208 |
"RU": {
|
| 19209 |
-
"score": 0.
|
| 19210 |
"languages": [
|
| 19211 |
{
|
| 19212 |
"name": "Russian",
|
| 19213 |
"bcp_47": "ru",
|
| 19214 |
"population": 133218680,
|
| 19215 |
-
"score": 0.
|
| 19216 |
},
|
| 19217 |
{
|
| 19218 |
"name": "Azerbaijani",
|
|
@@ -19427,13 +19427,13 @@
|
|
| 19427 |
]
|
| 19428 |
},
|
| 19429 |
"SJ": {
|
| 19430 |
-
"score": 0.
|
| 19431 |
"languages": [
|
| 19432 |
{
|
| 19433 |
"name": "Russian",
|
| 19434 |
"bcp_47": "ru",
|
| 19435 |
"population": 1200,
|
| 19436 |
-
"score": 0.
|
| 19437 |
},
|
| 19438 |
{
|
| 19439 |
"name": "Norwegian Bokmål",
|
|
@@ -19444,13 +19444,13 @@
|
|
| 19444 |
]
|
| 19445 |
},
|
| 19446 |
"TM": {
|
| 19447 |
-
"score": 0.
|
| 19448 |
"languages": [
|
| 19449 |
{
|
| 19450 |
"name": "Russian",
|
| 19451 |
"bcp_47": "ru",
|
| 19452 |
"population": 663436,
|
| 19453 |
-
"score": 0.
|
| 19454 |
},
|
| 19455 |
{
|
| 19456 |
"name": "Uzbek",
|
|
@@ -19473,19 +19473,19 @@
|
|
| 19473 |
]
|
| 19474 |
},
|
| 19475 |
"UA": {
|
| 19476 |
-
"score": 0.
|
| 19477 |
"languages": [
|
| 19478 |
{
|
| 19479 |
"name": "Russian",
|
| 19480 |
"bcp_47": "ru",
|
| 19481 |
"population": 20204534,
|
| 19482 |
-
"score": 0.
|
| 19483 |
},
|
| 19484 |
{
|
| 19485 |
"name": "Turkish",
|
| 19486 |
"bcp_47": "tr",
|
| 19487 |
"population": 184476,
|
| 19488 |
-
"score": 0.
|
| 19489 |
},
|
| 19490 |
{
|
| 19491 |
"name": "Polish",
|
|
@@ -19550,19 +19550,19 @@
|
|
| 19550 |
]
|
| 19551 |
},
|
| 19552 |
"UZ": {
|
| 19553 |
-
"score": 0.
|
| 19554 |
"languages": [
|
| 19555 |
{
|
| 19556 |
"name": "Russian",
|
| 19557 |
"bcp_47": "ru",
|
| 19558 |
"population": 4279156,
|
| 19559 |
-
"score": 0.
|
| 19560 |
},
|
| 19561 |
{
|
| 19562 |
"name": "Turkish",
|
| 19563 |
"bcp_47": "tr",
|
| 19564 |
"population": 232297,
|
| 19565 |
-
"score": 0.
|
| 19566 |
},
|
| 19567 |
{
|
| 19568 |
"name": "Uzbek",
|
|
@@ -19579,13 +19579,13 @@
|
|
| 19579 |
]
|
| 19580 |
},
|
| 19581 |
"LI": {
|
| 19582 |
-
"score": 0.
|
| 19583 |
"languages": [
|
| 19584 |
{
|
| 19585 |
"name": "German",
|
| 19586 |
"bcp_47": "de",
|
| 19587 |
"population": 39137,
|
| 19588 |
-
"score": 0.
|
| 19589 |
},
|
| 19590 |
{
|
| 19591 |
"name": "Swiss German",
|
|
@@ -19602,19 +19602,19 @@
|
|
| 19602 |
]
|
| 19603 |
},
|
| 19604 |
"JP": {
|
| 19605 |
-
"score": 0.
|
| 19606 |
"languages": [
|
| 19607 |
{
|
| 19608 |
"name": "Japanese",
|
| 19609 |
"bcp_47": "ja",
|
| 19610 |
"population": 119231650,
|
| 19611 |
-
"score": 0.
|
| 19612 |
},
|
| 19613 |
{
|
| 19614 |
"name": "Korean",
|
| 19615 |
"bcp_47": "ko",
|
| 19616 |
"population": 652636,
|
| 19617 |
-
"score": 0.
|
| 19618 |
},
|
| 19619 |
{
|
| 19620 |
"name": "Central Okinawan",
|
|
@@ -19625,13 +19625,13 @@
|
|
| 19625 |
]
|
| 19626 |
},
|
| 19627 |
"AF": {
|
| 19628 |
-
"score": 0.
|
| 19629 |
"languages": [
|
| 19630 |
{
|
| 19631 |
"name": "Persian",
|
| 19632 |
"bcp_47": "fa",
|
| 19633 |
"population": 18321900,
|
| 19634 |
-
"score": 0.
|
| 19635 |
},
|
| 19636 |
{
|
| 19637 |
"name": "Pashto",
|
|
@@ -19684,13 +19684,13 @@
|
|
| 19684 |
]
|
| 19685 |
},
|
| 19686 |
"MK": {
|
| 19687 |
-
"score": 0.
|
| 19688 |
"languages": [
|
| 19689 |
{
|
| 19690 |
"name": "Turkish",
|
| 19691 |
"bcp_47": "tr",
|
| 19692 |
"population": 74409,
|
| 19693 |
-
"score": 0.
|
| 19694 |
},
|
| 19695 |
{
|
| 19696 |
"name": "Albanian",
|
|
@@ -19707,35 +19707,35 @@
|
|
| 19707 |
]
|
| 19708 |
},
|
| 19709 |
"KP": {
|
| 19710 |
-
"score": 0.
|
| 19711 |
"languages": [
|
| 19712 |
{
|
| 19713 |
"name": "Korean",
|
| 19714 |
"bcp_47": "ko",
|
| 19715 |
"population": 22566280,
|
| 19716 |
-
"score": 0.
|
| 19717 |
}
|
| 19718 |
]
|
| 19719 |
},
|
| 19720 |
"KR": {
|
| 19721 |
-
"score": 0.
|
| 19722 |
"languages": [
|
| 19723 |
{
|
| 19724 |
"name": "Korean",
|
| 19725 |
"bcp_47": "ko",
|
| 19726 |
"population": 51835100,
|
| 19727 |
-
"score": 0.
|
| 19728 |
}
|
| 19729 |
]
|
| 19730 |
},
|
| 19731 |
"SM": {
|
| 19732 |
-
"score": 0.
|
| 19733 |
"languages": [
|
| 19734 |
{
|
| 19735 |
"name": "Italian",
|
| 19736 |
"bcp_47": "it",
|
| 19737 |
"population": 30466,
|
| 19738 |
-
"score": 0.
|
| 19739 |
},
|
| 19740 |
{
|
| 19741 |
"name": "Esperanto",
|
|
@@ -19746,13 +19746,13 @@
|
|
| 19746 |
]
|
| 19747 |
},
|
| 19748 |
"VA": {
|
| 19749 |
-
"score": 0.
|
| 19750 |
"languages": [
|
| 19751 |
{
|
| 19752 |
"name": "Italian",
|
| 19753 |
"bcp_47": "it",
|
| 19754 |
"population": 820,
|
| 19755 |
-
"score": 0.
|
| 19756 |
},
|
| 19757 |
{
|
| 19758 |
"name": "Latin",
|
|
|
|
| 26 |
"license": null,
|
| 27 |
"average": 0.66,
|
| 28 |
"classification_accuracy": 0.73,
|
| 29 |
+
"language_modeling_chrf": 0.96,
|
| 30 |
"translation_bleu": 0.4,
|
| 31 |
"translation_chrf": 0.54
|
| 32 |
},
|
|
|
|
| 39 |
"size": 27432406640.0,
|
| 40 |
"type": "Open",
|
| 41 |
"license": "Gemma",
|
| 42 |
+
"average": 0.64,
|
| 43 |
"classification_accuracy": 0.72,
|
| 44 |
+
"language_modeling_chrf": 0.94,
|
| 45 |
"translation_bleu": 0.37,
|
| 46 |
"translation_chrf": 0.54
|
| 47 |
},
|
|
|
|
| 54 |
"size": 70553706496.0,
|
| 55 |
"type": "Open",
|
| 56 |
"license": "Llama3.1",
|
| 57 |
+
"average": 0.63,
|
| 58 |
"classification_accuracy": 0.57,
|
| 59 |
+
"language_modeling_chrf": 0.95,
|
| 60 |
"translation_bleu": 0.43,
|
| 61 |
"translation_chrf": 0.57
|
| 62 |
},
|
| 63 |
{
|
| 64 |
"rank": 5,
|
| 65 |
+
"provider": "Meta Llama",
|
| 66 |
+
"model": "Llama 3 70b Instruct",
|
| 67 |
"hf_id": null,
|
| 68 |
"creation_date": null,
|
| 69 |
"size": null,
|
| 70 |
"type": "Commercial",
|
| 71 |
"license": null,
|
| 72 |
"average": 0.61,
|
| 73 |
+
"classification_accuracy": 0.8,
|
| 74 |
+
"language_modeling_chrf": 0.96,
|
| 75 |
+
"translation_bleu": 0.25,
|
| 76 |
+
"translation_chrf": 0.43
|
| 77 |
},
|
| 78 |
{
|
| 79 |
"rank": 6,
|
| 80 |
+
"provider": "Amazon",
|
| 81 |
+
"model": "Nova Micro V1",
|
| 82 |
"hf_id": null,
|
| 83 |
"creation_date": null,
|
| 84 |
"size": null,
|
| 85 |
"type": "Commercial",
|
| 86 |
"license": null,
|
| 87 |
+
"average": 0.6,
|
| 88 |
+
"classification_accuracy": 0.52,
|
| 89 |
+
"language_modeling_chrf": 0.94,
|
| 90 |
+
"translation_bleu": 0.4,
|
| 91 |
+
"translation_chrf": 0.56
|
| 92 |
},
|
| 93 |
{
|
| 94 |
"rank": 7,
|
|
|
|
| 101 |
"license": null,
|
| 102 |
"average": 0.6,
|
| 103 |
"classification_accuracy": 0.52,
|
| 104 |
+
"language_modeling_chrf": 0.96,
|
| 105 |
"translation_bleu": 0.39,
|
| 106 |
"translation_chrf": 0.55
|
| 107 |
},
|
|
|
|
| 116 |
"license": "Apache 2.0",
|
| 117 |
"average": 0.58,
|
| 118 |
"classification_accuracy": 0.55,
|
| 119 |
+
"language_modeling_chrf": 0.88,
|
| 120 |
"translation_bleu": 0.38,
|
| 121 |
"translation_chrf": 0.52
|
| 122 |
},
|
|
|
|
| 129 |
"size": 70553706496.0,
|
| 130 |
"type": "Open",
|
| 131 |
"license": "Llama3.3",
|
| 132 |
+
"average": 0.55,
|
| 133 |
+
"classification_accuracy": 0.51,
|
| 134 |
"language_modeling_chrf": 0.94,
|
| 135 |
+
"translation_bleu": 0.28,
|
| 136 |
+
"translation_chrf": 0.46
|
| 137 |
},
|
| 138 |
{
|
| 139 |
"rank": 10,
|
|
|
|
| 144 |
"size": null,
|
| 145 |
"type": "Commercial",
|
| 146 |
"license": null,
|
| 147 |
+
"average": 0.54,
|
| 148 |
"classification_accuracy": 0.5,
|
| 149 |
+
"language_modeling_chrf": 0.86,
|
| 150 |
"translation_bleu": 0.32,
|
| 151 |
"translation_chrf": 0.49
|
| 152 |
},
|
|
|
|
| 161 |
"license": "Mit",
|
| 162 |
"average": 0.52,
|
| 163 |
"classification_accuracy": 0.42,
|
| 164 |
+
"language_modeling_chrf": 0.88,
|
| 165 |
"translation_bleu": 0.32,
|
| 166 |
"translation_chrf": 0.46
|
| 167 |
},
|
|
|
|
| 176 |
"license": "Apache 2.0",
|
| 177 |
"average": 0.25,
|
| 178 |
"classification_accuracy": 0.0,
|
| 179 |
+
"language_modeling_chrf": 0.47,
|
| 180 |
"translation_bleu": 0.21,
|
| 181 |
"translation_chrf": 0.3
|
| 182 |
}
|
|
|
|
| 220 |
"in_benchmark": true,
|
| 221 |
"NaN": 0.0,
|
| 222 |
"classification_accuracy": 0.53,
|
| 223 |
+
"language_modeling_chrf": 0.94,
|
| 224 |
"translation_bleu": 0.32,
|
| 225 |
"translation_chrf": 0.49
|
| 226 |
},
|
|
|
|
| 248 |
"in_benchmark": true,
|
| 249 |
"NaN": 0.0,
|
| 250 |
"classification_accuracy": 0.43,
|
| 251 |
+
"language_modeling_chrf": 0.94,
|
| 252 |
"translation_bleu": 0.28,
|
| 253 |
"translation_chrf": 0.47
|
| 254 |
},
|
|
|
|
| 262 |
"in_benchmark": true,
|
| 263 |
"NaN": 0.0,
|
| 264 |
"classification_accuracy": 0.5,
|
| 265 |
+
"language_modeling_chrf": 0.92,
|
| 266 |
"translation_bleu": 0.24,
|
| 267 |
"translation_chrf": 0.42
|
| 268 |
},
|
|
|
|
| 290 |
"in_benchmark": true,
|
| 291 |
"NaN": 0.0,
|
| 292 |
"classification_accuracy": 0.4,
|
| 293 |
+
"language_modeling_chrf": 0.91,
|
| 294 |
"translation_bleu": 0.2,
|
| 295 |
"translation_chrf": 0.41
|
| 296 |
},
|
|
|
|
| 300 |
"autonym": "Português",
|
| 301 |
"speakers": 237496885,
|
| 302 |
"family": "Indo-European",
|
| 303 |
+
"average": 0.45,
|
| 304 |
"in_benchmark": true,
|
| 305 |
"NaN": 0.0,
|
| 306 |
"classification_accuracy": 0.5,
|
| 307 |
+
"language_modeling_chrf": 0.96,
|
| 308 |
"translation_bleu": 0.31,
|
| 309 |
"translation_chrf": 0.49
|
| 310 |
},
|
|
|
|
| 314 |
"autonym": "ਪੰਜਾਬੀ",
|
| 315 |
"speakers": 203571210,
|
| 316 |
"family": "Indo-European",
|
| 317 |
+
"average": 0.43,
|
| 318 |
"in_benchmark": true,
|
| 319 |
"NaN": 0.0,
|
| 320 |
"classification_accuracy": 0.4,
|
| 321 |
+
"language_modeling_chrf": 0.9,
|
| 322 |
"translation_bleu": 0.34,
|
| 323 |
"translation_chrf": 0.49
|
| 324 |
},
|
|
|
|
| 328 |
"autonym": "Русский",
|
| 329 |
"speakers": 195841151,
|
| 330 |
"family": "Indo-European",
|
| 331 |
+
"average": 0.45,
|
| 332 |
"in_benchmark": true,
|
| 333 |
"NaN": 0.0,
|
| 334 |
+
"classification_accuracy": 0.57,
|
| 335 |
+
"language_modeling_chrf": 0.97,
|
| 336 |
+
"translation_bleu": 0.26,
|
| 337 |
+
"translation_chrf": 0.45
|
| 338 |
},
|
| 339 |
{
|
| 340 |
"bcp_47": "sw",
|
|
|
|
| 342 |
"autonym": "Kiswahili",
|
| 343 |
"speakers": 171610296,
|
| 344 |
"family": "Atlantic-Congo",
|
| 345 |
+
"average": 0.45,
|
| 346 |
"in_benchmark": true,
|
| 347 |
"NaN": 0.0,
|
| 348 |
+
"classification_accuracy": 0.57,
|
| 349 |
+
"language_modeling_chrf": 0.94,
|
| 350 |
+
"translation_bleu": 0.3,
|
| 351 |
+
"translation_chrf": 0.47
|
| 352 |
},
|
| 353 |
{
|
| 354 |
"bcp_47": "id",
|
|
|
|
| 356 |
"autonym": "Bahasa Indonesia",
|
| 357 |
"speakers": 171207687,
|
| 358 |
"family": "Austronesian",
|
| 359 |
+
"average": 0.47,
|
| 360 |
"in_benchmark": true,
|
| 361 |
"NaN": 0.0,
|
| 362 |
+
"classification_accuracy": 0.63,
|
| 363 |
+
"language_modeling_chrf": 0.96,
|
| 364 |
+
"translation_bleu": 0.29,
|
| 365 |
+
"translation_chrf": 0.47
|
| 366 |
},
|
| 367 |
{
|
| 368 |
"bcp_47": "de",
|
|
|
|
| 370 |
"autonym": "Deutsch",
|
| 371 |
"speakers": 136350226,
|
| 372 |
"family": "Indo-European",
|
| 373 |
+
"average": 0.49,
|
| 374 |
"in_benchmark": true,
|
| 375 |
"NaN": 0.0,
|
| 376 |
+
"classification_accuracy": 0.67,
|
| 377 |
+
"language_modeling_chrf": 0.96,
|
| 378 |
+
"translation_bleu": 0.32,
|
| 379 |
+
"translation_chrf": 0.5
|
| 380 |
},
|
| 381 |
{
|
| 382 |
"bcp_47": "ja",
|
|
|
|
| 384 |
"autonym": "日本語",
|
| 385 |
"speakers": 119729026,
|
| 386 |
"family": "Japonic",
|
| 387 |
+
"average": 0.46,
|
| 388 |
"in_benchmark": true,
|
| 389 |
"NaN": 0.0,
|
| 390 |
+
"classification_accuracy": 0.63,
|
| 391 |
+
"language_modeling_chrf": 0.94,
|
| 392 |
+
"translation_bleu": 0.27,
|
| 393 |
+
"translation_chrf": 0.44
|
| 394 |
},
|
| 395 |
{
|
| 396 |
"bcp_47": "te",
|
|
|
|
| 398 |
"autonym": "తెలుగు",
|
| 399 |
"speakers": 95478480,
|
| 400 |
"family": "Dravidian",
|
| 401 |
+
"average": 0.41,
|
| 402 |
"in_benchmark": true,
|
| 403 |
"NaN": 0.0,
|
| 404 |
+
"classification_accuracy": 0.37,
|
| 405 |
+
"language_modeling_chrf": 0.95,
|
| 406 |
+
"translation_bleu": 0.28,
|
| 407 |
+
"translation_chrf": 0.47
|
| 408 |
},
|
| 409 |
{
|
| 410 |
"bcp_47": "lah",
|
|
|
|
| 426 |
"autonym": "मराठी",
|
| 427 |
"speakers": 92826300,
|
| 428 |
"family": "Indo-European",
|
| 429 |
+
"average": 0.45,
|
| 430 |
"in_benchmark": true,
|
| 431 |
"NaN": 0.0,
|
| 432 |
+
"classification_accuracy": 0.63,
|
| 433 |
+
"language_modeling_chrf": 0.94,
|
| 434 |
+
"translation_bleu": 0.25,
|
| 435 |
+
"translation_chrf": 0.42
|
| 436 |
},
|
| 437 |
{
|
| 438 |
"bcp_47": "jv",
|
|
|
|
| 440 |
"autonym": "Jawa",
|
| 441 |
"speakers": 91180665,
|
| 442 |
"family": "Austronesian",
|
| 443 |
+
"average": 0.41,
|
| 444 |
"in_benchmark": true,
|
| 445 |
"NaN": 0.0,
|
| 446 |
+
"classification_accuracy": 0.47,
|
| 447 |
+
"language_modeling_chrf": 0.93,
|
| 448 |
+
"translation_bleu": 0.24,
|
| 449 |
+
"translation_chrf": 0.42
|
| 450 |
},
|
| 451 |
{
|
| 452 |
"bcp_47": "vi",
|
|
|
|
| 454 |
"autonym": "Tiếng Việt",
|
| 455 |
"speakers": 86222962,
|
| 456 |
"family": "Austroasiatic",
|
| 457 |
+
"average": 0.45,
|
| 458 |
"in_benchmark": true,
|
| 459 |
"NaN": 0.0,
|
| 460 |
+
"classification_accuracy": 0.6,
|
| 461 |
+
"language_modeling_chrf": 0.96,
|
| 462 |
+
"translation_bleu": 0.26,
|
| 463 |
+
"translation_chrf": 0.44
|
| 464 |
},
|
| 465 |
{
|
| 466 |
"bcp_47": "ta",
|
|
|
|
| 468 |
"autonym": "தமிழ்",
|
| 469 |
"speakers": 85616159,
|
| 470 |
"family": "Dravidian",
|
| 471 |
+
"average": 0.41,
|
| 472 |
"in_benchmark": true,
|
| 473 |
"NaN": 0.0,
|
| 474 |
+
"classification_accuracy": 0.43,
|
| 475 |
+
"language_modeling_chrf": 0.96,
|
| 476 |
+
"translation_bleu": 0.25,
|
| 477 |
+
"translation_chrf": 0.42
|
| 478 |
},
|
| 479 |
{
|
| 480 |
"bcp_47": "fa",
|
|
|
|
| 482 |
"autonym": "فارسی",
|
| 483 |
"speakers": 84710459,
|
| 484 |
"family": "Indo-European",
|
| 485 |
+
"average": 0.41,
|
| 486 |
"in_benchmark": true,
|
| 487 |
"NaN": 0.0,
|
| 488 |
+
"classification_accuracy": 0.4,
|
| 489 |
+
"language_modeling_chrf": 0.94,
|
| 490 |
+
"translation_bleu": 0.26,
|
| 491 |
+
"translation_chrf": 0.45
|
| 492 |
},
|
| 493 |
{
|
| 494 |
"bcp_47": "wuu",
|
|
|
|
| 510 |
"autonym": "Türkçe",
|
| 511 |
"speakers": 80360704,
|
| 512 |
"family": "Turkic",
|
| 513 |
+
"average": 0.44,
|
| 514 |
"in_benchmark": true,
|
| 515 |
"NaN": 0.0,
|
| 516 |
+
"classification_accuracy": 0.53,
|
| 517 |
+
"language_modeling_chrf": 0.94,
|
| 518 |
+
"translation_bleu": 0.28,
|
| 519 |
+
"translation_chrf": 0.45
|
| 520 |
},
|
| 521 |
{
|
| 522 |
"bcp_47": "yue",
|
|
|
|
| 524 |
"autonym": "粵語",
|
| 525 |
"speakers": 79654759,
|
| 526 |
"family": "Sino-Tibetan",
|
| 527 |
+
"average": 0.39,
|
| 528 |
"in_benchmark": true,
|
| 529 |
"NaN": 0.0,
|
| 530 |
+
"classification_accuracy": 0.43,
|
| 531 |
+
"language_modeling_chrf": 0.9,
|
| 532 |
+
"translation_bleu": 0.23,
|
| 533 |
+
"translation_chrf": 0.41
|
| 534 |
},
|
| 535 |
{
|
| 536 |
"bcp_47": "ko",
|
|
|
|
| 538 |
"autonym": "한국어",
|
| 539 |
"speakers": 78357046,
|
| 540 |
"family": "Koreanic",
|
| 541 |
+
"average": 0.41,
|
| 542 |
"in_benchmark": true,
|
| 543 |
"NaN": 0.0,
|
| 544 |
+
"classification_accuracy": 0.53,
|
| 545 |
+
"language_modeling_chrf": 0.94,
|
| 546 |
+
"translation_bleu": 0.2,
|
| 547 |
+
"translation_chrf": 0.4
|
| 548 |
},
|
| 549 |
{
|
| 550 |
"bcp_47": "it",
|
|
|
|
| 552 |
"autonym": "Italiano",
|
| 553 |
"speakers": 70247060,
|
| 554 |
"family": "Indo-European",
|
| 555 |
+
"average": 0.47,
|
| 556 |
"in_benchmark": true,
|
| 557 |
"NaN": 0.0,
|
| 558 |
+
"classification_accuracy": 0.67,
|
| 559 |
+
"language_modeling_chrf": 0.94,
|
| 560 |
+
"translation_bleu": 0.28,
|
| 561 |
+
"translation_chrf": 0.47
|
| 562 |
},
|
| 563 |
{
|
| 564 |
"bcp_47": "fil",
|
|
|
|
| 566 |
"autonym": "Filipino",
|
| 567 |
"speakers": 67471096,
|
| 568 |
"family": "Austronesian",
|
| 569 |
+
"average": 0.42,
|
| 570 |
"in_benchmark": true,
|
| 571 |
"NaN": 0.0,
|
| 572 |
+
"classification_accuracy": 0.43,
|
| 573 |
+
"language_modeling_chrf": 0.94,
|
| 574 |
+
"translation_bleu": 0.29,
|
| 575 |
+
"translation_chrf": 0.45
|
| 576 |
},
|
| 577 |
{
|
| 578 |
"bcp_47": "arz",
|
|
|
|
| 580 |
"autonym": "Egyptian Arabic",
|
| 581 |
"speakers": 66639360,
|
| 582 |
"family": "Afro-Asiatic",
|
| 583 |
+
"average": 0.38,
|
| 584 |
"in_benchmark": true,
|
| 585 |
"NaN": 0.0,
|
| 586 |
+
"classification_accuracy": 0.4,
|
| 587 |
+
"language_modeling_chrf": 0.93,
|
| 588 |
+
"translation_bleu": 0.2,
|
| 589 |
+
"translation_chrf": 0.39
|
| 590 |
},
|
| 591 |
{
|
| 592 |
"bcp_47": "gu",
|
|
|
|
| 594 |
"autonym": "ગુજરાતી",
|
| 595 |
"speakers": 61721799,
|
| 596 |
"family": "Indo-European",
|
| 597 |
+
"average": 0.42,
|
| 598 |
"in_benchmark": true,
|
| 599 |
"NaN": 0.0,
|
| 600 |
+
"classification_accuracy": 0.43,
|
| 601 |
+
"language_modeling_chrf": 0.94,
|
| 602 |
+
"translation_bleu": 0.26,
|
| 603 |
+
"translation_chrf": 0.44
|
| 604 |
},
|
| 605 |
{
|
| 606 |
"bcp_47": "th",
|
|
|
|
| 10164 |
]
|
| 10165 |
},
|
| 10166 |
"AE": {
|
| 10167 |
+
"score": 0.40140041521976655,
|
| 10168 |
"languages": [
|
| 10169 |
{
|
| 10170 |
"name": "English",
|
|
|
|
| 10182 |
"name": "Persian",
|
| 10183 |
"bcp_47": "fa",
|
| 10184 |
"population": 189850,
|
| 10185 |
+
"score": 0.41
|
| 10186 |
},
|
| 10187 |
{
|
| 10188 |
"name": "Pashto",
|
|
|
|
| 10205 |
]
|
| 10206 |
},
|
| 10207 |
"AG": {
|
| 10208 |
+
"score": 0.4696346724027672,
|
| 10209 |
"languages": [
|
| 10210 |
{
|
| 10211 |
"name": "English",
|
|
|
|
| 10217 |
"name": "Portuguese",
|
| 10218 |
"bcp_47": "pt",
|
| 10219 |
"population": 1571,
|
| 10220 |
+
"score": 0.45
|
| 10221 |
}
|
| 10222 |
]
|
| 10223 |
},
|
|
|
|
| 10290 |
]
|
| 10291 |
},
|
| 10292 |
"AT": {
|
| 10293 |
+
"score": 0.31771431191158667,
|
| 10294 |
"languages": [
|
| 10295 |
{
|
| 10296 |
"name": "English",
|
|
|
|
| 10308 |
"name": "German",
|
| 10309 |
"bcp_47": "de",
|
| 10310 |
"population": 8593666,
|
| 10311 |
+
"score": 0.49
|
| 10312 |
},
|
| 10313 |
{
|
| 10314 |
"name": "Italian",
|
| 10315 |
"bcp_47": "it",
|
| 10316 |
"population": 797350,
|
| 10317 |
+
"score": 0.47
|
| 10318 |
},
|
| 10319 |
{
|
| 10320 |
"name": "Bavarian",
|
|
|
|
| 10343 |
]
|
| 10344 |
},
|
| 10345 |
"AU": {
|
| 10346 |
+
"score": 0.46970357171432847,
|
| 10347 |
"languages": [
|
| 10348 |
{
|
| 10349 |
"name": "English",
|
|
|
|
| 10361 |
"name": "Italian",
|
| 10362 |
"bcp_47": "it",
|
| 10363 |
"population": 483864,
|
| 10364 |
+
"score": 0.47
|
| 10365 |
},
|
| 10366 |
{
|
| 10367 |
"name": "Hmong Njua",
|
|
|
|
| 10506 |
]
|
| 10507 |
},
|
| 10508 |
"BE": {
|
| 10509 |
+
"score": 0.29499472599184506,
|
| 10510 |
"languages": [
|
| 10511 |
{
|
| 10512 |
"name": "English",
|
|
|
|
| 10524 |
"name": "German",
|
| 10525 |
"bcp_47": "de",
|
| 10526 |
"population": 2578554,
|
| 10527 |
+
"score": 0.49
|
| 10528 |
},
|
| 10529 |
{
|
| 10530 |
"name": "Dutch",
|
|
|
|
| 10547 |
]
|
| 10548 |
},
|
| 10549 |
"BG": {
|
| 10550 |
+
"score": 0.18479041916167663,
|
| 10551 |
"languages": [
|
| 10552 |
{
|
| 10553 |
"name": "English",
|
|
|
|
| 10559 |
"name": "Russian",
|
| 10560 |
"bcp_47": "ru",
|
| 10561 |
"population": 1602387,
|
| 10562 |
+
"score": 0.45
|
| 10563 |
},
|
| 10564 |
{
|
| 10565 |
"name": "German",
|
| 10566 |
"bcp_47": "de",
|
| 10567 |
"population": 557352,
|
| 10568 |
+
"score": 0.49
|
| 10569 |
},
|
| 10570 |
{
|
| 10571 |
"name": "Turkish",
|
| 10572 |
"bcp_47": "tr",
|
| 10573 |
"population": 766359,
|
| 10574 |
+
"score": 0.44
|
| 10575 |
},
|
| 10576 |
{
|
| 10577 |
"name": "Bulgarian",
|
|
|
|
| 10582 |
]
|
| 10583 |
},
|
| 10584 |
"BI": {
|
| 10585 |
+
"score": 0.2226670965568091,
|
| 10586 |
"languages": [
|
| 10587 |
{
|
| 10588 |
"name": "English",
|
|
|
|
| 10600 |
"name": "Swahili",
|
| 10601 |
"bcp_47": "sw",
|
| 10602 |
"population": 6408,
|
| 10603 |
+
"score": 0.45
|
| 10604 |
},
|
| 10605 |
{
|
| 10606 |
"name": "Rundi",
|
|
|
|
| 10645 |
]
|
| 10646 |
},
|
| 10647 |
"BR": {
|
| 10648 |
+
"score": 0.45070787745315494,
|
| 10649 |
"languages": [
|
| 10650 |
{
|
| 10651 |
"name": "English",
|
|
|
|
| 10663 |
"name": "Portuguese",
|
| 10664 |
"bcp_47": "pt",
|
| 10665 |
"population": 192661560,
|
| 10666 |
+
"score": 0.45
|
| 10667 |
},
|
| 10668 |
{
|
| 10669 |
"name": "German",
|
| 10670 |
"bcp_47": "de",
|
| 10671 |
"population": 1778414,
|
| 10672 |
+
"score": 0.49
|
| 10673 |
},
|
| 10674 |
{
|
| 10675 |
"name": "Japanese",
|
| 10676 |
"bcp_47": "ja",
|
| 10677 |
"population": 444604,
|
| 10678 |
+
"score": 0.46
|
| 10679 |
},
|
| 10680 |
{
|
| 10681 |
"name": "Korean",
|
| 10682 |
"bcp_47": "ko",
|
| 10683 |
"population": 44460,
|
| 10684 |
+
"score": 0.41
|
| 10685 |
},
|
| 10686 |
{
|
| 10687 |
"name": "Italian",
|
| 10688 |
"bcp_47": "it",
|
| 10689 |
"population": 592805,
|
| 10690 |
+
"score": 0.47
|
| 10691 |
},
|
| 10692 |
{
|
| 10693 |
"name": "Venetian",
|
|
|
|
| 10819 |
]
|
| 10820 |
},
|
| 10821 |
"CA": {
|
| 10822 |
+
"score": 0.4538591979207903,
|
| 10823 |
"languages": [
|
| 10824 |
{
|
| 10825 |
"name": "English",
|
|
|
|
| 10873 |
"name": "Portuguese",
|
| 10874 |
"bcp_47": "pt",
|
| 10875 |
"population": 229934,
|
| 10876 |
+
"score": 0.45
|
| 10877 |
},
|
| 10878 |
{
|
| 10879 |
"name": "Punjabi",
|
| 10880 |
"bcp_47": "pa",
|
| 10881 |
"population": 603106,
|
| 10882 |
+
"score": 0.43
|
| 10883 |
},
|
| 10884 |
{
|
| 10885 |
"name": "Russian",
|
| 10886 |
"bcp_47": "ru",
|
| 10887 |
"population": 211087,
|
| 10888 |
+
"score": 0.45
|
| 10889 |
},
|
| 10890 |
{
|
| 10891 |
"name": "German",
|
| 10892 |
"bcp_47": "de",
|
| 10893 |
"population": 294014,
|
| 10894 |
+
"score": 0.49
|
| 10895 |
},
|
| 10896 |
{
|
| 10897 |
"name": "Japanese",
|
| 10898 |
"bcp_47": "ja",
|
| 10899 |
"population": 52772,
|
| 10900 |
+
"score": 0.46
|
| 10901 |
},
|
| 10902 |
{
|
| 10903 |
"name": "Vietnamese",
|
| 10904 |
"bcp_47": "vi",
|
| 10905 |
"population": 184701,
|
| 10906 |
+
"score": 0.45
|
| 10907 |
},
|
| 10908 |
{
|
| 10909 |
"name": "Tamil",
|
| 10910 |
"bcp_47": "ta",
|
| 10911 |
"population": 184701,
|
| 10912 |
+
"score": 0.41
|
| 10913 |
},
|
| 10914 |
{
|
| 10915 |
"name": "Persian",
|
| 10916 |
"bcp_47": "fa",
|
| 10917 |
"population": 245012,
|
| 10918 |
+
"score": 0.41
|
| 10919 |
},
|
| 10920 |
{
|
| 10921 |
"name": "Turkish",
|
| 10922 |
"bcp_47": "tr",
|
| 10923 |
"population": 37694,
|
| 10924 |
+
"score": 0.44
|
| 10925 |
},
|
| 10926 |
{
|
| 10927 |
"name": "Cantonese",
|
| 10928 |
"bcp_47": "yue",
|
| 10929 |
"population": 640800,
|
| 10930 |
+
"score": 0.39
|
| 10931 |
},
|
| 10932 |
{
|
| 10933 |
"name": "Korean",
|
| 10934 |
"bcp_47": "ko",
|
| 10935 |
"population": 169623,
|
| 10936 |
+
"score": 0.41
|
| 10937 |
},
|
| 10938 |
{
|
| 10939 |
"name": "Italian",
|
| 10940 |
"bcp_47": "it",
|
| 10941 |
"population": 343016,
|
| 10942 |
+
"score": 0.47
|
| 10943 |
},
|
| 10944 |
{
|
| 10945 |
"name": "Filipino",
|
| 10946 |
"bcp_47": "fil",
|
| 10947 |
"population": 565412,
|
| 10948 |
+
"score": 0.42
|
| 10949 |
},
|
| 10950 |
{
|
| 10951 |
"name": "Gujarati",
|
| 10952 |
"bcp_47": "gu",
|
| 10953 |
"population": 135699,
|
| 10954 |
+
"score": 0.42
|
| 10955 |
},
|
| 10956 |
{
|
| 10957 |
"name": "Polish",
|
|
|
|
| 11189 |
]
|
| 11190 |
},
|
| 11191 |
"CH": {
|
| 11192 |
+
"score": 0.33368138748580556,
|
| 11193 |
"languages": [
|
| 11194 |
{
|
| 11195 |
"name": "English",
|
|
|
|
| 11207 |
"name": "Portuguese",
|
| 11208 |
"bcp_47": "pt",
|
| 11209 |
"population": 285736,
|
| 11210 |
+
"score": 0.45
|
| 11211 |
},
|
| 11212 |
{
|
| 11213 |
"name": "German",
|
| 11214 |
"bcp_47": "de",
|
| 11215 |
"population": 6134913,
|
| 11216 |
+
"score": 0.49
|
| 11217 |
},
|
| 11218 |
{
|
| 11219 |
"name": "Italian",
|
| 11220 |
"bcp_47": "it",
|
| 11221 |
"population": 361372,
|
| 11222 |
+
"score": 0.47
|
| 11223 |
},
|
| 11224 |
{
|
| 11225 |
"name": "Swiss German",
|
|
|
|
| 11455 |
]
|
| 11456 |
},
|
| 11457 |
"CN": {
|
| 11458 |
+
"score": 0.38724457341349466,
|
| 11459 |
"languages": [
|
| 11460 |
{
|
| 11461 |
"name": "English",
|
|
|
|
| 11473 |
"name": "Russian",
|
| 11474 |
"bcp_47": "ru",
|
| 11475 |
"population": 13940,
|
| 11476 |
+
"score": 0.45
|
| 11477 |
},
|
| 11478 |
{
|
| 11479 |
"name": "Vietnamese",
|
| 11480 |
"bcp_47": "vi",
|
| 11481 |
"population": 6970,
|
| 11482 |
+
"score": 0.45
|
| 11483 |
},
|
| 11484 |
{
|
| 11485 |
"name": "Wu Chinese",
|
|
|
|
| 11491 |
"name": "Cantonese",
|
| 11492 |
"bcp_47": "yue",
|
| 11493 |
"population": 72489040,
|
| 11494 |
+
"score": 0.39
|
| 11495 |
},
|
| 11496 |
{
|
| 11497 |
"name": "Korean",
|
| 11498 |
"bcp_47": "ko",
|
| 11499 |
"population": 2091030,
|
| 11500 |
+
"score": 0.41
|
| 11501 |
},
|
| 11502 |
{
|
| 11503 |
"name": "Xiang Chinese",
|
|
|
|
| 11649 |
]
|
| 11650 |
},
|
| 11651 |
"CY": {
|
| 11652 |
+
"score": 0.2404799926753925,
|
| 11653 |
"languages": [
|
| 11654 |
{
|
| 11655 |
"name": "English",
|
|
|
|
| 11673 |
"name": "Turkish",
|
| 11674 |
"bcp_47": "tr",
|
| 11675 |
"population": 291336,
|
| 11676 |
+
"score": 0.44
|
| 11677 |
},
|
| 11678 |
{
|
| 11679 |
"name": "Greek",
|
|
|
|
| 11690 |
]
|
| 11691 |
},
|
| 11692 |
"CZ": {
|
| 11693 |
+
"score": 0.12805930282531847,
|
| 11694 |
"languages": [
|
| 11695 |
{
|
| 11696 |
"name": "English",
|
|
|
|
| 11702 |
"name": "German",
|
| 11703 |
"bcp_47": "de",
|
| 11704 |
"population": 1605375,
|
| 11705 |
+
"score": 0.49
|
| 11706 |
},
|
| 11707 |
{
|
| 11708 |
"name": "Polish",
|
|
|
|
| 11725 |
]
|
| 11726 |
},
|
| 11727 |
"DE": {
|
| 11728 |
+
"score": 0.3765932308207555,
|
| 11729 |
"languages": [
|
| 11730 |
{
|
| 11731 |
"name": "English",
|
|
|
|
| 11749 |
"name": "Russian",
|
| 11750 |
"bcp_47": "ru",
|
| 11751 |
"population": 4809582,
|
| 11752 |
+
"score": 0.45
|
| 11753 |
},
|
| 11754 |
{
|
| 11755 |
"name": "German",
|
| 11756 |
"bcp_47": "de",
|
| 11757 |
"population": 72945327,
|
| 11758 |
+
"score": 0.49
|
| 11759 |
},
|
| 11760 |
{
|
| 11761 |
"name": "Turkish",
|
| 11762 |
"bcp_47": "tr",
|
| 11763 |
"population": 2003992,
|
| 11764 |
+
"score": 0.44
|
| 11765 |
},
|
| 11766 |
{
|
| 11767 |
"name": "Italian",
|
| 11768 |
"bcp_47": "it",
|
| 11769 |
"population": 5611179,
|
| 11770 |
+
"score": 0.47
|
| 11771 |
},
|
| 11772 |
{
|
| 11773 |
"name": "Polish",
|
|
|
|
| 11891 |
]
|
| 11892 |
},
|
| 11893 |
"DK": {
|
| 11894 |
+
"score": 0.2649269539952979,
|
| 11895 |
"languages": [
|
| 11896 |
{
|
| 11897 |
"name": "English",
|
|
|
|
| 11903 |
"name": "German",
|
| 11904 |
"bcp_47": "de",
|
| 11905 |
"population": 2758623,
|
| 11906 |
+
"score": 0.49
|
| 11907 |
},
|
| 11908 |
{
|
| 11909 |
"name": "Swedish",
|
|
|
|
| 12001 |
]
|
| 12002 |
},
|
| 12003 |
"EE": {
|
| 12004 |
+
"score": 0.23907703243578238,
|
| 12005 |
"languages": [
|
| 12006 |
{
|
| 12007 |
"name": "English",
|
|
|
|
| 12013 |
"name": "Russian",
|
| 12014 |
"bcp_47": "ru",
|
| 12015 |
"population": 688027,
|
| 12016 |
+
"score": 0.45
|
| 12017 |
},
|
| 12018 |
{
|
| 12019 |
"name": "Finnish",
|
|
|
|
| 12042 |
]
|
| 12043 |
},
|
| 12044 |
"EG": {
|
| 12045 |
+
"score": 0.4156717299521135,
|
| 12046 |
"languages": [
|
| 12047 |
{
|
| 12048 |
"name": "English",
|
|
|
|
| 12060 |
"name": "Egyptian Arabic",
|
| 12061 |
"bcp_47": "arz",
|
| 12062 |
"population": 66639360,
|
| 12063 |
+
"score": 0.38
|
| 12064 |
},
|
| 12065 |
{
|
| 12066 |
"name": "Greek",
|
|
|
|
| 12236 |
]
|
| 12237 |
},
|
| 12238 |
"FI": {
|
| 12239 |
+
"score": 0.18533875082776866,
|
| 12240 |
"languages": [
|
| 12241 |
{
|
| 12242 |
"name": "English",
|
|
|
|
| 12248 |
"name": "Russian",
|
| 12249 |
"bcp_47": "ru",
|
| 12250 |
"population": 45131,
|
| 12251 |
+
"score": 0.45
|
| 12252 |
},
|
| 12253 |
{
|
| 12254 |
"name": "German",
|
| 12255 |
"bcp_47": "de",
|
| 12256 |
"population": 1002901,
|
| 12257 |
+
"score": 0.49
|
| 12258 |
},
|
| 12259 |
{
|
| 12260 |
"name": "Swedish",
|
|
|
|
| 12388 |
]
|
| 12389 |
},
|
| 12390 |
"FR": {
|
| 12391 |
+
"score": 0.4436463938115849,
|
| 12392 |
"languages": [
|
| 12393 |
{
|
| 12394 |
"name": "English",
|
|
|
|
| 12412 |
"name": "Portuguese",
|
| 12413 |
"bcp_47": "pt",
|
| 12414 |
"population": 882027,
|
| 12415 |
+
"score": 0.45
|
| 12416 |
},
|
| 12417 |
{
|
| 12418 |
"name": "German",
|
| 12419 |
"bcp_47": "de",
|
| 12420 |
"population": 3392410,
|
| 12421 |
+
"score": 0.49
|
| 12422 |
},
|
| 12423 |
{
|
| 12424 |
"name": "Italian",
|
| 12425 |
"bcp_47": "it",
|
| 12426 |
"population": 1153419,
|
| 12427 |
+
"score": 0.47
|
| 12428 |
},
|
| 12429 |
{
|
| 12430 |
"name": "Dutch",
|
|
|
|
| 12495 |
]
|
| 12496 |
},
|
| 12497 |
"GB": {
|
| 12498 |
+
"score": 0.43956766255639257,
|
| 12499 |
"languages": [
|
| 12500 |
{
|
| 12501 |
"name": "English",
|
|
|
|
| 12543 |
"name": "Portuguese",
|
| 12544 |
"bcp_47": "pt",
|
| 12545 |
"population": 131522,
|
| 12546 |
+
"score": 0.45
|
| 12547 |
},
|
| 12548 |
{
|
| 12549 |
"name": "Punjabi",
|
| 12550 |
"bcp_47": "pa",
|
| 12551 |
"population": 2367400,
|
| 12552 |
+
"score": 0.43
|
| 12553 |
},
|
| 12554 |
{
|
| 12555 |
"name": "German",
|
| 12556 |
"bcp_47": "de",
|
| 12557 |
"population": 5918499,
|
| 12558 |
+
"score": 0.49
|
| 12559 |
},
|
| 12560 |
{
|
| 12561 |
"name": "Tamil",
|
| 12562 |
"bcp_47": "ta",
|
| 12563 |
"population": 2104355,
|
| 12564 |
+
"score": 0.41
|
| 12565 |
},
|
| 12566 |
{
|
| 12567 |
"name": "Turkish",
|
| 12568 |
"bcp_47": "tr",
|
| 12569 |
"population": 131522,
|
| 12570 |
+
"score": 0.44
|
| 12571 |
},
|
| 12572 |
{
|
| 12573 |
"name": "Italian",
|
| 12574 |
"bcp_47": "it",
|
| 12575 |
"population": 131522,
|
| 12576 |
+
"score": 0.47
|
| 12577 |
},
|
| 12578 |
{
|
| 12579 |
"name": "Gujarati",
|
| 12580 |
"bcp_47": "gu",
|
| 12581 |
"population": 1907072,
|
| 12582 |
+
"score": 0.42
|
| 12583 |
},
|
| 12584 |
{
|
| 12585 |
"name": "Polish",
|
|
|
|
| 12765 |
]
|
| 12766 |
},
|
| 12767 |
"GR": {
|
| 12768 |
+
"score": 0.18194383576443016,
|
| 12769 |
"languages": [
|
| 12770 |
{
|
| 12771 |
"name": "English",
|
|
|
|
| 12783 |
"name": "German",
|
| 12784 |
"bcp_47": "de",
|
| 12785 |
"population": 530355,
|
| 12786 |
+
"score": 0.49
|
| 12787 |
},
|
| 12788 |
{
|
| 12789 |
"name": "Turkish",
|
| 12790 |
"bcp_47": "tr",
|
| 12791 |
"population": 127285,
|
| 12792 |
+
"score": 0.44
|
| 12793 |
},
|
| 12794 |
{
|
| 12795 |
"name": "Greek",
|
|
|
|
| 12869 |
]
|
| 12870 |
},
|
| 12871 |
"HK": {
|
| 12872 |
+
"score": 0.4359751035397035,
|
| 12873 |
"languages": [
|
| 12874 |
{
|
| 12875 |
"name": "English",
|
|
|
|
| 12887 |
"name": "Cantonese",
|
| 12888 |
"bcp_47": "yue",
|
| 12889 |
"population": 6524919,
|
| 12890 |
+
"score": 0.39
|
| 12891 |
}
|
| 12892 |
]
|
| 12893 |
},
|
|
|
|
| 12920 |
]
|
| 12921 |
},
|
| 12922 |
"HR": {
|
| 12923 |
+
"score": 0.15823024946225459,
|
| 12924 |
"languages": [
|
| 12925 |
{
|
| 12926 |
"name": "English",
|
|
|
|
| 12932 |
"name": "Italian",
|
| 12933 |
"bcp_47": "it",
|
| 12934 |
"population": 67644,
|
| 12935 |
+
"score": 0.47
|
| 12936 |
},
|
| 12937 |
{
|
| 12938 |
"name": "Croatian",
|
|
|
|
| 12949 |
]
|
| 12950 |
},
|
| 12951 |
"HU": {
|
| 12952 |
+
"score": 0.13756219151316587,
|
| 12953 |
"languages": [
|
| 12954 |
{
|
| 12955 |
"name": "English",
|
|
|
|
| 12967 |
"name": "German",
|
| 12968 |
"bcp_47": "de",
|
| 12969 |
"population": 1758929,
|
| 12970 |
+
"score": 0.49
|
| 12971 |
},
|
| 12972 |
{
|
| 12973 |
"name": "Romanian",
|
|
|
|
| 13025 |
]
|
| 13026 |
},
|
| 13027 |
"IL": {
|
| 13028 |
+
"score": 0.21817259544999,
|
| 13029 |
"languages": [
|
| 13030 |
{
|
| 13031 |
"name": "English",
|
|
|
|
| 13043 |
"name": "Russian",
|
| 13044 |
"bcp_47": "ru",
|
| 13045 |
"population": 954303,
|
| 13046 |
+
"score": 0.45
|
| 13047 |
},
|
| 13048 |
{
|
| 13049 |
"name": "Malayalam",
|
|
|
|
| 13125 |
]
|
| 13126 |
},
|
| 13127 |
"IN": {
|
| 13128 |
+
"score": 0.3397907454052606,
|
| 13129 |
"languages": [
|
| 13130 |
{
|
| 13131 |
"name": "English",
|
|
|
|
| 13155 |
"name": "Punjabi",
|
| 13156 |
"bcp_47": "pa",
|
| 13157 |
"population": 37130520,
|
| 13158 |
+
"score": 0.43
|
| 13159 |
},
|
| 13160 |
{
|
| 13161 |
"name": "Telugu",
|
| 13162 |
"bcp_47": "te",
|
| 13163 |
"population": 95478480,
|
| 13164 |
+
"score": 0.41
|
| 13165 |
},
|
| 13166 |
{
|
| 13167 |
"name": "Western Panjabi",
|
|
|
|
| 13173 |
"name": "Marathi",
|
| 13174 |
"bcp_47": "mr",
|
| 13175 |
"population": 92826300,
|
| 13176 |
+
"score": 0.45
|
| 13177 |
},
|
| 13178 |
{
|
| 13179 |
"name": "Tamil",
|
| 13180 |
"bcp_47": "ta",
|
| 13181 |
"population": 78239310,
|
| 13182 |
+
"score": 0.41
|
| 13183 |
},
|
| 13184 |
{
|
| 13185 |
"name": "Gujarati",
|
| 13186 |
"bcp_47": "gu",
|
| 13187 |
"population": 59674050,
|
| 13188 |
+
"score": 0.42
|
| 13189 |
},
|
| 13190 |
{
|
| 13191 |
"name": "Kannada",
|
|
|
|
| 13603 |
]
|
| 13604 |
},
|
| 13605 |
"IQ": {
|
| 13606 |
+
"score": 0.357837983423388,
|
| 13607 |
"languages": [
|
| 13608 |
{
|
| 13609 |
"name": "English",
|
|
|
|
| 13621 |
"name": "Persian",
|
| 13622 |
"bcp_47": "fa",
|
| 13623 |
"population": 338192,
|
| 13624 |
+
"score": 0.41
|
| 13625 |
},
|
| 13626 |
{
|
| 13627 |
"name": "Azerbaijani",
|
|
|
|
| 13650 |
]
|
| 13651 |
},
|
| 13652 |
"IT": {
|
| 13653 |
+
"score": 0.43224641662655555,
|
| 13654 |
"languages": [
|
| 13655 |
{
|
| 13656 |
"name": "English",
|
|
|
|
| 13668 |
"name": "German",
|
| 13669 |
"bcp_47": "de",
|
| 13670 |
"population": 998443,
|
| 13671 |
+
"score": 0.49
|
| 13672 |
},
|
| 13673 |
{
|
| 13674 |
"name": "Italian",
|
| 13675 |
"bcp_47": "it",
|
| 13676 |
"population": 59282565,
|
| 13677 |
+
"score": 0.47
|
| 13678 |
},
|
| 13679 |
{
|
| 13680 |
"name": "Greek",
|
|
|
|
| 13820 |
]
|
| 13821 |
},
|
| 13822 |
"KE": {
|
| 13823 |
+
"score": 0.2501476621404106,
|
| 13824 |
"languages": [
|
| 13825 |
{
|
| 13826 |
"name": "English",
|
|
|
|
| 13838 |
"name": "Punjabi",
|
| 13839 |
"bcp_47": "pa",
|
| 13840 |
"population": 10170,
|
| 13841 |
+
"score": 0.43
|
| 13842 |
},
|
| 13843 |
{
|
| 13844 |
"name": "Swahili",
|
| 13845 |
"bcp_47": "sw",
|
| 13846 |
"population": 35328414,
|
| 13847 |
+
"score": 0.45
|
| 13848 |
},
|
| 13849 |
{
|
| 13850 |
"name": "Gujarati",
|
| 13851 |
"bcp_47": "gu",
|
| 13852 |
"population": 4978,
|
| 13853 |
+
"score": 0.42
|
| 13854 |
},
|
| 13855 |
{
|
| 13856 |
"name": "Oromo",
|
|
|
|
| 13984 |
]
|
| 13985 |
},
|
| 13986 |
"KZ": {
|
| 13987 |
+
"score": 0.2671643693028198,
|
| 13988 |
"languages": [
|
| 13989 |
{
|
| 13990 |
"name": "English",
|
|
|
|
| 13996 |
"name": "Russian",
|
| 13997 |
"bcp_47": "ru",
|
| 13998 |
"population": 13746168,
|
| 13999 |
+
"score": 0.45
|
| 14000 |
},
|
| 14001 |
{
|
| 14002 |
"name": "German",
|
| 14003 |
"bcp_47": "de",
|
| 14004 |
"population": 1221882,
|
| 14005 |
+
"score": 0.49
|
| 14006 |
},
|
| 14007 |
{
|
| 14008 |
"name": "Kazakh",
|
|
|
|
| 14071 |
]
|
| 14072 |
},
|
| 14073 |
"LK": {
|
| 14074 |
+
"score": 0.11666666666666665,
|
| 14075 |
"languages": [
|
| 14076 |
{
|
| 14077 |
"name": "English",
|
|
|
|
| 14083 |
"name": "Tamil",
|
| 14084 |
"bcp_47": "ta",
|
| 14085 |
"population": 3433380,
|
| 14086 |
+
"score": 0.41
|
| 14087 |
},
|
| 14088 |
{
|
| 14089 |
"name": "Sinhala",
|
|
|
|
| 14164 |
]
|
| 14165 |
},
|
| 14166 |
"LT": {
|
| 14167 |
+
"score": 0.2785320836068621,
|
| 14168 |
"languages": [
|
| 14169 |
{
|
| 14170 |
"name": "English",
|
|
|
|
| 14176 |
"name": "Russian",
|
| 14177 |
"bcp_47": "ru",
|
| 14178 |
"population": 2185168,
|
| 14179 |
+
"score": 0.45
|
| 14180 |
},
|
| 14181 |
{
|
| 14182 |
"name": "German",
|
| 14183 |
"bcp_47": "de",
|
| 14184 |
"population": 382404,
|
| 14185 |
+
"score": 0.49
|
| 14186 |
},
|
| 14187 |
{
|
| 14188 |
"name": "Lithuanian",
|
|
|
|
| 14199 |
]
|
| 14200 |
},
|
| 14201 |
"LU": {
|
| 14202 |
+
"score": 0.3612802832567923,
|
| 14203 |
"languages": [
|
| 14204 |
{
|
| 14205 |
"name": "English",
|
|
|
|
| 14217 |
"name": "Portuguese",
|
| 14218 |
"bcp_47": "pt",
|
| 14219 |
"population": 100541,
|
| 14220 |
+
"score": 0.45
|
| 14221 |
},
|
| 14222 |
{
|
| 14223 |
"name": "German",
|
| 14224 |
"bcp_47": "de",
|
| 14225 |
"population": 395880,
|
| 14226 |
+
"score": 0.49
|
| 14227 |
},
|
| 14228 |
{
|
| 14229 |
"name": "Luxembourgish",
|
|
|
|
| 14234 |
]
|
| 14235 |
},
|
| 14236 |
"LV": {
|
| 14237 |
+
"score": 0.2515919974081345,
|
| 14238 |
"languages": [
|
| 14239 |
{
|
| 14240 |
"name": "English",
|
|
|
|
| 14246 |
"name": "Russian",
|
| 14247 |
"bcp_47": "ru",
|
| 14248 |
"population": 714867,
|
| 14249 |
+
"score": 0.45
|
| 14250 |
},
|
| 14251 |
{
|
| 14252 |
"name": "Latvian",
|
|
|
|
| 14362 |
]
|
| 14363 |
},
|
| 14364 |
"MO": {
|
| 14365 |
+
"score": 0.4597552187538731,
|
| 14366 |
"languages": [
|
| 14367 |
{
|
| 14368 |
"name": "English",
|
|
|
|
| 14380 |
"name": "Portuguese",
|
| 14381 |
"bcp_47": "pt",
|
| 14382 |
"population": 30723,
|
| 14383 |
+
"score": 0.45
|
| 14384 |
}
|
| 14385 |
]
|
| 14386 |
},
|
|
|
|
| 14413 |
]
|
| 14414 |
},
|
| 14415 |
"MT": {
|
| 14416 |
+
"score": 0.28525492889983195,
|
| 14417 |
"languages": [
|
| 14418 |
{
|
| 14419 |
"name": "English",
|
|
|
|
| 14431 |
"name": "Italian",
|
| 14432 |
"bcp_47": "it",
|
| 14433 |
"population": 256070,
|
| 14434 |
+
"score": 0.47
|
| 14435 |
},
|
| 14436 |
{
|
| 14437 |
"name": "Maltese",
|
|
|
|
| 14442 |
]
|
| 14443 |
},
|
| 14444 |
"MU": {
|
| 14445 |
+
"score": 0.19243355389764255,
|
| 14446 |
"languages": [
|
| 14447 |
{
|
| 14448 |
"name": "English",
|
|
|
|
| 14466 |
"name": "Tamil",
|
| 14467 |
"bcp_47": "ta",
|
| 14468 |
"population": 34484,
|
| 14469 |
+
"score": 0.41
|
| 14470 |
},
|
| 14471 |
{
|
| 14472 |
"name": "Bhojpuri",
|
|
|
|
| 14594 |
]
|
| 14595 |
},
|
| 14596 |
"MY": {
|
| 14597 |
+
"score": 0.1619475361727729,
|
| 14598 |
"languages": [
|
| 14599 |
{
|
| 14600 |
"name": "English",
|
|
|
|
| 14612 |
"name": "Javanese",
|
| 14613 |
"bcp_47": "jv",
|
| 14614 |
"population": 391825,
|
| 14615 |
+
"score": 0.41
|
| 14616 |
},
|
| 14617 |
{
|
| 14618 |
"name": "Tamil",
|
| 14619 |
"bcp_47": "ta",
|
| 14620 |
"population": 1371388,
|
| 14621 |
+
"score": 0.41
|
| 14622 |
},
|
| 14623 |
{
|
| 14624 |
"name": "Malayalam",
|
|
|
|
| 14665 |
]
|
| 14666 |
},
|
| 14667 |
"NA": {
|
| 14668 |
+
"score": 0.023383111654627774,
|
| 14669 |
"languages": [
|
| 14670 |
{
|
| 14671 |
"name": "English",
|
|
|
|
| 14677 |
"name": "German",
|
| 14678 |
"bcp_47": "de",
|
| 14679 |
"population": 23671,
|
| 14680 |
+
"score": 0.49
|
| 14681 |
},
|
| 14682 |
{
|
| 14683 |
"name": "Afrikaans",
|
|
|
|
| 14836 |
]
|
| 14837 |
},
|
| 14838 |
"NL": {
|
| 14839 |
+
"score": 0.28688749989149553,
|
| 14840 |
"languages": [
|
| 14841 |
{
|
| 14842 |
"name": "English",
|
|
|
|
| 14854 |
"name": "Indonesian",
|
| 14855 |
"bcp_47": "id",
|
| 14856 |
"population": 311047,
|
| 14857 |
+
"score": 0.47
|
| 14858 |
},
|
| 14859 |
{
|
| 14860 |
"name": "German",
|
| 14861 |
"bcp_47": "de",
|
| 14862 |
"population": 12269084,
|
| 14863 |
+
"score": 0.49
|
| 14864 |
},
|
| 14865 |
{
|
| 14866 |
"name": "Turkish",
|
| 14867 |
"bcp_47": "tr",
|
| 14868 |
"population": 207365,
|
| 14869 |
+
"score": 0.44
|
| 14870 |
},
|
| 14871 |
{
|
| 14872 |
"name": "Dutch",
|
|
|
|
| 15183 |
]
|
| 15184 |
},
|
| 15185 |
"PH": {
|
| 15186 |
+
"score": 0.32615211365536473,
|
| 15187 |
"languages": [
|
| 15188 |
{
|
| 15189 |
"name": "English",
|
|
|
|
| 15207 |
"name": "Filipino",
|
| 15208 |
"bcp_47": "fil",
|
| 15209 |
"population": 65508600,
|
| 15210 |
+
"score": 0.42
|
| 15211 |
},
|
| 15212 |
{
|
| 15213 |
"name": "Cebuano",
|
|
|
|
| 15308 |
]
|
| 15309 |
},
|
| 15310 |
"PK": {
|
| 15311 |
+
"score": 0.30567966556461956,
|
| 15312 |
"languages": [
|
| 15313 |
{
|
| 15314 |
"name": "English",
|
|
|
|
| 15326 |
"name": "Punjabi",
|
| 15327 |
"bcp_47": "pa",
|
| 15328 |
"population": 163450700,
|
| 15329 |
+
"score": 0.43
|
| 15330 |
},
|
| 15331 |
{
|
| 15332 |
"name": "Western Panjabi",
|
|
|
|
| 15338 |
"name": "Persian",
|
| 15339 |
"bcp_47": "fa",
|
| 15340 |
"population": 1541107,
|
| 15341 |
+
"score": 0.41
|
| 15342 |
},
|
| 15343 |
{
|
| 15344 |
"name": "Pashto",
|
|
|
|
| 15457 |
]
|
| 15458 |
},
|
| 15459 |
"PL": {
|
| 15460 |
+
"score": 0.19542647519424666,
|
| 15461 |
"languages": [
|
| 15462 |
{
|
| 15463 |
"name": "English",
|
|
|
|
| 15469 |
"name": "Russian",
|
| 15470 |
"bcp_47": "ru",
|
| 15471 |
"population": 6890814,
|
| 15472 |
+
"score": 0.45
|
| 15473 |
},
|
| 15474 |
{
|
| 15475 |
"name": "German",
|
| 15476 |
"bcp_47": "de",
|
| 15477 |
"population": 7273637,
|
| 15478 |
+
"score": 0.49
|
| 15479 |
},
|
| 15480 |
{
|
| 15481 |
"name": "Polish",
|
|
|
|
| 15573 |
]
|
| 15574 |
},
|
| 15575 |
"PT": {
|
| 15576 |
+
"score": 0.4542324762390237,
|
| 15577 |
"languages": [
|
| 15578 |
{
|
| 15579 |
"name": "English",
|
|
|
|
| 15597 |
"name": "Portuguese",
|
| 15598 |
"bcp_47": "pt",
|
| 15599 |
"population": 9890592,
|
| 15600 |
+
"score": 0.45
|
| 15601 |
},
|
| 15602 |
{
|
| 15603 |
"name": "Galician",
|
|
|
|
| 15625 |
]
|
| 15626 |
},
|
| 15627 |
"RO": {
|
| 15628 |
+
"score": 0.1743772772485309,
|
| 15629 |
"languages": [
|
| 15630 |
{
|
| 15631 |
"name": "English",
|
|
|
|
| 15649 |
"name": "German",
|
| 15650 |
"bcp_47": "de",
|
| 15651 |
"population": 44736,
|
| 15652 |
+
"score": 0.49
|
| 15653 |
},
|
| 15654 |
{
|
| 15655 |
"name": "Turkish",
|
| 15656 |
"bcp_47": "tr",
|
| 15657 |
"population": 27694,
|
| 15658 |
+
"score": 0.44
|
| 15659 |
},
|
| 15660 |
{
|
| 15661 |
"name": "Polish",
|
|
|
|
| 15883 |
]
|
| 15884 |
},
|
| 15885 |
"SG": {
|
| 15886 |
+
"score": 0.4294592881506046,
|
| 15887 |
"languages": [
|
| 15888 |
{
|
| 15889 |
"name": "English",
|
|
|
|
| 15901 |
"name": "Punjabi",
|
| 15902 |
"bcp_47": "pa",
|
| 15903 |
"population": 9314,
|
| 15904 |
+
"score": 0.43
|
| 15905 |
},
|
| 15906 |
{
|
| 15907 |
"name": "Tamil",
|
| 15908 |
"bcp_47": "ta",
|
| 15909 |
"population": 130403,
|
| 15910 |
+
"score": 0.41
|
| 15911 |
},
|
| 15912 |
{
|
| 15913 |
"name": "Malayalam",
|
|
|
|
| 15935 |
]
|
| 15936 |
},
|
| 15937 |
"SI": {
|
| 15938 |
+
"score": 0.1928028123892293,
|
| 15939 |
"languages": [
|
| 15940 |
{
|
| 15941 |
"name": "English",
|
|
|
|
| 15947 |
"name": "German",
|
| 15948 |
"bcp_47": "de",
|
| 15949 |
"population": 883126,
|
| 15950 |
+
"score": 0.49
|
| 15951 |
},
|
| 15952 |
{
|
| 15953 |
"name": "Italian",
|
| 15954 |
"bcp_47": "it",
|
| 15955 |
"population": 3995,
|
| 15956 |
+
"score": 0.47
|
| 15957 |
},
|
| 15958 |
{
|
| 15959 |
"name": "Hungarian",
|
|
|
|
| 15982 |
]
|
| 15983 |
},
|
| 15984 |
"SK": {
|
| 15985 |
+
"score": 0.11567670853229638,
|
| 15986 |
"languages": [
|
| 15987 |
{
|
| 15988 |
"name": "English",
|
|
|
|
| 15994 |
"name": "German",
|
| 15995 |
"bcp_47": "de",
|
| 15996 |
"population": 1196932,
|
| 15997 |
+
"score": 0.49
|
| 15998 |
},
|
| 15999 |
{
|
| 16000 |
"name": "Polish",
|
|
|
|
| 16290 |
]
|
| 16291 |
},
|
| 16292 |
"TR": {
|
| 16293 |
+
"score": 0.38853953080443926,
|
| 16294 |
"languages": [
|
| 16295 |
{
|
| 16296 |
"name": "English",
|
|
|
|
| 16308 |
"name": "Turkish",
|
| 16309 |
"bcp_47": "tr",
|
| 16310 |
"population": 76276275,
|
| 16311 |
+
"score": 0.44
|
| 16312 |
},
|
| 16313 |
{
|
| 16314 |
"name": "North Levantine Arabic",
|
|
|
|
| 16467 |
]
|
| 16468 |
},
|
| 16469 |
"TZ": {
|
| 16470 |
+
"score": 0.3952631230768349,
|
| 16471 |
"languages": [
|
| 16472 |
{
|
| 16473 |
"name": "English",
|
|
|
|
| 16479 |
"name": "Swahili",
|
| 16480 |
"bcp_47": "sw",
|
| 16481 |
"population": 52697520,
|
| 16482 |
+
"score": 0.45
|
| 16483 |
},
|
| 16484 |
{
|
| 16485 |
"name": "Sukuma",
|
|
|
|
| 16568 |
]
|
| 16569 |
},
|
| 16570 |
"UG": {
|
| 16571 |
+
"score": 0.2797477934487195,
|
| 16572 |
"languages": [
|
| 16573 |
{
|
| 16574 |
"name": "English",
|
|
|
|
| 16586 |
"name": "Swahili",
|
| 16587 |
"bcp_47": "sw",
|
| 16588 |
"population": 32439750,
|
| 16589 |
+
"score": 0.45
|
| 16590 |
},
|
| 16591 |
{
|
| 16592 |
"name": "Kinyarwanda",
|
|
|
|
| 16662 |
]
|
| 16663 |
},
|
| 16664 |
"US": {
|
| 16665 |
+
"score": 0.46680423711359387,
|
| 16666 |
"languages": [
|
| 16667 |
{
|
| 16668 |
"name": "English",
|
|
|
|
| 16692 |
"name": "Russian",
|
| 16693 |
"bcp_47": "ru",
|
| 16694 |
"population": 798334,
|
| 16695 |
+
"score": 0.45
|
| 16696 |
},
|
| 16697 |
{
|
| 16698 |
"name": "German",
|
| 16699 |
"bcp_47": "de",
|
| 16700 |
"population": 1563403,
|
| 16701 |
+
"score": 0.49
|
| 16702 |
},
|
| 16703 |
{
|
| 16704 |
"name": "Vietnamese",
|
| 16705 |
"bcp_47": "vi",
|
| 16706 |
"population": 1130973,
|
| 16707 |
+
"score": 0.45
|
| 16708 |
},
|
| 16709 |
{
|
| 16710 |
"name": "Korean",
|
| 16711 |
"bcp_47": "ko",
|
| 16712 |
"population": 997917,
|
| 16713 |
+
"score": 0.41
|
| 16714 |
},
|
| 16715 |
{
|
| 16716 |
"name": "Italian",
|
| 16717 |
"bcp_47": "it",
|
| 16718 |
"population": 1130973,
|
| 16719 |
+
"score": 0.47
|
| 16720 |
},
|
| 16721 |
{
|
| 16722 |
"name": "Filipino",
|
| 16723 |
"bcp_47": "fil",
|
| 16724 |
"population": 1397084,
|
| 16725 |
+
"score": 0.42
|
| 16726 |
},
|
| 16727 |
{
|
| 16728 |
"name": "Yiddish",
|
|
|
|
| 16925 |
]
|
| 16926 |
},
|
| 16927 |
"ZA": {
|
| 16928 |
+
"score": 0.12442237800209865,
|
| 16929 |
"languages": [
|
| 16930 |
{
|
| 16931 |
"name": "English",
|
|
|
|
| 16943 |
"name": "Swahili",
|
| 16944 |
"bcp_47": "sw",
|
| 16945 |
"population": 1016,
|
| 16946 |
+
"score": 0.45
|
| 16947 |
},
|
| 16948 |
{
|
| 16949 |
"name": "Zulu",
|
|
|
|
| 17125 |
]
|
| 17126 |
},
|
| 17127 |
"ID": {
|
| 17128 |
+
"score": 0.3194548673228042,
|
| 17129 |
"languages": [
|
| 17130 |
{
|
| 17131 |
"name": "Chinese",
|
|
|
|
| 17137 |
"name": "Indonesian",
|
| 17138 |
"bcp_47": "id",
|
| 17139 |
"population": 170896640,
|
| 17140 |
+
"score": 0.47
|
| 17141 |
},
|
| 17142 |
{
|
| 17143 |
"name": "Javanese",
|
| 17144 |
"bcp_47": "jv",
|
| 17145 |
"population": 90788840,
|
| 17146 |
+
"score": 0.41
|
| 17147 |
},
|
| 17148 |
{
|
| 17149 |
"name": "Malay",
|
|
|
|
| 17304 |
]
|
| 17305 |
},
|
| 17306 |
"MN": {
|
| 17307 |
+
"score": 0.006903243016889744,
|
| 17308 |
"languages": [
|
| 17309 |
{
|
| 17310 |
"name": "Chinese",
|
|
|
|
| 17316 |
"name": "Russian",
|
| 17317 |
"bcp_47": "ru",
|
| 17318 |
"population": 4118,
|
| 17319 |
+
"score": 0.45
|
| 17320 |
},
|
| 17321 |
{
|
| 17322 |
"name": "Kazakh",
|
|
|
|
| 17408 |
]
|
| 17409 |
},
|
| 17410 |
"VN": {
|
| 17411 |
+
"score": 0.44527479082463184,
|
| 17412 |
"languages": [
|
| 17413 |
{
|
| 17414 |
"name": "Chinese",
|
|
|
|
| 17420 |
"name": "Vietnamese",
|
| 17421 |
"bcp_47": "vi",
|
| 17422 |
"population": 84900318,
|
| 17423 |
+
"score": 0.45
|
| 17424 |
},
|
| 17425 |
{
|
| 17426 |
"name": "Hmong Njua",
|
|
|
|
| 17603 |
]
|
| 17604 |
},
|
| 17605 |
"GQ": {
|
| 17606 |
+
"score": 0.27923739669086073,
|
| 17607 |
"languages": [
|
| 17608 |
{
|
| 17609 |
"name": "Spanish",
|
|
|
|
| 17621 |
"name": "Portuguese",
|
| 17622 |
"bcp_47": "pt",
|
| 17623 |
"population": 1,
|
| 17624 |
+
"score": 0.45
|
| 17625 |
},
|
| 17626 |
{
|
| 17627 |
"name": "Fang",
|
|
|
|
| 17700 |
]
|
| 17701 |
},
|
| 17702 |
"PY": {
|
| 17703 |
+
"score": 0.03322879759433273,
|
| 17704 |
"languages": [
|
| 17705 |
{
|
| 17706 |
"name": "Spanish",
|
|
|
|
| 17712 |
"name": "German",
|
| 17713 |
"bcp_47": "de",
|
| 17714 |
"population": 208559,
|
| 17715 |
+
"score": 0.49
|
| 17716 |
},
|
| 17717 |
{
|
| 17718 |
"name": "Guarani",
|
|
|
|
| 17819 |
]
|
| 17820 |
},
|
| 17821 |
"IR": {
|
| 17822 |
+
"score": 0.23949254115959248,
|
| 17823 |
"languages": [
|
| 17824 |
{
|
| 17825 |
"name": "Arabic",
|
|
|
|
| 17831 |
"name": "Persian",
|
| 17832 |
"bcp_47": "fa",
|
| 17833 |
"population": 63692475,
|
| 17834 |
+
"score": 0.41
|
| 17835 |
},
|
| 17836 |
{
|
| 17837 |
"name": "Pashto",
|
|
|
|
| 18166 |
]
|
| 18167 |
},
|
| 18168 |
"OM": {
|
| 18169 |
+
"score": 0.3961930102252659,
|
| 18170 |
"languages": [
|
| 18171 |
{
|
| 18172 |
"name": "Arabic",
|
|
|
|
| 18178 |
"name": "Persian",
|
| 18179 |
"bcp_47": "fa",
|
| 18180 |
"population": 43849,
|
| 18181 |
+
"score": 0.41
|
| 18182 |
},
|
| 18183 |
{
|
| 18184 |
"name": "Baluchi",
|
|
|
|
| 18206 |
]
|
| 18207 |
},
|
| 18208 |
"QA": {
|
| 18209 |
+
"score": 0.41777205848450016,
|
| 18210 |
"languages": [
|
| 18211 |
{
|
| 18212 |
"name": "Arabic",
|
|
|
|
| 18218 |
"name": "Persian",
|
| 18219 |
"bcp_47": "fa",
|
| 18220 |
"population": 268859,
|
| 18221 |
+
"score": 0.41
|
| 18222 |
},
|
| 18223 |
{
|
| 18224 |
"name": "Malayalam",
|
|
|
|
| 18246 |
]
|
| 18247 |
},
|
| 18248 |
"SO": {
|
| 18249 |
+
"score": 0.1326691120161243,
|
| 18250 |
"languages": [
|
| 18251 |
{
|
| 18252 |
"name": "Arabic",
|
|
|
|
| 18258 |
"name": "Swahili",
|
| 18259 |
"bcp_47": "sw",
|
| 18260 |
"population": 235142,
|
| 18261 |
+
"score": 0.45
|
| 18262 |
},
|
| 18263 |
{
|
| 18264 |
"name": "Oromo",
|
|
|
|
| 18333 |
]
|
| 18334 |
},
|
| 18335 |
"TJ": {
|
| 18336 |
+
"score": 0.05075244729560809,
|
| 18337 |
"languages": [
|
| 18338 |
{
|
| 18339 |
"name": "Arabic",
|
|
|
|
| 18345 |
"name": "Russian",
|
| 18346 |
"bcp_47": "ru",
|
| 18347 |
"population": 1064840,
|
| 18348 |
+
"score": 0.45
|
| 18349 |
},
|
| 18350 |
{
|
| 18351 |
"name": "Persian",
|
| 18352 |
"bcp_47": "fa",
|
| 18353 |
"population": 69215,
|
| 18354 |
+
"score": 0.41
|
| 18355 |
},
|
| 18356 |
{
|
| 18357 |
"name": "Tajik",
|
|
|
|
| 18454 |
]
|
| 18455 |
},
|
| 18456 |
"CD": {
|
| 18457 |
+
"score": 0.34013185580025246,
|
| 18458 |
"languages": [
|
| 18459 |
{
|
| 18460 |
"name": "French",
|
|
|
|
| 18466 |
"name": "Swahili",
|
| 18467 |
"bcp_47": "sw",
|
| 18468 |
"population": 50890000,
|
| 18469 |
+
"score": 0.45
|
| 18470 |
},
|
| 18471 |
{
|
| 18472 |
"name": "Kinyarwanda",
|
|
|
|
| 18718 |
]
|
| 18719 |
},
|
| 18720 |
"RE": {
|
| 18721 |
+
"score": 0.26908571814147125,
|
| 18722 |
"languages": [
|
| 18723 |
{
|
| 18724 |
"name": "French",
|
|
|
|
| 18730 |
"name": "Tamil",
|
| 18731 |
"bcp_47": "ta",
|
| 18732 |
"population": 118138,
|
| 18733 |
+
"score": 0.41
|
| 18734 |
},
|
| 18735 |
{
|
| 18736 |
"name": "Réunion Creole French",
|
|
|
|
| 18887 |
]
|
| 18888 |
},
|
| 18889 |
"YT": {
|
| 18890 |
+
"score": 0.15850059031877214,
|
| 18891 |
"languages": [
|
| 18892 |
{
|
| 18893 |
"name": "French",
|
|
|
|
| 18899 |
"name": "Swahili",
|
| 18900 |
"bcp_47": "sw",
|
| 18901 |
"population": 2716,
|
| 18902 |
+
"score": 0.45
|
| 18903 |
},
|
| 18904 |
{
|
| 18905 |
"name": "Comorian",
|
|
|
|
| 18916 |
]
|
| 18917 |
},
|
| 18918 |
"AO": {
|
| 18919 |
+
"score": 0.2478014326653792,
|
| 18920 |
"languages": [
|
| 18921 |
{
|
| 18922 |
"name": "Portuguese",
|
| 18923 |
"bcp_47": "pt",
|
| 18924 |
"population": 21789941,
|
| 18925 |
+
"score": 0.45
|
| 18926 |
},
|
| 18927 |
{
|
| 18928 |
"name": "Umbundu",
|
|
|
|
| 18945 |
]
|
| 18946 |
},
|
| 18947 |
"CV": {
|
| 18948 |
+
"score": 0.20479048002332564,
|
| 18949 |
"languages": [
|
| 18950 |
{
|
| 18951 |
"name": "Portuguese",
|
| 18952 |
"bcp_47": "pt",
|
| 18953 |
"population": 443274,
|
| 18954 |
+
"score": 0.45
|
| 18955 |
},
|
| 18956 |
{
|
| 18957 |
"name": "Kabuverdianu",
|
|
|
|
| 18962 |
]
|
| 18963 |
},
|
| 18964 |
"GW": {
|
| 18965 |
+
"score": 0.43859551519338624,
|
| 18966 |
"languages": [
|
| 18967 |
{
|
| 18968 |
"name": "Portuguese",
|
| 18969 |
"bcp_47": "pt",
|
| 18970 |
"population": 1927100,
|
| 18971 |
+
"score": 0.45
|
| 18972 |
},
|
| 18973 |
{
|
| 18974 |
"name": "Fula",
|
|
|
|
| 18985 |
]
|
| 18986 |
},
|
| 18987 |
"MZ": {
|
| 18988 |
+
"score": 0.1480934184335346,
|
| 18989 |
"languages": [
|
| 18990 |
{
|
| 18991 |
"name": "Portuguese",
|
| 18992 |
"bcp_47": "pt",
|
| 18993 |
"population": 8126514,
|
| 18994 |
+
"score": 0.45
|
| 18995 |
},
|
| 18996 |
{
|
| 18997 |
"name": "Swahili",
|
| 18998 |
"bcp_47": "sw",
|
| 18999 |
"population": 9330,
|
| 19000 |
+
"score": 0.45
|
| 19001 |
},
|
| 19002 |
{
|
| 19003 |
"name": "Nyanja",
|
|
|
|
| 19062 |
]
|
| 19063 |
},
|
| 19064 |
"ST": {
|
| 19065 |
+
"score": 0.45,
|
| 19066 |
"languages": [
|
| 19067 |
{
|
| 19068 |
"name": "Portuguese",
|
| 19069 |
"bcp_47": "pt",
|
| 19070 |
"population": 179454,
|
| 19071 |
+
"score": 0.45
|
| 19072 |
}
|
| 19073 |
]
|
| 19074 |
},
|
| 19075 |
"TL": {
|
| 19076 |
+
"score": 0.225,
|
| 19077 |
"languages": [
|
| 19078 |
{
|
| 19079 |
"name": "Portuguese",
|
| 19080 |
"bcp_47": "pt",
|
| 19081 |
"population": 816395,
|
| 19082 |
+
"score": 0.45
|
| 19083 |
},
|
| 19084 |
{
|
| 19085 |
"name": "Tetum",
|
|
|
|
| 19090 |
]
|
| 19091 |
},
|
| 19092 |
"BY": {
|
| 19093 |
+
"score": 0.04821427057437069,
|
| 19094 |
"languages": [
|
| 19095 |
{
|
| 19096 |
"name": "Russian",
|
| 19097 |
"bcp_47": "ru",
|
| 19098 |
"population": 1137350,
|
| 19099 |
+
"score": 0.45
|
| 19100 |
},
|
| 19101 |
{
|
| 19102 |
"name": "Belarusian",
|
|
|
|
| 19107 |
]
|
| 19108 |
},
|
| 19109 |
"GE": {
|
| 19110 |
+
"score": 0.03423789210395573,
|
| 19111 |
"languages": [
|
| 19112 |
{
|
| 19113 |
"name": "Russian",
|
| 19114 |
"bcp_47": "ru",
|
| 19115 |
"population": 359730,
|
| 19116 |
+
"score": 0.45
|
| 19117 |
},
|
| 19118 |
{
|
| 19119 |
"name": "Kurdish",
|
|
|
|
| 19154 |
]
|
| 19155 |
},
|
| 19156 |
"KG": {
|
| 19157 |
+
"score": 0.19285714285714287,
|
| 19158 |
"languages": [
|
| 19159 |
{
|
| 19160 |
"name": "Russian",
|
| 19161 |
"bcp_47": "ru",
|
| 19162 |
"population": 2147364,
|
| 19163 |
+
"score": 0.45
|
| 19164 |
},
|
| 19165 |
{
|
| 19166 |
"name": "Kyrgyz",
|
|
|
|
| 19171 |
]
|
| 19172 |
},
|
| 19173 |
"MD": {
|
| 19174 |
+
"score": 0.014563109130777574,
|
| 19175 |
"languages": [
|
| 19176 |
{
|
| 19177 |
"name": "Russian",
|
| 19178 |
"bcp_47": "ru",
|
| 19179 |
"population": 100935,
|
| 19180 |
+
"score": 0.45
|
| 19181 |
},
|
| 19182 |
{
|
| 19183 |
"name": "Ukrainian",
|
|
|
|
| 19206 |
]
|
| 19207 |
},
|
| 19208 |
"RU": {
|
| 19209 |
+
"score": 0.4065329789745318,
|
| 19210 |
"languages": [
|
| 19211 |
{
|
| 19212 |
"name": "Russian",
|
| 19213 |
"bcp_47": "ru",
|
| 19214 |
"population": 133218680,
|
| 19215 |
+
"score": 0.45
|
| 19216 |
},
|
| 19217 |
{
|
| 19218 |
"name": "Azerbaijani",
|
|
|
|
| 19427 |
]
|
| 19428 |
},
|
| 19429 |
"SJ": {
|
| 19430 |
+
"score": 0.20059435364041606,
|
| 19431 |
"languages": [
|
| 19432 |
{
|
| 19433 |
"name": "Russian",
|
| 19434 |
"bcp_47": "ru",
|
| 19435 |
"population": 1200,
|
| 19436 |
+
"score": 0.45
|
| 19437 |
},
|
| 19438 |
{
|
| 19439 |
"name": "Norwegian Bokmål",
|
|
|
|
| 19444 |
]
|
| 19445 |
},
|
| 19446 |
"TM": {
|
| 19447 |
+
"score": 0.059080984625687366,
|
| 19448 |
"languages": [
|
| 19449 |
{
|
| 19450 |
"name": "Russian",
|
| 19451 |
"bcp_47": "ru",
|
| 19452 |
"population": 663436,
|
| 19453 |
+
"score": 0.45
|
| 19454 |
},
|
| 19455 |
{
|
| 19456 |
"name": "Uzbek",
|
|
|
|
| 19473 |
]
|
| 19474 |
},
|
| 19475 |
"UA": {
|
| 19476 |
+
"score": 0.17534632621240526,
|
| 19477 |
"languages": [
|
| 19478 |
{
|
| 19479 |
"name": "Russian",
|
| 19480 |
"bcp_47": "ru",
|
| 19481 |
"population": 20204534,
|
| 19482 |
+
"score": 0.45
|
| 19483 |
},
|
| 19484 |
{
|
| 19485 |
"name": "Turkish",
|
| 19486 |
"bcp_47": "tr",
|
| 19487 |
"population": 184476,
|
| 19488 |
+
"score": 0.44
|
| 19489 |
},
|
| 19490 |
{
|
| 19491 |
"name": "Polish",
|
|
|
|
| 19550 |
]
|
| 19551 |
},
|
| 19552 |
"UZ": {
|
| 19553 |
+
"score": 0.05701615696541229,
|
| 19554 |
"languages": [
|
| 19555 |
{
|
| 19556 |
"name": "Russian",
|
| 19557 |
"bcp_47": "ru",
|
| 19558 |
"population": 4279156,
|
| 19559 |
+
"score": 0.45
|
| 19560 |
},
|
| 19561 |
{
|
| 19562 |
"name": "Turkish",
|
| 19563 |
"bcp_47": "tr",
|
| 19564 |
"population": 232297,
|
| 19565 |
+
"score": 0.44
|
| 19566 |
},
|
| 19567 |
{
|
| 19568 |
"name": "Uzbek",
|
|
|
|
| 19579 |
]
|
| 19580 |
},
|
| 19581 |
"LI": {
|
| 19582 |
+
"score": 0.26022294592577516,
|
| 19583 |
"languages": [
|
| 19584 |
{
|
| 19585 |
"name": "German",
|
| 19586 |
"bcp_47": "de",
|
| 19587 |
"population": 39137,
|
| 19588 |
+
"score": 0.49
|
| 19589 |
},
|
| 19590 |
{
|
| 19591 |
"name": "Swiss German",
|
|
|
|
| 19602 |
]
|
| 19603 |
},
|
| 19604 |
"JP": {
|
| 19605 |
+
"score": 0.4560515108353953,
|
| 19606 |
"languages": [
|
| 19607 |
{
|
| 19608 |
"name": "Japanese",
|
| 19609 |
"bcp_47": "ja",
|
| 19610 |
"population": 119231650,
|
| 19611 |
+
"score": 0.46
|
| 19612 |
},
|
| 19613 |
{
|
| 19614 |
"name": "Korean",
|
| 19615 |
"bcp_47": "ko",
|
| 19616 |
"population": 652636,
|
| 19617 |
+
"score": 0.41
|
| 19618 |
},
|
| 19619 |
{
|
| 19620 |
"name": "Central Okinawan",
|
|
|
|
| 19625 |
]
|
| 19626 |
},
|
| 19627 |
"AF": {
|
| 19628 |
+
"score": 0.19133182400153392,
|
| 19629 |
"languages": [
|
| 19630 |
{
|
| 19631 |
"name": "Persian",
|
| 19632 |
"bcp_47": "fa",
|
| 19633 |
"population": 18321900,
|
| 19634 |
+
"score": 0.41
|
| 19635 |
},
|
| 19636 |
{
|
| 19637 |
"name": "Pashto",
|
|
|
|
| 19684 |
]
|
| 19685 |
},
|
| 19686 |
"MK": {
|
| 19687 |
+
"score": 0.016125668065966572,
|
| 19688 |
"languages": [
|
| 19689 |
{
|
| 19690 |
"name": "Turkish",
|
| 19691 |
"bcp_47": "tr",
|
| 19692 |
"population": 74409,
|
| 19693 |
+
"score": 0.44
|
| 19694 |
},
|
| 19695 |
{
|
| 19696 |
"name": "Albanian",
|
|
|
|
| 19707 |
]
|
| 19708 |
},
|
| 19709 |
"KP": {
|
| 19710 |
+
"score": 0.41,
|
| 19711 |
"languages": [
|
| 19712 |
{
|
| 19713 |
"name": "Korean",
|
| 19714 |
"bcp_47": "ko",
|
| 19715 |
"population": 22566280,
|
| 19716 |
+
"score": 0.41
|
| 19717 |
}
|
| 19718 |
]
|
| 19719 |
},
|
| 19720 |
"KR": {
|
| 19721 |
+
"score": 0.41,
|
| 19722 |
"languages": [
|
| 19723 |
{
|
| 19724 |
"name": "Korean",
|
| 19725 |
"bcp_47": "ko",
|
| 19726 |
"population": 51835100,
|
| 19727 |
+
"score": 0.41
|
| 19728 |
}
|
| 19729 |
]
|
| 19730 |
},
|
| 19731 |
"SM": {
|
| 19732 |
+
"score": 0.4654018916371436,
|
| 19733 |
"languages": [
|
| 19734 |
{
|
| 19735 |
"name": "Italian",
|
| 19736 |
"bcp_47": "it",
|
| 19737 |
"population": 30466,
|
| 19738 |
+
"score": 0.47
|
| 19739 |
},
|
| 19740 |
{
|
| 19741 |
"name": "Esperanto",
|
|
|
|
| 19746 |
]
|
| 19747 |
},
|
| 19748 |
"VA": {
|
| 19749 |
+
"score": 0.235,
|
| 19750 |
"languages": [
|
| 19751 |
{
|
| 19752 |
"name": "Italian",
|
| 19753 |
"bcp_47": "it",
|
| 19754 |
"population": 820,
|
| 19755 |
+
"score": 0.47
|
| 19756 |
},
|
| 19757 |
{
|
| 19758 |
"name": "Latin",
|
results.json
CHANGED
|
@@ -3,29 +3,29 @@
|
|
| 3 |
{
|
| 4 |
"task": "classification",
|
| 5 |
"metric": "accuracy",
|
| 6 |
-
"score": 0.
|
| 7 |
-
"bcp_47":
|
| 8 |
"model": 12
|
| 9 |
},
|
| 10 |
{
|
| 11 |
"task": "language_modeling",
|
| 12 |
"metric": "chrf",
|
| 13 |
-
"score": 0.
|
| 14 |
-
"bcp_47":
|
| 15 |
"model": 12
|
| 16 |
},
|
| 17 |
{
|
| 18 |
"task": "translation",
|
| 19 |
"metric": "bleu",
|
| 20 |
-
"score": 0.
|
| 21 |
-
"bcp_47":
|
| 22 |
"model": 12
|
| 23 |
},
|
| 24 |
{
|
| 25 |
"task": "translation",
|
| 26 |
"metric": "chrf",
|
| 27 |
-
"score": 0.
|
| 28 |
-
"bcp_47":
|
| 29 |
"model": 12
|
| 30 |
}
|
| 31 |
],
|
|
@@ -41,7 +41,7 @@
|
|
| 41 |
"model": "amazon/nova-micro-v1",
|
| 42 |
"task": "language_modeling",
|
| 43 |
"metric": "chrf",
|
| 44 |
-
"score": 0.
|
| 45 |
"bcp_47": 2
|
| 46 |
},
|
| 47 |
{
|
|
@@ -69,7 +69,7 @@
|
|
| 69 |
"model": "google/gemini-2.0-flash-001",
|
| 70 |
"task": "language_modeling",
|
| 71 |
"metric": "chrf",
|
| 72 |
-
"score": 0.
|
| 73 |
"bcp_47": 2
|
| 74 |
},
|
| 75 |
{
|
|
@@ -97,7 +97,7 @@
|
|
| 97 |
"model": "google/gemini-2.0-flash-lite-001",
|
| 98 |
"task": "language_modeling",
|
| 99 |
"metric": "chrf",
|
| 100 |
-
"score": 0.
|
| 101 |
"bcp_47": 2
|
| 102 |
},
|
| 103 |
{
|
|
@@ -125,7 +125,7 @@
|
|
| 125 |
"model": "google/gemma-3-27b-it",
|
| 126 |
"task": "language_modeling",
|
| 127 |
"metric": "chrf",
|
| 128 |
-
"score": 0.
|
| 129 |
"bcp_47": 2
|
| 130 |
},
|
| 131 |
{
|
|
@@ -153,7 +153,7 @@
|
|
| 153 |
"model": "meta-llama/llama-3-70b-instruct",
|
| 154 |
"task": "language_modeling",
|
| 155 |
"metric": "chrf",
|
| 156 |
-
"score": 0.
|
| 157 |
"bcp_47": 2
|
| 158 |
},
|
| 159 |
{
|
|
@@ -181,14 +181,14 @@
|
|
| 181 |
"model": "meta-llama/llama-3.1-70b-instruct",
|
| 182 |
"task": "language_modeling",
|
| 183 |
"metric": "chrf",
|
| 184 |
-
"score": 0.
|
| 185 |
"bcp_47": 2
|
| 186 |
},
|
| 187 |
{
|
| 188 |
"model": "meta-llama/llama-3.1-70b-instruct",
|
| 189 |
"task": "translation",
|
| 190 |
"metric": "bleu",
|
| 191 |
-
"score": 0.
|
| 192 |
"bcp_47": 2
|
| 193 |
},
|
| 194 |
{
|
|
@@ -202,29 +202,29 @@
|
|
| 202 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 203 |
"task": "classification",
|
| 204 |
"metric": "accuracy",
|
| 205 |
-
"score": 0.
|
| 206 |
-
"bcp_47":
|
| 207 |
},
|
| 208 |
{
|
| 209 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 210 |
"task": "language_modeling",
|
| 211 |
"metric": "chrf",
|
| 212 |
-
"score": 0.
|
| 213 |
-
"bcp_47":
|
| 214 |
},
|
| 215 |
{
|
| 216 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 217 |
"task": "translation",
|
| 218 |
"metric": "bleu",
|
| 219 |
-
"score": 0.
|
| 220 |
-
"bcp_47":
|
| 221 |
},
|
| 222 |
{
|
| 223 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 224 |
"task": "translation",
|
| 225 |
"metric": "chrf",
|
| 226 |
-
"score": 0.
|
| 227 |
-
"bcp_47":
|
| 228 |
},
|
| 229 |
{
|
| 230 |
"model": "microsoft/phi-4-multimodal-instruct",
|
|
@@ -237,7 +237,7 @@
|
|
| 237 |
"model": "microsoft/phi-4-multimodal-instruct",
|
| 238 |
"task": "language_modeling",
|
| 239 |
"metric": "chrf",
|
| 240 |
-
"score": 0.
|
| 241 |
"bcp_47": 2
|
| 242 |
},
|
| 243 |
{
|
|
@@ -265,7 +265,7 @@
|
|
| 265 |
"model": "mistralai/mistral-nemo",
|
| 266 |
"task": "language_modeling",
|
| 267 |
"metric": "chrf",
|
| 268 |
-
"score": 0.
|
| 269 |
"bcp_47": 2
|
| 270 |
},
|
| 271 |
{
|
|
@@ -293,7 +293,7 @@
|
|
| 293 |
"model": "mistralai/mistral-small-24b-instruct-2501",
|
| 294 |
"task": "language_modeling",
|
| 295 |
"metric": "chrf",
|
| 296 |
-
"score": 0.
|
| 297 |
"bcp_47": 2
|
| 298 |
},
|
| 299 |
{
|
|
@@ -321,7 +321,7 @@
|
|
| 321 |
"model": "openai/gpt-4o-mini",
|
| 322 |
"task": "language_modeling",
|
| 323 |
"metric": "chrf",
|
| 324 |
-
"score": 0.
|
| 325 |
"bcp_47": 2
|
| 326 |
},
|
| 327 |
{
|
|
@@ -349,7 +349,7 @@
|
|
| 349 |
"model": "qwen/qwq-32b",
|
| 350 |
"task": "language_modeling",
|
| 351 |
"metric": "chrf",
|
| 352 |
-
"score": 0.
|
| 353 |
"bcp_47": 2
|
| 354 |
},
|
| 355 |
{
|
|
@@ -701,7 +701,7 @@
|
|
| 701 |
"in_benchmark": true,
|
| 702 |
"task": "language_modeling",
|
| 703 |
"metric": "chrf",
|
| 704 |
-
"score": 0.
|
| 705 |
"model": 1.0
|
| 706 |
},
|
| 707 |
{
|
|
@@ -827,10 +827,58 @@
|
|
| 827 |
"commonvoice_hours": null,
|
| 828 |
"commonvoice_locale": null,
|
| 829 |
"in_benchmark": true,
|
| 830 |
-
"task":
|
| 831 |
-
"metric":
|
| 832 |
-
"score":
|
| 833 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 834 |
},
|
| 835 |
{
|
| 836 |
"bcp_47": "as",
|
|
@@ -1613,7 +1661,7 @@
|
|
| 1613 |
"in_benchmark": true,
|
| 1614 |
"task": "language_modeling",
|
| 1615 |
"metric": "chrf",
|
| 1616 |
-
"score": 0.
|
| 1617 |
"model": 1.0
|
| 1618 |
},
|
| 1619 |
{
|
|
@@ -1992,7 +2040,7 @@
|
|
| 1992 |
"family": "Indo-European",
|
| 1993 |
"flores_path": "cat_Latn",
|
| 1994 |
"fleurs_tag": "ca_es",
|
| 1995 |
-
"commonvoice_hours":
|
| 1996 |
"commonvoice_locale": "ca",
|
| 1997 |
"in_benchmark": true,
|
| 1998 |
"task": null,
|
|
@@ -2587,10 +2635,58 @@
|
|
| 2587 |
"commonvoice_hours": 1360.0,
|
| 2588 |
"commonvoice_locale": "de",
|
| 2589 |
"in_benchmark": true,
|
| 2590 |
-
"task":
|
| 2591 |
-
"metric":
|
| 2592 |
-
"score":
|
| 2593 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2594 |
},
|
| 2595 |
{
|
| 2596 |
"bcp_47": "den",
|
|
@@ -2925,7 +3021,7 @@
|
|
| 2925 |
"in_benchmark": true,
|
| 2926 |
"task": "language_modeling",
|
| 2927 |
"metric": "chrf",
|
| 2928 |
-
"score": 0.
|
| 2929 |
"model": 12.0
|
| 2930 |
},
|
| 2931 |
{
|
|
@@ -2941,7 +3037,7 @@
|
|
| 2941 |
"in_benchmark": true,
|
| 2942 |
"task": "translation",
|
| 2943 |
"metric": "bleu",
|
| 2944 |
-
"score": 0.
|
| 2945 |
"model": 12.0
|
| 2946 |
},
|
| 2947 |
{
|
|
@@ -3005,7 +3101,7 @@
|
|
| 3005 |
"in_benchmark": true,
|
| 3006 |
"task": "language_modeling",
|
| 3007 |
"metric": "chrf",
|
| 3008 |
-
"score": 0.
|
| 3009 |
"model": 1.0
|
| 3010 |
},
|
| 3011 |
{
|
|
@@ -3080,7 +3176,7 @@
|
|
| 3080 |
"family": null,
|
| 3081 |
"flores_path": "eus_Latn",
|
| 3082 |
"fleurs_tag": null,
|
| 3083 |
-
"commonvoice_hours":
|
| 3084 |
"commonvoice_locale": "eu",
|
| 3085 |
"in_benchmark": true,
|
| 3086 |
"task": null,
|
|
@@ -3131,10 +3227,58 @@
|
|
| 3131 |
"commonvoice_hours": 370.0,
|
| 3132 |
"commonvoice_locale": "fa",
|
| 3133 |
"in_benchmark": true,
|
| 3134 |
-
"task":
|
| 3135 |
-
"metric":
|
| 3136 |
-
"score":
|
| 3137 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3138 |
},
|
| 3139 |
{
|
| 3140 |
"bcp_47": "fan",
|
|
@@ -3243,10 +3387,58 @@
|
|
| 3243 |
"commonvoice_hours": 0.0,
|
| 3244 |
"commonvoice_locale": "tl",
|
| 3245 |
"in_benchmark": true,
|
| 3246 |
-
"task":
|
| 3247 |
-
"metric":
|
| 3248 |
-
"score":
|
| 3249 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3250 |
},
|
| 3251 |
{
|
| 3252 |
"bcp_47": "fit",
|
|
@@ -3341,7 +3533,7 @@
|
|
| 3341 |
"in_benchmark": true,
|
| 3342 |
"task": "language_modeling",
|
| 3343 |
"metric": "chrf",
|
| 3344 |
-
"score": 0.
|
| 3345 |
"model": 1.0
|
| 3346 |
},
|
| 3347 |
{
|
|
@@ -3544,7 +3736,7 @@
|
|
| 3544 |
"family": "Indo-European",
|
| 3545 |
"flores_path": "gle_Latn",
|
| 3546 |
"fleurs_tag": "ga_ie",
|
| 3547 |
-
"commonvoice_hours":
|
| 3548 |
"commonvoice_locale": "ga-IE",
|
| 3549 |
"in_benchmark": true,
|
| 3550 |
"task": null,
|
|
@@ -3899,36 +4091,84 @@
|
|
| 3899 |
"commonvoice_hours": 0.0,
|
| 3900 |
"commonvoice_locale": "gu-IN",
|
| 3901 |
"in_benchmark": true,
|
| 3902 |
-
"task":
|
| 3903 |
-
"metric":
|
| 3904 |
-
"score":
|
| 3905 |
-
"model":
|
| 3906 |
},
|
| 3907 |
{
|
| 3908 |
-
"bcp_47": "
|
| 3909 |
-
"speakers":
|
| 3910 |
-
"language_name": "
|
| 3911 |
-
"autonym": "
|
| 3912 |
-
"family": "
|
| 3913 |
-
"flores_path":
|
| 3914 |
-
"fleurs_tag":
|
| 3915 |
-
"commonvoice_hours":
|
| 3916 |
-
"commonvoice_locale":
|
| 3917 |
-
"in_benchmark":
|
| 3918 |
-
"task":
|
| 3919 |
-
"metric":
|
| 3920 |
-
"score":
|
| 3921 |
-
"model":
|
| 3922 |
},
|
| 3923 |
{
|
| 3924 |
-
"bcp_47": "
|
| 3925 |
-
"speakers":
|
| 3926 |
-
"language_name": "
|
| 3927 |
-
"autonym": "
|
| 3928 |
-
"family": "
|
| 3929 |
-
"flores_path":
|
| 3930 |
-
"fleurs_tag":
|
| 3931 |
-
"commonvoice_hours": 0.0,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3932 |
"commonvoice_locale": "guc",
|
| 3933 |
"in_benchmark": false,
|
| 3934 |
"task": null,
|
|
@@ -4125,7 +4365,7 @@
|
|
| 4125 |
"in_benchmark": true,
|
| 4126 |
"task": "language_modeling",
|
| 4127 |
"metric": "chrf",
|
| 4128 |
-
"score": 0.
|
| 4129 |
"model": 1.0
|
| 4130 |
},
|
| 4131 |
{
|
|
@@ -4507,10 +4747,58 @@
|
|
| 4507 |
"commonvoice_hours": 33.0,
|
| 4508 |
"commonvoice_locale": "id",
|
| 4509 |
"in_benchmark": true,
|
| 4510 |
-
"task":
|
| 4511 |
-
"metric":
|
| 4512 |
-
"score":
|
| 4513 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4514 |
},
|
| 4515 |
{
|
| 4516 |
"bcp_47": "ie",
|
|
@@ -4667,10 +4955,58 @@
|
|
| 4667 |
"commonvoice_hours": 362.0,
|
| 4668 |
"commonvoice_locale": "it",
|
| 4669 |
"in_benchmark": true,
|
| 4670 |
-
"task":
|
| 4671 |
-
"metric":
|
| 4672 |
-
"score":
|
| 4673 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4674 |
},
|
| 4675 |
{
|
| 4676 |
"bcp_47": "iu",
|
|
@@ -4715,10 +5051,58 @@
|
|
| 4715 |
"commonvoice_hours": 222.0,
|
| 4716 |
"commonvoice_locale": "ja",
|
| 4717 |
"in_benchmark": true,
|
| 4718 |
-
"task":
|
| 4719 |
-
"metric":
|
| 4720 |
-
"score":
|
| 4721 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4722 |
},
|
| 4723 |
{
|
| 4724 |
"bcp_47": "jam",
|
|
@@ -4827,39 +5211,87 @@
|
|
| 4827 |
"commonvoice_hours": 0.0,
|
| 4828 |
"commonvoice_locale": "jv",
|
| 4829 |
"in_benchmark": true,
|
| 4830 |
-
"task":
|
| 4831 |
-
"metric":
|
| 4832 |
-
"score":
|
| 4833 |
-
"model":
|
| 4834 |
},
|
| 4835 |
{
|
| 4836 |
-
"bcp_47": "
|
| 4837 |
-
"speakers":
|
| 4838 |
-
"language_name": "
|
| 4839 |
-
"autonym": "
|
| 4840 |
-
"family": "
|
| 4841 |
-
"flores_path": "
|
| 4842 |
-
"fleurs_tag": "
|
| 4843 |
-
"commonvoice_hours":
|
| 4844 |
-
"commonvoice_locale": "
|
| 4845 |
"in_benchmark": true,
|
| 4846 |
-
"task":
|
| 4847 |
-
"metric":
|
| 4848 |
-
"score":
|
| 4849 |
-
"model":
|
| 4850 |
},
|
| 4851 |
{
|
| 4852 |
-
"bcp_47": "
|
| 4853 |
-
"speakers":
|
| 4854 |
-
"language_name": "
|
| 4855 |
-
"autonym": "
|
| 4856 |
-
"family": "
|
| 4857 |
-
"flores_path":
|
| 4858 |
-
"fleurs_tag":
|
| 4859 |
-
"commonvoice_hours": 0.0,
|
| 4860 |
-
"commonvoice_locale": "
|
| 4861 |
-
"in_benchmark":
|
| 4862 |
-
"task":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4863 |
"metric": null,
|
| 4864 |
"score": null,
|
| 4865 |
"model": null
|
|
@@ -4952,7 +5384,7 @@
|
|
| 4952 |
"family": "Abkhaz-Adyge",
|
| 4953 |
"flores_path": null,
|
| 4954 |
"fleurs_tag": null,
|
| 4955 |
-
"commonvoice_hours":
|
| 4956 |
"commonvoice_locale": "kbd",
|
| 4957 |
"in_benchmark": false,
|
| 4958 |
"task": null,
|
|
@@ -5451,10 +5883,58 @@
|
|
| 5451 |
"commonvoice_hours": 1.7,
|
| 5452 |
"commonvoice_locale": "ko",
|
| 5453 |
"in_benchmark": true,
|
| 5454 |
-
"task":
|
| 5455 |
-
"metric":
|
| 5456 |
-
"score":
|
| 5457 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5458 |
},
|
| 5459 |
{
|
| 5460 |
"bcp_47": "koi",
|
|
@@ -5752,7 +6232,7 @@
|
|
| 5752 |
"family": "Indo-European",
|
| 5753 |
"flores_path": null,
|
| 5754 |
"fleurs_tag": null,
|
| 5755 |
-
"commonvoice_hours":
|
| 5756 |
"commonvoice_locale": "kw",
|
| 5757 |
"in_benchmark": false,
|
| 5758 |
"task": null,
|
|
@@ -6872,7 +7352,7 @@
|
|
| 6872 |
"family": "Indo-European",
|
| 6873 |
"flores_path": "mkd_Cyrl",
|
| 6874 |
"fleurs_tag": "mk_mk",
|
| 6875 |
-
"commonvoice_hours":
|
| 6876 |
"commonvoice_locale": "mk",
|
| 6877 |
"in_benchmark": true,
|
| 6878 |
"task": null,
|
|
@@ -7019,10 +7499,58 @@
|
|
| 7019 |
"commonvoice_hours": 20.0,
|
| 7020 |
"commonvoice_locale": "mr",
|
| 7021 |
"in_benchmark": true,
|
| 7022 |
-
"task":
|
| 7023 |
-
"metric":
|
| 7024 |
-
"score":
|
| 7025 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7026 |
},
|
| 7027 |
{
|
| 7028 |
"bcp_47": "mrd",
|
|
@@ -7976,7 +8504,7 @@
|
|
| 7976 |
"family": "Indo-European",
|
| 7977 |
"flores_path": null,
|
| 7978 |
"fleurs_tag": null,
|
| 7979 |
-
"commonvoice_hours": 0.
|
| 7980 |
"commonvoice_locale": "os",
|
| 7981 |
"in_benchmark": false,
|
| 7982 |
"task": null,
|
|
@@ -8029,7 +8557,7 @@
|
|
| 8029 |
"in_benchmark": true,
|
| 8030 |
"task": "language_modeling",
|
| 8031 |
"metric": "chrf",
|
| 8032 |
-
"score": 0.
|
| 8033 |
"model": 1.0
|
| 8034 |
},
|
| 8035 |
{
|
|
@@ -8397,7 +8925,7 @@
|
|
| 8397 |
"in_benchmark": true,
|
| 8398 |
"task": "language_modeling",
|
| 8399 |
"metric": "chrf",
|
| 8400 |
-
"score": 0.
|
| 8401 |
"model": 1.0
|
| 8402 |
},
|
| 8403 |
{
|
|
@@ -8824,13 +9352,61 @@
|
|
| 8824 |
"family": "Indo-European",
|
| 8825 |
"flores_path": "rus_Cyrl",
|
| 8826 |
"fleurs_tag": "ru_ru",
|
| 8827 |
-
"commonvoice_hours":
|
| 8828 |
"commonvoice_locale": "ru",
|
| 8829 |
"in_benchmark": true,
|
| 8830 |
-
"task":
|
| 8831 |
-
"metric":
|
| 8832 |
-
"score":
|
| 8833 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8834 |
},
|
| 8835 |
{
|
| 8836 |
"bcp_47": "rue",
|
|
@@ -9224,7 +9800,7 @@
|
|
| 9224 |
"family": null,
|
| 9225 |
"flores_path": null,
|
| 9226 |
"fleurs_tag": null,
|
| 9227 |
-
"commonvoice_hours":
|
| 9228 |
"commonvoice_locale": "sei",
|
| 9229 |
"in_benchmark": false,
|
| 9230 |
"task": null,
|
|
@@ -9803,32 +10379,80 @@
|
|
| 9803 |
"commonvoice_hours": 411.0,
|
| 9804 |
"commonvoice_locale": "sw",
|
| 9805 |
"in_benchmark": true,
|
| 9806 |
-
"task":
|
| 9807 |
-
"metric":
|
| 9808 |
-
"score":
|
| 9809 |
-
"model":
|
| 9810 |
},
|
| 9811 |
{
|
| 9812 |
-
"bcp_47": "
|
| 9813 |
-
"speakers":
|
| 9814 |
-
"language_name": "
|
| 9815 |
-
"autonym": "
|
| 9816 |
"family": "Atlantic-Congo",
|
| 9817 |
-
"flores_path":
|
| 9818 |
-
"fleurs_tag":
|
| 9819 |
-
"commonvoice_hours":
|
| 9820 |
-
"commonvoice_locale":
|
| 9821 |
-
"in_benchmark":
|
| 9822 |
-
"task":
|
| 9823 |
-
"metric":
|
| 9824 |
-
"score":
|
| 9825 |
-
"model":
|
| 9826 |
},
|
| 9827 |
{
|
| 9828 |
-
"bcp_47": "
|
| 9829 |
-
"speakers":
|
| 9830 |
-
"language_name": "
|
| 9831 |
-
"autonym": "
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9832 |
"family": "Indo-European",
|
| 9833 |
"flores_path": null,
|
| 9834 |
"fleurs_tag": null,
|
|
@@ -9931,10 +10555,58 @@
|
|
| 9931 |
"commonvoice_hours": 234.0,
|
| 9932 |
"commonvoice_locale": "ta",
|
| 9933 |
"in_benchmark": true,
|
| 9934 |
-
"task":
|
| 9935 |
-
"metric":
|
| 9936 |
-
"score":
|
| 9937 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9938 |
},
|
| 9939 |
{
|
| 9940 |
"bcp_47": "taj",
|
|
@@ -10043,10 +10715,58 @@
|
|
| 10043 |
"commonvoice_hours": 0.3,
|
| 10044 |
"commonvoice_locale": "te",
|
| 10045 |
"in_benchmark": true,
|
| 10046 |
-
"task":
|
| 10047 |
-
"metric":
|
| 10048 |
-
"score":
|
| 10049 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10050 |
},
|
| 10051 |
{
|
| 10052 |
"bcp_47": "tem",
|
|
@@ -10411,10 +11131,58 @@
|
|
| 10411 |
"commonvoice_hours": 128.0,
|
| 10412 |
"commonvoice_locale": "tr",
|
| 10413 |
"in_benchmark": true,
|
| 10414 |
-
"task":
|
| 10415 |
-
"metric":
|
| 10416 |
-
"score":
|
| 10417 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10418 |
},
|
| 10419 |
{
|
| 10420 |
"bcp_47": "tru",
|
|
@@ -10829,7 +11597,7 @@
|
|
| 10829 |
"in_benchmark": true,
|
| 10830 |
"task": "language_modeling",
|
| 10831 |
"metric": "chrf",
|
| 10832 |
-
"score": 0.
|
| 10833 |
"model": 1.0
|
| 10834 |
},
|
| 10835 |
{
|
|
@@ -10845,7 +11613,7 @@
|
|
| 10845 |
"in_benchmark": true,
|
| 10846 |
"task": "translation",
|
| 10847 |
"metric": "bleu",
|
| 10848 |
-
"score": 0.
|
| 10849 |
"model": 1.0
|
| 10850 |
},
|
| 10851 |
{
|
|
@@ -10955,42 +11723,90 @@
|
|
| 10955 |
"commonvoice_hours": 6.0,
|
| 10956 |
"commonvoice_locale": "vi",
|
| 10957 |
"in_benchmark": true,
|
| 10958 |
-
"task":
|
| 10959 |
-
"metric":
|
| 10960 |
-
"score":
|
| 10961 |
-
"model":
|
| 10962 |
},
|
| 10963 |
{
|
| 10964 |
-
"bcp_47": "
|
| 10965 |
-
"speakers":
|
| 10966 |
-
"language_name": "
|
| 10967 |
-
"autonym": "
|
| 10968 |
-
"family": "
|
| 10969 |
-
"flores_path":
|
| 10970 |
-
"fleurs_tag":
|
| 10971 |
-
"commonvoice_hours":
|
| 10972 |
-
"commonvoice_locale":
|
| 10973 |
-
"in_benchmark":
|
| 10974 |
-
"task":
|
| 10975 |
-
"metric":
|
| 10976 |
-
"score":
|
| 10977 |
-
"model":
|
| 10978 |
},
|
| 10979 |
{
|
| 10980 |
-
"bcp_47": "
|
| 10981 |
-
"speakers":
|
| 10982 |
-
"language_name": "
|
| 10983 |
-
"autonym": "
|
| 10984 |
-
"family": "
|
| 10985 |
-
"flores_path":
|
| 10986 |
-
"fleurs_tag":
|
| 10987 |
-
"commonvoice_hours":
|
| 10988 |
-
"commonvoice_locale":
|
| 10989 |
-
"in_benchmark":
|
| 10990 |
-
"task":
|
| 10991 |
-
"metric":
|
| 10992 |
-
"score":
|
| 10993 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10994 |
},
|
| 10995 |
{
|
| 10996 |
"bcp_47": "vmf",
|
|
@@ -11499,10 +12315,58 @@
|
|
| 11499 |
"commonvoice_hours": 203.0,
|
| 11500 |
"commonvoice_locale": "yue",
|
| 11501 |
"in_benchmark": true,
|
| 11502 |
-
"task":
|
| 11503 |
-
"metric":
|
| 11504 |
-
"score":
|
| 11505 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 11506 |
},
|
| 11507 |
{
|
| 11508 |
"bcp_47": "za",
|
|
@@ -11613,7 +12477,7 @@
|
|
| 11613 |
"in_benchmark": true,
|
| 11614 |
"task": "language_modeling",
|
| 11615 |
"metric": "chrf",
|
| 11616 |
-
"score": 0.
|
| 11617 |
"model": 12.0
|
| 11618 |
},
|
| 11619 |
{
|
|
@@ -11711,7 +12575,7 @@
|
|
| 11711 |
"bcp_47": "en",
|
| 11712 |
"task": "language_modeling",
|
| 11713 |
"metric": "chrf",
|
| 11714 |
-
"score": 0.
|
| 11715 |
"sentence_nr": 14.5
|
| 11716 |
},
|
| 11717 |
{
|
|
@@ -11743,7 +12607,7 @@
|
|
| 11743 |
"bcp_47": "zh",
|
| 11744 |
"task": "language_modeling",
|
| 11745 |
"metric": "chrf",
|
| 11746 |
-
"score": 0.
|
| 11747 |
"sentence_nr": 14.5
|
| 11748 |
},
|
| 11749 |
{
|
|
@@ -11775,7 +12639,7 @@
|
|
| 11775 |
"bcp_47": "en",
|
| 11776 |
"task": "language_modeling",
|
| 11777 |
"metric": "chrf",
|
| 11778 |
-
"score": 0.
|
| 11779 |
"sentence_nr": 14.5
|
| 11780 |
},
|
| 11781 |
{
|
|
@@ -11807,7 +12671,7 @@
|
|
| 11807 |
"bcp_47": "zh",
|
| 11808 |
"task": "language_modeling",
|
| 11809 |
"metric": "chrf",
|
| 11810 |
-
"score": 0.
|
| 11811 |
"sentence_nr": 14.5
|
| 11812 |
},
|
| 11813 |
{
|
|
@@ -11839,7 +12703,7 @@
|
|
| 11839 |
"bcp_47": "en",
|
| 11840 |
"task": "language_modeling",
|
| 11841 |
"metric": "chrf",
|
| 11842 |
-
"score": 0.
|
| 11843 |
"sentence_nr": 14.5
|
| 11844 |
},
|
| 11845 |
{
|
|
@@ -11871,7 +12735,7 @@
|
|
| 11871 |
"bcp_47": "zh",
|
| 11872 |
"task": "language_modeling",
|
| 11873 |
"metric": "chrf",
|
| 11874 |
-
"score": 0.
|
| 11875 |
"sentence_nr": 14.5
|
| 11876 |
},
|
| 11877 |
{
|
|
@@ -11903,7 +12767,7 @@
|
|
| 11903 |
"bcp_47": "en",
|
| 11904 |
"task": "language_modeling",
|
| 11905 |
"metric": "chrf",
|
| 11906 |
-
"score": 0.
|
| 11907 |
"sentence_nr": 14.5
|
| 11908 |
},
|
| 11909 |
{
|
|
@@ -11935,7 +12799,7 @@
|
|
| 11935 |
"bcp_47": "zh",
|
| 11936 |
"task": "language_modeling",
|
| 11937 |
"metric": "chrf",
|
| 11938 |
-
"score": 0.
|
| 11939 |
"sentence_nr": 14.5
|
| 11940 |
},
|
| 11941 |
{
|
|
@@ -11967,7 +12831,7 @@
|
|
| 11967 |
"bcp_47": "en",
|
| 11968 |
"task": "language_modeling",
|
| 11969 |
"metric": "chrf",
|
| 11970 |
-
"score": 0.
|
| 11971 |
"sentence_nr": 14.5
|
| 11972 |
},
|
| 11973 |
{
|
|
@@ -11999,7 +12863,7 @@
|
|
| 11999 |
"bcp_47": "zh",
|
| 12000 |
"task": "language_modeling",
|
| 12001 |
"metric": "chrf",
|
| 12002 |
-
"score": 0.
|
| 12003 |
"sentence_nr": 14.5
|
| 12004 |
},
|
| 12005 |
{
|
|
@@ -12031,7 +12895,7 @@
|
|
| 12031 |
"bcp_47": "en",
|
| 12032 |
"task": "language_modeling",
|
| 12033 |
"metric": "chrf",
|
| 12034 |
-
"score": 0.
|
| 12035 |
"sentence_nr": 14.5
|
| 12036 |
},
|
| 12037 |
{
|
|
@@ -12039,7 +12903,7 @@
|
|
| 12039 |
"bcp_47": "en",
|
| 12040 |
"task": "translation",
|
| 12041 |
"metric": "bleu",
|
| 12042 |
-
"score": 0.
|
| 12043 |
"sentence_nr": 14.5
|
| 12044 |
},
|
| 12045 |
{
|
|
@@ -12063,7 +12927,7 @@
|
|
| 12063 |
"bcp_47": "zh",
|
| 12064 |
"task": "language_modeling",
|
| 12065 |
"metric": "chrf",
|
| 12066 |
-
"score": 0.
|
| 12067 |
"sentence_nr": 14.5
|
| 12068 |
},
|
| 12069 |
{
|
|
@@ -12095,7 +12959,7 @@
|
|
| 12095 |
"bcp_47": "ar",
|
| 12096 |
"task": "language_modeling",
|
| 12097 |
"metric": "chrf",
|
| 12098 |
-
"score": 0.
|
| 12099 |
"sentence_nr": 14.5
|
| 12100 |
},
|
| 12101 |
{
|
|
@@ -12114,6 +12978,38 @@
|
|
| 12114 |
"score": 0.4684314458952127,
|
| 12115 |
"sentence_nr": 14.5
|
| 12116 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12117 |
{
|
| 12118 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12119 |
"bcp_47": "bn",
|
|
@@ -12127,7 +13023,7 @@
|
|
| 12127 |
"bcp_47": "bn",
|
| 12128 |
"task": "language_modeling",
|
| 12129 |
"metric": "chrf",
|
| 12130 |
-
"score": 0.
|
| 12131 |
"sentence_nr": 14.5
|
| 12132 |
},
|
| 12133 |
{
|
|
@@ -12146,6 +13042,38 @@
|
|
| 12146 |
"score": 0.4076175886917154,
|
| 12147 |
"sentence_nr": 14.5
|
| 12148 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12149 |
{
|
| 12150 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12151 |
"bcp_47": "en",
|
|
@@ -12159,7 +13087,7 @@
|
|
| 12159 |
"bcp_47": "en",
|
| 12160 |
"task": "language_modeling",
|
| 12161 |
"metric": "chrf",
|
| 12162 |
-
"score": 0.
|
| 12163 |
"sentence_nr": 14.5
|
| 12164 |
},
|
| 12165 |
{
|
|
@@ -12191,7 +13119,7 @@
|
|
| 12191 |
"bcp_47": "es",
|
| 12192 |
"task": "language_modeling",
|
| 12193 |
"metric": "chrf",
|
| 12194 |
-
"score": 0.
|
| 12195 |
"sentence_nr": 14.5
|
| 12196 |
},
|
| 12197 |
{
|
|
@@ -12212,162 +13140,674 @@
|
|
| 12212 |
},
|
| 12213 |
{
|
| 12214 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12215 |
-
"bcp_47": "
|
| 12216 |
"task": "classification",
|
| 12217 |
"metric": "accuracy",
|
| 12218 |
-
"score": 0.
|
| 12219 |
"sentence_nr": 14.5
|
| 12220 |
},
|
| 12221 |
{
|
| 12222 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12223 |
-
"bcp_47": "
|
| 12224 |
"task": "language_modeling",
|
| 12225 |
"metric": "chrf",
|
| 12226 |
-
"score": 0.
|
| 12227 |
"sentence_nr": 14.5
|
| 12228 |
},
|
| 12229 |
{
|
| 12230 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12231 |
-
"bcp_47": "
|
| 12232 |
"task": "translation",
|
| 12233 |
"metric": "bleu",
|
| 12234 |
-
"score": 0.
|
| 12235 |
"sentence_nr": 14.5
|
| 12236 |
},
|
| 12237 |
{
|
| 12238 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12239 |
-
"bcp_47": "
|
| 12240 |
"task": "translation",
|
| 12241 |
"metric": "chrf",
|
| 12242 |
-
"score": 0.
|
| 12243 |
"sentence_nr": 14.5
|
| 12244 |
},
|
| 12245 |
{
|
| 12246 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12247 |
-
"bcp_47": "
|
| 12248 |
"task": "classification",
|
| 12249 |
"metric": "accuracy",
|
| 12250 |
-
"score": 0.
|
| 12251 |
"sentence_nr": 14.5
|
| 12252 |
},
|
| 12253 |
{
|
| 12254 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12255 |
-
"bcp_47": "
|
| 12256 |
"task": "language_modeling",
|
| 12257 |
"metric": "chrf",
|
| 12258 |
-
"score": 0.
|
| 12259 |
"sentence_nr": 14.5
|
| 12260 |
},
|
| 12261 |
{
|
| 12262 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12263 |
-
"bcp_47": "
|
| 12264 |
"task": "translation",
|
| 12265 |
"metric": "bleu",
|
| 12266 |
-
"score": 0.
|
| 12267 |
"sentence_nr": 14.5
|
| 12268 |
},
|
| 12269 |
{
|
| 12270 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12271 |
-
"bcp_47": "
|
| 12272 |
"task": "translation",
|
| 12273 |
"metric": "chrf",
|
| 12274 |
-
"score": 0.
|
| 12275 |
"sentence_nr": 14.5
|
| 12276 |
},
|
| 12277 |
{
|
| 12278 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12279 |
-
"bcp_47": "
|
| 12280 |
"task": "classification",
|
| 12281 |
"metric": "accuracy",
|
| 12282 |
-
"score": 0.
|
| 12283 |
"sentence_nr": 14.5
|
| 12284 |
},
|
| 12285 |
{
|
| 12286 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12287 |
-
"bcp_47": "
|
| 12288 |
"task": "language_modeling",
|
| 12289 |
"metric": "chrf",
|
| 12290 |
-
"score": 0.
|
| 12291 |
"sentence_nr": 14.5
|
| 12292 |
},
|
| 12293 |
{
|
| 12294 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12295 |
-
"bcp_47": "
|
| 12296 |
"task": "translation",
|
| 12297 |
"metric": "bleu",
|
| 12298 |
-
"score": 0.
|
| 12299 |
"sentence_nr": 14.5
|
| 12300 |
},
|
| 12301 |
{
|
| 12302 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12303 |
-
"bcp_47": "
|
| 12304 |
"task": "translation",
|
| 12305 |
"metric": "chrf",
|
| 12306 |
-
"score": 0.
|
| 12307 |
"sentence_nr": 14.5
|
| 12308 |
},
|
| 12309 |
{
|
| 12310 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12311 |
-
"bcp_47": "
|
| 12312 |
"task": "classification",
|
| 12313 |
"metric": "accuracy",
|
| 12314 |
-
"score": 0.
|
| 12315 |
"sentence_nr": 14.5
|
| 12316 |
},
|
| 12317 |
{
|
| 12318 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12319 |
-
"bcp_47": "
|
| 12320 |
"task": "language_modeling",
|
| 12321 |
"metric": "chrf",
|
| 12322 |
-
"score": 0.
|
| 12323 |
"sentence_nr": 14.5
|
| 12324 |
},
|
| 12325 |
{
|
| 12326 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12327 |
-
"bcp_47": "
|
| 12328 |
"task": "translation",
|
| 12329 |
"metric": "bleu",
|
| 12330 |
-
"score": 0.
|
| 12331 |
"sentence_nr": 14.5
|
| 12332 |
},
|
| 12333 |
{
|
| 12334 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12335 |
-
"bcp_47": "
|
| 12336 |
"task": "translation",
|
| 12337 |
"metric": "chrf",
|
| 12338 |
-
"score": 0.
|
| 12339 |
"sentence_nr": 14.5
|
| 12340 |
},
|
| 12341 |
{
|
| 12342 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12343 |
-
"bcp_47": "
|
| 12344 |
"task": "classification",
|
| 12345 |
"metric": "accuracy",
|
| 12346 |
-
"score": 0.
|
| 12347 |
"sentence_nr": 14.5
|
| 12348 |
},
|
| 12349 |
{
|
| 12350 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12351 |
-
"bcp_47": "
|
| 12352 |
"task": "language_modeling",
|
| 12353 |
"metric": "chrf",
|
| 12354 |
-
"score": 0.
|
| 12355 |
"sentence_nr": 14.5
|
| 12356 |
},
|
| 12357 |
{
|
| 12358 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12359 |
-
"bcp_47": "
|
| 12360 |
"task": "translation",
|
| 12361 |
"metric": "bleu",
|
| 12362 |
-
"score": 0.
|
| 12363 |
"sentence_nr": 14.5
|
| 12364 |
},
|
| 12365 |
{
|
| 12366 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12367 |
-
"bcp_47": "
|
| 12368 |
"task": "translation",
|
| 12369 |
"metric": "chrf",
|
| 12370 |
-
"score": 0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 12371 |
"sentence_nr": 14.5
|
| 12372 |
},
|
| 12373 |
{
|
|
@@ -12383,7 +13823,7 @@
|
|
| 12383 |
"bcp_47": "zh",
|
| 12384 |
"task": "language_modeling",
|
| 12385 |
"metric": "chrf",
|
| 12386 |
-
"score": 0.
|
| 12387 |
"sentence_nr": 14.5
|
| 12388 |
},
|
| 12389 |
{
|
|
@@ -12415,7 +13855,7 @@
|
|
| 12415 |
"bcp_47": "en",
|
| 12416 |
"task": "language_modeling",
|
| 12417 |
"metric": "chrf",
|
| 12418 |
-
"score": 0.
|
| 12419 |
"sentence_nr": 14.5
|
| 12420 |
},
|
| 12421 |
{
|
|
@@ -12447,7 +13887,7 @@
|
|
| 12447 |
"bcp_47": "zh",
|
| 12448 |
"task": "language_modeling",
|
| 12449 |
"metric": "chrf",
|
| 12450 |
-
"score": 0.
|
| 12451 |
"sentence_nr": 14.5
|
| 12452 |
},
|
| 12453 |
{
|
|
@@ -12479,7 +13919,7 @@
|
|
| 12479 |
"bcp_47": "en",
|
| 12480 |
"task": "language_modeling",
|
| 12481 |
"metric": "chrf",
|
| 12482 |
-
"score": 0.
|
| 12483 |
"sentence_nr": 14.5
|
| 12484 |
},
|
| 12485 |
{
|
|
@@ -12511,7 +13951,7 @@
|
|
| 12511 |
"bcp_47": "zh",
|
| 12512 |
"task": "language_modeling",
|
| 12513 |
"metric": "chrf",
|
| 12514 |
-
"score": 0.
|
| 12515 |
"sentence_nr": 14.5
|
| 12516 |
},
|
| 12517 |
{
|
|
@@ -12543,7 +13983,7 @@
|
|
| 12543 |
"bcp_47": "en",
|
| 12544 |
"task": "language_modeling",
|
| 12545 |
"metric": "chrf",
|
| 12546 |
-
"score": 0.
|
| 12547 |
"sentence_nr": 14.5
|
| 12548 |
},
|
| 12549 |
{
|
|
@@ -12575,7 +14015,7 @@
|
|
| 12575 |
"bcp_47": "zh",
|
| 12576 |
"task": "language_modeling",
|
| 12577 |
"metric": "chrf",
|
| 12578 |
-
"score": 0.
|
| 12579 |
"sentence_nr": 14.5
|
| 12580 |
},
|
| 12581 |
{
|
|
@@ -12607,7 +14047,7 @@
|
|
| 12607 |
"bcp_47": "en",
|
| 12608 |
"task": "language_modeling",
|
| 12609 |
"metric": "chrf",
|
| 12610 |
-
"score": 0.
|
| 12611 |
"sentence_nr": 14.5
|
| 12612 |
},
|
| 12613 |
{
|
|
@@ -12639,7 +14079,7 @@
|
|
| 12639 |
"bcp_47": "zh",
|
| 12640 |
"task": "language_modeling",
|
| 12641 |
"metric": "chrf",
|
| 12642 |
-
"score": 0.
|
| 12643 |
"sentence_nr": 14.5
|
| 12644 |
},
|
| 12645 |
{
|
|
@@ -12671,7 +14111,7 @@
|
|
| 12671 |
"bcp_47": "en",
|
| 12672 |
"task": "language_modeling",
|
| 12673 |
"metric": "chrf",
|
| 12674 |
-
"score": 0.
|
| 12675 |
"sentence_nr": 14.5
|
| 12676 |
},
|
| 12677 |
{
|
|
@@ -12703,7 +14143,7 @@
|
|
| 12703 |
"bcp_47": "zh",
|
| 12704 |
"task": "language_modeling",
|
| 12705 |
"metric": "chrf",
|
| 12706 |
-
"score": 0.
|
| 12707 |
"sentence_nr": 14.5
|
| 12708 |
},
|
| 12709 |
{
|
|
|
|
| 3 |
{
|
| 4 |
"task": "classification",
|
| 5 |
"metric": "accuracy",
|
| 6 |
+
"score": 0.5353333333333333,
|
| 7 |
+
"bcp_47": 28,
|
| 8 |
"model": 12
|
| 9 |
},
|
| 10 |
{
|
| 11 |
"task": "language_modeling",
|
| 12 |
"metric": "chrf",
|
| 13 |
+
"score": 0.9172787041570468,
|
| 14 |
+
"bcp_47": 28,
|
| 15 |
"model": 12
|
| 16 |
},
|
| 17 |
{
|
| 18 |
"task": "translation",
|
| 19 |
"metric": "bleu",
|
| 20 |
+
"score": 0.31440758611811165,
|
| 21 |
+
"bcp_47": 28,
|
| 22 |
"model": 12
|
| 23 |
},
|
| 24 |
{
|
| 25 |
"task": "translation",
|
| 26 |
"metric": "chrf",
|
| 27 |
+
"score": 0.4776446463431595,
|
| 28 |
+
"bcp_47": 28,
|
| 29 |
"model": 12
|
| 30 |
}
|
| 31 |
],
|
|
|
|
| 41 |
"model": "amazon/nova-micro-v1",
|
| 42 |
"task": "language_modeling",
|
| 43 |
"metric": "chrf",
|
| 44 |
+
"score": 0.9358428899682786,
|
| 45 |
"bcp_47": 2
|
| 46 |
},
|
| 47 |
{
|
|
|
|
| 69 |
"model": "google/gemini-2.0-flash-001",
|
| 70 |
"task": "language_modeling",
|
| 71 |
"metric": "chrf",
|
| 72 |
+
"score": 0.9585325034195884,
|
| 73 |
"bcp_47": 2
|
| 74 |
},
|
| 75 |
{
|
|
|
|
| 97 |
"model": "google/gemini-2.0-flash-lite-001",
|
| 98 |
"task": "language_modeling",
|
| 99 |
"metric": "chrf",
|
| 100 |
+
"score": 0.9574729426945592,
|
| 101 |
"bcp_47": 2
|
| 102 |
},
|
| 103 |
{
|
|
|
|
| 125 |
"model": "google/gemma-3-27b-it",
|
| 126 |
"task": "language_modeling",
|
| 127 |
"metric": "chrf",
|
| 128 |
+
"score": 0.9402106879094536,
|
| 129 |
"bcp_47": 2
|
| 130 |
},
|
| 131 |
{
|
|
|
|
| 153 |
"model": "meta-llama/llama-3-70b-instruct",
|
| 154 |
"task": "language_modeling",
|
| 155 |
"metric": "chrf",
|
| 156 |
+
"score": 0.9555990324827045,
|
| 157 |
"bcp_47": 2
|
| 158 |
},
|
| 159 |
{
|
|
|
|
| 181 |
"model": "meta-llama/llama-3.1-70b-instruct",
|
| 182 |
"task": "language_modeling",
|
| 183 |
"metric": "chrf",
|
| 184 |
+
"score": 0.9458265879125298,
|
| 185 |
"bcp_47": 2
|
| 186 |
},
|
| 187 |
{
|
| 188 |
"model": "meta-llama/llama-3.1-70b-instruct",
|
| 189 |
"task": "translation",
|
| 190 |
"metric": "bleu",
|
| 191 |
+
"score": 0.4318584195195329,
|
| 192 |
"bcp_47": 2
|
| 193 |
},
|
| 194 |
{
|
|
|
|
| 202 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 203 |
"task": "classification",
|
| 204 |
"metric": "accuracy",
|
| 205 |
+
"score": 0.5142857142857143,
|
| 206 |
+
"bcp_47": 28
|
| 207 |
},
|
| 208 |
{
|
| 209 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 210 |
"task": "language_modeling",
|
| 211 |
"metric": "chrf",
|
| 212 |
+
"score": 0.9422717613037961,
|
| 213 |
+
"bcp_47": 28
|
| 214 |
},
|
| 215 |
{
|
| 216 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 217 |
"task": "translation",
|
| 218 |
"metric": "bleu",
|
| 219 |
+
"score": 0.28045810258852616,
|
| 220 |
+
"bcp_47": 28
|
| 221 |
},
|
| 222 |
{
|
| 223 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 224 |
"task": "translation",
|
| 225 |
"metric": "chrf",
|
| 226 |
+
"score": 0.45694310450071773,
|
| 227 |
+
"bcp_47": 28
|
| 228 |
},
|
| 229 |
{
|
| 230 |
"model": "microsoft/phi-4-multimodal-instruct",
|
|
|
|
| 237 |
"model": "microsoft/phi-4-multimodal-instruct",
|
| 238 |
"task": "language_modeling",
|
| 239 |
"metric": "chrf",
|
| 240 |
+
"score": 0.8811352896333067,
|
| 241 |
"bcp_47": 2
|
| 242 |
},
|
| 243 |
{
|
|
|
|
| 265 |
"model": "mistralai/mistral-nemo",
|
| 266 |
"task": "language_modeling",
|
| 267 |
"metric": "chrf",
|
| 268 |
+
"score": 0.8612477844203897,
|
| 269 |
"bcp_47": 2
|
| 270 |
},
|
| 271 |
{
|
|
|
|
| 293 |
"model": "mistralai/mistral-small-24b-instruct-2501",
|
| 294 |
"task": "language_modeling",
|
| 295 |
"metric": "chrf",
|
| 296 |
+
"score": 0.8782400543225595,
|
| 297 |
"bcp_47": 2
|
| 298 |
},
|
| 299 |
{
|
|
|
|
| 321 |
"model": "openai/gpt-4o-mini",
|
| 322 |
"task": "language_modeling",
|
| 323 |
"metric": "chrf",
|
| 324 |
+
"score": 0.9560369064537906,
|
| 325 |
"bcp_47": 2
|
| 326 |
},
|
| 327 |
{
|
|
|
|
| 349 |
"model": "qwen/qwq-32b",
|
| 350 |
"task": "language_modeling",
|
| 351 |
"metric": "chrf",
|
| 352 |
+
"score": 0.47001826645586636,
|
| 353 |
"bcp_47": 2
|
| 354 |
},
|
| 355 |
{
|
|
|
|
| 701 |
"in_benchmark": true,
|
| 702 |
"task": "language_modeling",
|
| 703 |
"metric": "chrf",
|
| 704 |
+
"score": 0.9392314289764625,
|
| 705 |
"model": 1.0
|
| 706 |
},
|
| 707 |
{
|
|
|
|
| 827 |
"commonvoice_hours": null,
|
| 828 |
"commonvoice_locale": null,
|
| 829 |
"in_benchmark": true,
|
| 830 |
+
"task": "classification",
|
| 831 |
+
"metric": "accuracy",
|
| 832 |
+
"score": 0.4,
|
| 833 |
+
"model": 1.0
|
| 834 |
+
},
|
| 835 |
+
{
|
| 836 |
+
"bcp_47": "arz",
|
| 837 |
+
"speakers": 66639360,
|
| 838 |
+
"language_name": "Egyptian Arabic",
|
| 839 |
+
"autonym": "Egyptian Arabic",
|
| 840 |
+
"family": "Afro-Asiatic",
|
| 841 |
+
"flores_path": "arz_Arab",
|
| 842 |
+
"fleurs_tag": null,
|
| 843 |
+
"commonvoice_hours": null,
|
| 844 |
+
"commonvoice_locale": null,
|
| 845 |
+
"in_benchmark": true,
|
| 846 |
+
"task": "language_modeling",
|
| 847 |
+
"metric": "chrf",
|
| 848 |
+
"score": 0.930329195667362,
|
| 849 |
+
"model": 1.0
|
| 850 |
+
},
|
| 851 |
+
{
|
| 852 |
+
"bcp_47": "arz",
|
| 853 |
+
"speakers": 66639360,
|
| 854 |
+
"language_name": "Egyptian Arabic",
|
| 855 |
+
"autonym": "Egyptian Arabic",
|
| 856 |
+
"family": "Afro-Asiatic",
|
| 857 |
+
"flores_path": "arz_Arab",
|
| 858 |
+
"fleurs_tag": null,
|
| 859 |
+
"commonvoice_hours": null,
|
| 860 |
+
"commonvoice_locale": null,
|
| 861 |
+
"in_benchmark": true,
|
| 862 |
+
"task": "translation",
|
| 863 |
+
"metric": "bleu",
|
| 864 |
+
"score": 0.19793415292805128,
|
| 865 |
+
"model": 1.0
|
| 866 |
+
},
|
| 867 |
+
{
|
| 868 |
+
"bcp_47": "arz",
|
| 869 |
+
"speakers": 66639360,
|
| 870 |
+
"language_name": "Egyptian Arabic",
|
| 871 |
+
"autonym": "Egyptian Arabic",
|
| 872 |
+
"family": "Afro-Asiatic",
|
| 873 |
+
"flores_path": "arz_Arab",
|
| 874 |
+
"fleurs_tag": null,
|
| 875 |
+
"commonvoice_hours": null,
|
| 876 |
+
"commonvoice_locale": null,
|
| 877 |
+
"in_benchmark": true,
|
| 878 |
+
"task": "translation",
|
| 879 |
+
"metric": "chrf",
|
| 880 |
+
"score": 0.3881278724939126,
|
| 881 |
+
"model": 1.0
|
| 882 |
},
|
| 883 |
{
|
| 884 |
"bcp_47": "as",
|
|
|
|
| 1661 |
"in_benchmark": true,
|
| 1662 |
"task": "language_modeling",
|
| 1663 |
"metric": "chrf",
|
| 1664 |
+
"score": 0.9097658392566466,
|
| 1665 |
"model": 1.0
|
| 1666 |
},
|
| 1667 |
{
|
|
|
|
| 2040 |
"family": "Indo-European",
|
| 2041 |
"flores_path": "cat_Latn",
|
| 2042 |
"fleurs_tag": "ca_es",
|
| 2043 |
+
"commonvoice_hours": 2845.0,
|
| 2044 |
"commonvoice_locale": "ca",
|
| 2045 |
"in_benchmark": true,
|
| 2046 |
"task": null,
|
|
|
|
| 2635 |
"commonvoice_hours": 1360.0,
|
| 2636 |
"commonvoice_locale": "de",
|
| 2637 |
"in_benchmark": true,
|
| 2638 |
+
"task": "classification",
|
| 2639 |
+
"metric": "accuracy",
|
| 2640 |
+
"score": 0.6666666666666666,
|
| 2641 |
+
"model": 1.0
|
| 2642 |
+
},
|
| 2643 |
+
{
|
| 2644 |
+
"bcp_47": "de",
|
| 2645 |
+
"speakers": 136350226,
|
| 2646 |
+
"language_name": "German",
|
| 2647 |
+
"autonym": "Deutsch",
|
| 2648 |
+
"family": "Indo-European",
|
| 2649 |
+
"flores_path": "deu_Latn",
|
| 2650 |
+
"fleurs_tag": "de_de",
|
| 2651 |
+
"commonvoice_hours": 1360.0,
|
| 2652 |
+
"commonvoice_locale": "de",
|
| 2653 |
+
"in_benchmark": true,
|
| 2654 |
+
"task": "language_modeling",
|
| 2655 |
+
"metric": "chrf",
|
| 2656 |
+
"score": 0.9594656177914042,
|
| 2657 |
+
"model": 1.0
|
| 2658 |
+
},
|
| 2659 |
+
{
|
| 2660 |
+
"bcp_47": "de",
|
| 2661 |
+
"speakers": 136350226,
|
| 2662 |
+
"language_name": "German",
|
| 2663 |
+
"autonym": "Deutsch",
|
| 2664 |
+
"family": "Indo-European",
|
| 2665 |
+
"flores_path": "deu_Latn",
|
| 2666 |
+
"fleurs_tag": "de_de",
|
| 2667 |
+
"commonvoice_hours": 1360.0,
|
| 2668 |
+
"commonvoice_locale": "de",
|
| 2669 |
+
"in_benchmark": true,
|
| 2670 |
+
"task": "translation",
|
| 2671 |
+
"metric": "bleu",
|
| 2672 |
+
"score": 0.3207642359472324,
|
| 2673 |
+
"model": 1.0
|
| 2674 |
+
},
|
| 2675 |
+
{
|
| 2676 |
+
"bcp_47": "de",
|
| 2677 |
+
"speakers": 136350226,
|
| 2678 |
+
"language_name": "German",
|
| 2679 |
+
"autonym": "Deutsch",
|
| 2680 |
+
"family": "Indo-European",
|
| 2681 |
+
"flores_path": "deu_Latn",
|
| 2682 |
+
"fleurs_tag": "de_de",
|
| 2683 |
+
"commonvoice_hours": 1360.0,
|
| 2684 |
+
"commonvoice_locale": "de",
|
| 2685 |
+
"in_benchmark": true,
|
| 2686 |
+
"task": "translation",
|
| 2687 |
+
"metric": "chrf",
|
| 2688 |
+
"score": 0.49973270743869647,
|
| 2689 |
+
"model": 1.0
|
| 2690 |
},
|
| 2691 |
{
|
| 2692 |
"bcp_47": "den",
|
|
|
|
| 3021 |
"in_benchmark": true,
|
| 3022 |
"task": "language_modeling",
|
| 3023 |
"metric": "chrf",
|
| 3024 |
+
"score": 0.9180269549823046,
|
| 3025 |
"model": 12.0
|
| 3026 |
},
|
| 3027 |
{
|
|
|
|
| 3037 |
"in_benchmark": true,
|
| 3038 |
"task": "translation",
|
| 3039 |
"metric": "bleu",
|
| 3040 |
+
"score": 0.3703633711863608,
|
| 3041 |
"model": 12.0
|
| 3042 |
},
|
| 3043 |
{
|
|
|
|
| 3101 |
"in_benchmark": true,
|
| 3102 |
"task": "language_modeling",
|
| 3103 |
"metric": "chrf",
|
| 3104 |
+
"score": 0.9569342865902168,
|
| 3105 |
"model": 1.0
|
| 3106 |
},
|
| 3107 |
{
|
|
|
|
| 3176 |
"family": null,
|
| 3177 |
"flores_path": "eus_Latn",
|
| 3178 |
"fleurs_tag": null,
|
| 3179 |
+
"commonvoice_hours": 336.0,
|
| 3180 |
"commonvoice_locale": "eu",
|
| 3181 |
"in_benchmark": true,
|
| 3182 |
"task": null,
|
|
|
|
| 3227 |
"commonvoice_hours": 370.0,
|
| 3228 |
"commonvoice_locale": "fa",
|
| 3229 |
"in_benchmark": true,
|
| 3230 |
+
"task": "classification",
|
| 3231 |
+
"metric": "accuracy",
|
| 3232 |
+
"score": 0.4,
|
| 3233 |
+
"model": 1.0
|
| 3234 |
+
},
|
| 3235 |
+
{
|
| 3236 |
+
"bcp_47": "fa",
|
| 3237 |
+
"speakers": 84710459,
|
| 3238 |
+
"language_name": "Persian",
|
| 3239 |
+
"autonym": "فارسی",
|
| 3240 |
+
"family": "Indo-European",
|
| 3241 |
+
"flores_path": "pes_Arab",
|
| 3242 |
+
"fleurs_tag": "fa_ir",
|
| 3243 |
+
"commonvoice_hours": 370.0,
|
| 3244 |
+
"commonvoice_locale": "fa",
|
| 3245 |
+
"in_benchmark": true,
|
| 3246 |
+
"task": "language_modeling",
|
| 3247 |
+
"metric": "chrf",
|
| 3248 |
+
"score": 0.9414698824984596,
|
| 3249 |
+
"model": 1.0
|
| 3250 |
+
},
|
| 3251 |
+
{
|
| 3252 |
+
"bcp_47": "fa",
|
| 3253 |
+
"speakers": 84710459,
|
| 3254 |
+
"language_name": "Persian",
|
| 3255 |
+
"autonym": "فارسی",
|
| 3256 |
+
"family": "Indo-European",
|
| 3257 |
+
"flores_path": "pes_Arab",
|
| 3258 |
+
"fleurs_tag": "fa_ir",
|
| 3259 |
+
"commonvoice_hours": 370.0,
|
| 3260 |
+
"commonvoice_locale": "fa",
|
| 3261 |
+
"in_benchmark": true,
|
| 3262 |
+
"task": "translation",
|
| 3263 |
+
"metric": "bleu",
|
| 3264 |
+
"score": 0.26232478733341374,
|
| 3265 |
+
"model": 1.0
|
| 3266 |
+
},
|
| 3267 |
+
{
|
| 3268 |
+
"bcp_47": "fa",
|
| 3269 |
+
"speakers": 84710459,
|
| 3270 |
+
"language_name": "Persian",
|
| 3271 |
+
"autonym": "فارسی",
|
| 3272 |
+
"family": "Indo-European",
|
| 3273 |
+
"flores_path": "pes_Arab",
|
| 3274 |
+
"fleurs_tag": "fa_ir",
|
| 3275 |
+
"commonvoice_hours": 370.0,
|
| 3276 |
+
"commonvoice_locale": "fa",
|
| 3277 |
+
"in_benchmark": true,
|
| 3278 |
+
"task": "translation",
|
| 3279 |
+
"metric": "chrf",
|
| 3280 |
+
"score": 0.44641220608314985,
|
| 3281 |
+
"model": 1.0
|
| 3282 |
},
|
| 3283 |
{
|
| 3284 |
"bcp_47": "fan",
|
|
|
|
| 3387 |
"commonvoice_hours": 0.0,
|
| 3388 |
"commonvoice_locale": "tl",
|
| 3389 |
"in_benchmark": true,
|
| 3390 |
+
"task": "classification",
|
| 3391 |
+
"metric": "accuracy",
|
| 3392 |
+
"score": 0.43333333333333335,
|
| 3393 |
+
"model": 1.0
|
| 3394 |
+
},
|
| 3395 |
+
{
|
| 3396 |
+
"bcp_47": "fil",
|
| 3397 |
+
"speakers": 67471096,
|
| 3398 |
+
"language_name": "Filipino",
|
| 3399 |
+
"autonym": "Filipino",
|
| 3400 |
+
"family": "Austronesian",
|
| 3401 |
+
"flores_path": "fil_Latn",
|
| 3402 |
+
"fleurs_tag": "fil_ph",
|
| 3403 |
+
"commonvoice_hours": 0.0,
|
| 3404 |
+
"commonvoice_locale": "tl",
|
| 3405 |
+
"in_benchmark": true,
|
| 3406 |
+
"task": "language_modeling",
|
| 3407 |
+
"metric": "chrf",
|
| 3408 |
+
"score": 0.9402707475255596,
|
| 3409 |
+
"model": 1.0
|
| 3410 |
+
},
|
| 3411 |
+
{
|
| 3412 |
+
"bcp_47": "fil",
|
| 3413 |
+
"speakers": 67471096,
|
| 3414 |
+
"language_name": "Filipino",
|
| 3415 |
+
"autonym": "Filipino",
|
| 3416 |
+
"family": "Austronesian",
|
| 3417 |
+
"flores_path": "fil_Latn",
|
| 3418 |
+
"fleurs_tag": "fil_ph",
|
| 3419 |
+
"commonvoice_hours": 0.0,
|
| 3420 |
+
"commonvoice_locale": "tl",
|
| 3421 |
+
"in_benchmark": true,
|
| 3422 |
+
"task": "translation",
|
| 3423 |
+
"metric": "bleu",
|
| 3424 |
+
"score": 0.29097818784870333,
|
| 3425 |
+
"model": 1.0
|
| 3426 |
+
},
|
| 3427 |
+
{
|
| 3428 |
+
"bcp_47": "fil",
|
| 3429 |
+
"speakers": 67471096,
|
| 3430 |
+
"language_name": "Filipino",
|
| 3431 |
+
"autonym": "Filipino",
|
| 3432 |
+
"family": "Austronesian",
|
| 3433 |
+
"flores_path": "fil_Latn",
|
| 3434 |
+
"fleurs_tag": "fil_ph",
|
| 3435 |
+
"commonvoice_hours": 0.0,
|
| 3436 |
+
"commonvoice_locale": "tl",
|
| 3437 |
+
"in_benchmark": true,
|
| 3438 |
+
"task": "translation",
|
| 3439 |
+
"metric": "chrf",
|
| 3440 |
+
"score": 0.44978114149245985,
|
| 3441 |
+
"model": 1.0
|
| 3442 |
},
|
| 3443 |
{
|
| 3444 |
"bcp_47": "fit",
|
|
|
|
| 3533 |
"in_benchmark": true,
|
| 3534 |
"task": "language_modeling",
|
| 3535 |
"metric": "chrf",
|
| 3536 |
+
"score": 0.9815706066541411,
|
| 3537 |
"model": 1.0
|
| 3538 |
},
|
| 3539 |
{
|
|
|
|
| 3736 |
"family": "Indo-European",
|
| 3737 |
"flores_path": "gle_Latn",
|
| 3738 |
"fleurs_tag": "ga_ie",
|
| 3739 |
+
"commonvoice_hours": 6.0,
|
| 3740 |
"commonvoice_locale": "ga-IE",
|
| 3741 |
"in_benchmark": true,
|
| 3742 |
"task": null,
|
|
|
|
| 4091 |
"commonvoice_hours": 0.0,
|
| 4092 |
"commonvoice_locale": "gu-IN",
|
| 4093 |
"in_benchmark": true,
|
| 4094 |
+
"task": "classification",
|
| 4095 |
+
"metric": "accuracy",
|
| 4096 |
+
"score": 0.43333333333333335,
|
| 4097 |
+
"model": 1.0
|
| 4098 |
},
|
| 4099 |
{
|
| 4100 |
+
"bcp_47": "gu",
|
| 4101 |
+
"speakers": 61721799,
|
| 4102 |
+
"language_name": "Gujarati",
|
| 4103 |
+
"autonym": "ગુજરાતી",
|
| 4104 |
+
"family": "Indo-European",
|
| 4105 |
+
"flores_path": "guj_Gujr",
|
| 4106 |
+
"fleurs_tag": "gu_in",
|
| 4107 |
+
"commonvoice_hours": 0.0,
|
| 4108 |
+
"commonvoice_locale": "gu-IN",
|
| 4109 |
+
"in_benchmark": true,
|
| 4110 |
+
"task": "language_modeling",
|
| 4111 |
+
"metric": "chrf",
|
| 4112 |
+
"score": 0.938086045460355,
|
| 4113 |
+
"model": 1.0
|
| 4114 |
},
|
| 4115 |
{
|
| 4116 |
+
"bcp_47": "gu",
|
| 4117 |
+
"speakers": 61721799,
|
| 4118 |
+
"language_name": "Gujarati",
|
| 4119 |
+
"autonym": "ગુજરાતી",
|
| 4120 |
+
"family": "Indo-European",
|
| 4121 |
+
"flores_path": "guj_Gujr",
|
| 4122 |
+
"fleurs_tag": "gu_in",
|
| 4123 |
+
"commonvoice_hours": 0.0,
|
| 4124 |
+
"commonvoice_locale": "gu-IN",
|
| 4125 |
+
"in_benchmark": true,
|
| 4126 |
+
"task": "translation",
|
| 4127 |
+
"metric": "bleu",
|
| 4128 |
+
"score": 0.26442484966880464,
|
| 4129 |
+
"model": 1.0
|
| 4130 |
+
},
|
| 4131 |
+
{
|
| 4132 |
+
"bcp_47": "gu",
|
| 4133 |
+
"speakers": 61721799,
|
| 4134 |
+
"language_name": "Gujarati",
|
| 4135 |
+
"autonym": "ગુજરાતી",
|
| 4136 |
+
"family": "Indo-European",
|
| 4137 |
+
"flores_path": "guj_Gujr",
|
| 4138 |
+
"fleurs_tag": "gu_in",
|
| 4139 |
+
"commonvoice_hours": 0.0,
|
| 4140 |
+
"commonvoice_locale": "gu-IN",
|
| 4141 |
+
"in_benchmark": true,
|
| 4142 |
+
"task": "translation",
|
| 4143 |
+
"metric": "chrf",
|
| 4144 |
+
"score": 0.44452182973195975,
|
| 4145 |
+
"model": 1.0
|
| 4146 |
+
},
|
| 4147 |
+
{
|
| 4148 |
+
"bcp_47": "gub",
|
| 4149 |
+
"speakers": 17784,
|
| 4150 |
+
"language_name": "Guajajára",
|
| 4151 |
+
"autonym": "Guajajára",
|
| 4152 |
+
"family": "Tupian",
|
| 4153 |
+
"flores_path": null,
|
| 4154 |
+
"fleurs_tag": null,
|
| 4155 |
+
"commonvoice_hours": null,
|
| 4156 |
+
"commonvoice_locale": null,
|
| 4157 |
+
"in_benchmark": false,
|
| 4158 |
+
"task": null,
|
| 4159 |
+
"metric": null,
|
| 4160 |
+
"score": null,
|
| 4161 |
+
"model": null
|
| 4162 |
+
},
|
| 4163 |
+
{
|
| 4164 |
+
"bcp_47": "guc",
|
| 4165 |
+
"speakers": 132529,
|
| 4166 |
+
"language_name": "Wayuu",
|
| 4167 |
+
"autonym": "Wayuu",
|
| 4168 |
+
"family": "Arawakan",
|
| 4169 |
+
"flores_path": null,
|
| 4170 |
+
"fleurs_tag": null,
|
| 4171 |
+
"commonvoice_hours": 0.0,
|
| 4172 |
"commonvoice_locale": "guc",
|
| 4173 |
"in_benchmark": false,
|
| 4174 |
"task": null,
|
|
|
|
| 4365 |
"in_benchmark": true,
|
| 4366 |
"task": "language_modeling",
|
| 4367 |
"metric": "chrf",
|
| 4368 |
+
"score": 0.9428185393832219,
|
| 4369 |
"model": 1.0
|
| 4370 |
},
|
| 4371 |
{
|
|
|
|
| 4747 |
"commonvoice_hours": 33.0,
|
| 4748 |
"commonvoice_locale": "id",
|
| 4749 |
"in_benchmark": true,
|
| 4750 |
+
"task": "classification",
|
| 4751 |
+
"metric": "accuracy",
|
| 4752 |
+
"score": 0.6333333333333333,
|
| 4753 |
+
"model": 1.0
|
| 4754 |
+
},
|
| 4755 |
+
{
|
| 4756 |
+
"bcp_47": "id",
|
| 4757 |
+
"speakers": 171207687,
|
| 4758 |
+
"language_name": "Indonesian",
|
| 4759 |
+
"autonym": "Bahasa Indonesia",
|
| 4760 |
+
"family": "Austronesian",
|
| 4761 |
+
"flores_path": "ind_Latn",
|
| 4762 |
+
"fleurs_tag": "id_id",
|
| 4763 |
+
"commonvoice_hours": 33.0,
|
| 4764 |
+
"commonvoice_locale": "id",
|
| 4765 |
+
"in_benchmark": true,
|
| 4766 |
+
"task": "language_modeling",
|
| 4767 |
+
"metric": "chrf",
|
| 4768 |
+
"score": 0.9598314474300775,
|
| 4769 |
+
"model": 1.0
|
| 4770 |
+
},
|
| 4771 |
+
{
|
| 4772 |
+
"bcp_47": "id",
|
| 4773 |
+
"speakers": 171207687,
|
| 4774 |
+
"language_name": "Indonesian",
|
| 4775 |
+
"autonym": "Bahasa Indonesia",
|
| 4776 |
+
"family": "Austronesian",
|
| 4777 |
+
"flores_path": "ind_Latn",
|
| 4778 |
+
"fleurs_tag": "id_id",
|
| 4779 |
+
"commonvoice_hours": 33.0,
|
| 4780 |
+
"commonvoice_locale": "id",
|
| 4781 |
+
"in_benchmark": true,
|
| 4782 |
+
"task": "translation",
|
| 4783 |
+
"metric": "bleu",
|
| 4784 |
+
"score": 0.29354203311552335,
|
| 4785 |
+
"model": 1.0
|
| 4786 |
+
},
|
| 4787 |
+
{
|
| 4788 |
+
"bcp_47": "id",
|
| 4789 |
+
"speakers": 171207687,
|
| 4790 |
+
"language_name": "Indonesian",
|
| 4791 |
+
"autonym": "Bahasa Indonesia",
|
| 4792 |
+
"family": "Austronesian",
|
| 4793 |
+
"flores_path": "ind_Latn",
|
| 4794 |
+
"fleurs_tag": "id_id",
|
| 4795 |
+
"commonvoice_hours": 33.0,
|
| 4796 |
+
"commonvoice_locale": "id",
|
| 4797 |
+
"in_benchmark": true,
|
| 4798 |
+
"task": "translation",
|
| 4799 |
+
"metric": "chrf",
|
| 4800 |
+
"score": 0.4723493656022861,
|
| 4801 |
+
"model": 1.0
|
| 4802 |
},
|
| 4803 |
{
|
| 4804 |
"bcp_47": "ie",
|
|
|
|
| 4955 |
"commonvoice_hours": 362.0,
|
| 4956 |
"commonvoice_locale": "it",
|
| 4957 |
"in_benchmark": true,
|
| 4958 |
+
"task": "classification",
|
| 4959 |
+
"metric": "accuracy",
|
| 4960 |
+
"score": 0.6666666666666666,
|
| 4961 |
+
"model": 1.0
|
| 4962 |
+
},
|
| 4963 |
+
{
|
| 4964 |
+
"bcp_47": "it",
|
| 4965 |
+
"speakers": 70247060,
|
| 4966 |
+
"language_name": "Italian",
|
| 4967 |
+
"autonym": "Italiano",
|
| 4968 |
+
"family": "Indo-European",
|
| 4969 |
+
"flores_path": "ita_Latn",
|
| 4970 |
+
"fleurs_tag": "it_it",
|
| 4971 |
+
"commonvoice_hours": 362.0,
|
| 4972 |
+
"commonvoice_locale": "it",
|
| 4973 |
+
"in_benchmark": true,
|
| 4974 |
+
"task": "language_modeling",
|
| 4975 |
+
"metric": "chrf",
|
| 4976 |
+
"score": 0.9439490413212892,
|
| 4977 |
+
"model": 1.0
|
| 4978 |
+
},
|
| 4979 |
+
{
|
| 4980 |
+
"bcp_47": "it",
|
| 4981 |
+
"speakers": 70247060,
|
| 4982 |
+
"language_name": "Italian",
|
| 4983 |
+
"autonym": "Italiano",
|
| 4984 |
+
"family": "Indo-European",
|
| 4985 |
+
"flores_path": "ita_Latn",
|
| 4986 |
+
"fleurs_tag": "it_it",
|
| 4987 |
+
"commonvoice_hours": 362.0,
|
| 4988 |
+
"commonvoice_locale": "it",
|
| 4989 |
+
"in_benchmark": true,
|
| 4990 |
+
"task": "translation",
|
| 4991 |
+
"metric": "bleu",
|
| 4992 |
+
"score": 0.28142583904826096,
|
| 4993 |
+
"model": 1.0
|
| 4994 |
+
},
|
| 4995 |
+
{
|
| 4996 |
+
"bcp_47": "it",
|
| 4997 |
+
"speakers": 70247060,
|
| 4998 |
+
"language_name": "Italian",
|
| 4999 |
+
"autonym": "Italiano",
|
| 5000 |
+
"family": "Indo-European",
|
| 5001 |
+
"flores_path": "ita_Latn",
|
| 5002 |
+
"fleurs_tag": "it_it",
|
| 5003 |
+
"commonvoice_hours": 362.0,
|
| 5004 |
+
"commonvoice_locale": "it",
|
| 5005 |
+
"in_benchmark": true,
|
| 5006 |
+
"task": "translation",
|
| 5007 |
+
"metric": "chrf",
|
| 5008 |
+
"score": 0.4707591889357925,
|
| 5009 |
+
"model": 1.0
|
| 5010 |
},
|
| 5011 |
{
|
| 5012 |
"bcp_47": "iu",
|
|
|
|
| 5051 |
"commonvoice_hours": 222.0,
|
| 5052 |
"commonvoice_locale": "ja",
|
| 5053 |
"in_benchmark": true,
|
| 5054 |
+
"task": "classification",
|
| 5055 |
+
"metric": "accuracy",
|
| 5056 |
+
"score": 0.6333333333333333,
|
| 5057 |
+
"model": 1.0
|
| 5058 |
+
},
|
| 5059 |
+
{
|
| 5060 |
+
"bcp_47": "ja",
|
| 5061 |
+
"speakers": 119729026,
|
| 5062 |
+
"language_name": "Japanese",
|
| 5063 |
+
"autonym": "日本語",
|
| 5064 |
+
"family": "Japonic",
|
| 5065 |
+
"flores_path": "jpn_Jpan",
|
| 5066 |
+
"fleurs_tag": "ja_jp",
|
| 5067 |
+
"commonvoice_hours": 222.0,
|
| 5068 |
+
"commonvoice_locale": "ja",
|
| 5069 |
+
"in_benchmark": true,
|
| 5070 |
+
"task": "language_modeling",
|
| 5071 |
+
"metric": "chrf",
|
| 5072 |
+
"score": 0.9371132855221468,
|
| 5073 |
+
"model": 1.0
|
| 5074 |
+
},
|
| 5075 |
+
{
|
| 5076 |
+
"bcp_47": "ja",
|
| 5077 |
+
"speakers": 119729026,
|
| 5078 |
+
"language_name": "Japanese",
|
| 5079 |
+
"autonym": "日本語",
|
| 5080 |
+
"family": "Japonic",
|
| 5081 |
+
"flores_path": "jpn_Jpan",
|
| 5082 |
+
"fleurs_tag": "ja_jp",
|
| 5083 |
+
"commonvoice_hours": 222.0,
|
| 5084 |
+
"commonvoice_locale": "ja",
|
| 5085 |
+
"in_benchmark": true,
|
| 5086 |
+
"task": "translation",
|
| 5087 |
+
"metric": "bleu",
|
| 5088 |
+
"score": 0.2723410893967824,
|
| 5089 |
+
"model": 1.0
|
| 5090 |
+
},
|
| 5091 |
+
{
|
| 5092 |
+
"bcp_47": "ja",
|
| 5093 |
+
"speakers": 119729026,
|
| 5094 |
+
"language_name": "Japanese",
|
| 5095 |
+
"autonym": "日本語",
|
| 5096 |
+
"family": "Japonic",
|
| 5097 |
+
"flores_path": "jpn_Jpan",
|
| 5098 |
+
"fleurs_tag": "ja_jp",
|
| 5099 |
+
"commonvoice_hours": 222.0,
|
| 5100 |
+
"commonvoice_locale": "ja",
|
| 5101 |
+
"in_benchmark": true,
|
| 5102 |
+
"task": "translation",
|
| 5103 |
+
"metric": "chrf",
|
| 5104 |
+
"score": 0.43929453749366865,
|
| 5105 |
+
"model": 1.0
|
| 5106 |
},
|
| 5107 |
{
|
| 5108 |
"bcp_47": "jam",
|
|
|
|
| 5211 |
"commonvoice_hours": 0.0,
|
| 5212 |
"commonvoice_locale": "jv",
|
| 5213 |
"in_benchmark": true,
|
| 5214 |
+
"task": "classification",
|
| 5215 |
+
"metric": "accuracy",
|
| 5216 |
+
"score": 0.4666666666666667,
|
| 5217 |
+
"model": 1.0
|
| 5218 |
},
|
| 5219 |
{
|
| 5220 |
+
"bcp_47": "jv",
|
| 5221 |
+
"speakers": 91180665,
|
| 5222 |
+
"language_name": "Javanese",
|
| 5223 |
+
"autonym": "Jawa",
|
| 5224 |
+
"family": "Austronesian",
|
| 5225 |
+
"flores_path": "jav_Latn",
|
| 5226 |
+
"fleurs_tag": "jv_id",
|
| 5227 |
+
"commonvoice_hours": 0.0,
|
| 5228 |
+
"commonvoice_locale": "jv",
|
| 5229 |
"in_benchmark": true,
|
| 5230 |
+
"task": "language_modeling",
|
| 5231 |
+
"metric": "chrf",
|
| 5232 |
+
"score": 0.9298143194922116,
|
| 5233 |
+
"model": 1.0
|
| 5234 |
},
|
| 5235 |
{
|
| 5236 |
+
"bcp_47": "jv",
|
| 5237 |
+
"speakers": 91180665,
|
| 5238 |
+
"language_name": "Javanese",
|
| 5239 |
+
"autonym": "Jawa",
|
| 5240 |
+
"family": "Austronesian",
|
| 5241 |
+
"flores_path": "jav_Latn",
|
| 5242 |
+
"fleurs_tag": "jv_id",
|
| 5243 |
+
"commonvoice_hours": 0.0,
|
| 5244 |
+
"commonvoice_locale": "jv",
|
| 5245 |
+
"in_benchmark": true,
|
| 5246 |
+
"task": "translation",
|
| 5247 |
+
"metric": "bleu",
|
| 5248 |
+
"score": 0.23729186537968905,
|
| 5249 |
+
"model": 1.0
|
| 5250 |
+
},
|
| 5251 |
+
{
|
| 5252 |
+
"bcp_47": "jv",
|
| 5253 |
+
"speakers": 91180665,
|
| 5254 |
+
"language_name": "Javanese",
|
| 5255 |
+
"autonym": "Jawa",
|
| 5256 |
+
"family": "Austronesian",
|
| 5257 |
+
"flores_path": "jav_Latn",
|
| 5258 |
+
"fleurs_tag": "jv_id",
|
| 5259 |
+
"commonvoice_hours": 0.0,
|
| 5260 |
+
"commonvoice_locale": "jv",
|
| 5261 |
+
"in_benchmark": true,
|
| 5262 |
+
"task": "translation",
|
| 5263 |
+
"metric": "chrf",
|
| 5264 |
+
"score": 0.4198940727847352,
|
| 5265 |
+
"model": 1.0
|
| 5266 |
+
},
|
| 5267 |
+
{
|
| 5268 |
+
"bcp_47": "ka",
|
| 5269 |
+
"speakers": 3543646,
|
| 5270 |
+
"language_name": "Georgian",
|
| 5271 |
+
"autonym": "ქართული",
|
| 5272 |
+
"family": "Kartvelian",
|
| 5273 |
+
"flores_path": "kat_Geor",
|
| 5274 |
+
"fleurs_tag": "ka_ge",
|
| 5275 |
+
"commonvoice_hours": 158.0,
|
| 5276 |
+
"commonvoice_locale": "ka",
|
| 5277 |
+
"in_benchmark": true,
|
| 5278 |
+
"task": null,
|
| 5279 |
+
"metric": null,
|
| 5280 |
+
"score": null,
|
| 5281 |
+
"model": null
|
| 5282 |
+
},
|
| 5283 |
+
{
|
| 5284 |
+
"bcp_47": "kaa",
|
| 5285 |
+
"speakers": 489046,
|
| 5286 |
+
"language_name": "Kara-Kalpak",
|
| 5287 |
+
"autonym": "Kara-Kalpak",
|
| 5288 |
+
"family": "Turkic",
|
| 5289 |
+
"flores_path": null,
|
| 5290 |
+
"fleurs_tag": null,
|
| 5291 |
+
"commonvoice_hours": 0.0,
|
| 5292 |
+
"commonvoice_locale": "kaa",
|
| 5293 |
+
"in_benchmark": false,
|
| 5294 |
+
"task": null,
|
| 5295 |
"metric": null,
|
| 5296 |
"score": null,
|
| 5297 |
"model": null
|
|
|
|
| 5384 |
"family": "Abkhaz-Adyge",
|
| 5385 |
"flores_path": null,
|
| 5386 |
"fleurs_tag": null,
|
| 5387 |
+
"commonvoice_hours": 19.0,
|
| 5388 |
"commonvoice_locale": "kbd",
|
| 5389 |
"in_benchmark": false,
|
| 5390 |
"task": null,
|
|
|
|
| 5883 |
"commonvoice_hours": 1.7,
|
| 5884 |
"commonvoice_locale": "ko",
|
| 5885 |
"in_benchmark": true,
|
| 5886 |
+
"task": "classification",
|
| 5887 |
+
"metric": "accuracy",
|
| 5888 |
+
"score": 0.5333333333333333,
|
| 5889 |
+
"model": 1.0
|
| 5890 |
+
},
|
| 5891 |
+
{
|
| 5892 |
+
"bcp_47": "ko",
|
| 5893 |
+
"speakers": 78357046,
|
| 5894 |
+
"language_name": "Korean",
|
| 5895 |
+
"autonym": "한국어",
|
| 5896 |
+
"family": "Koreanic",
|
| 5897 |
+
"flores_path": "kor_Hang",
|
| 5898 |
+
"fleurs_tag": "ko_kr",
|
| 5899 |
+
"commonvoice_hours": 1.7,
|
| 5900 |
+
"commonvoice_locale": "ko",
|
| 5901 |
+
"in_benchmark": true,
|
| 5902 |
+
"task": "language_modeling",
|
| 5903 |
+
"metric": "chrf",
|
| 5904 |
+
"score": 0.9355445912073929,
|
| 5905 |
+
"model": 1.0
|
| 5906 |
+
},
|
| 5907 |
+
{
|
| 5908 |
+
"bcp_47": "ko",
|
| 5909 |
+
"speakers": 78357046,
|
| 5910 |
+
"language_name": "Korean",
|
| 5911 |
+
"autonym": "한국어",
|
| 5912 |
+
"family": "Koreanic",
|
| 5913 |
+
"flores_path": "kor_Hang",
|
| 5914 |
+
"fleurs_tag": "ko_kr",
|
| 5915 |
+
"commonvoice_hours": 1.7,
|
| 5916 |
+
"commonvoice_locale": "ko",
|
| 5917 |
+
"in_benchmark": true,
|
| 5918 |
+
"task": "translation",
|
| 5919 |
+
"metric": "bleu",
|
| 5920 |
+
"score": 0.20332074778330964,
|
| 5921 |
+
"model": 1.0
|
| 5922 |
+
},
|
| 5923 |
+
{
|
| 5924 |
+
"bcp_47": "ko",
|
| 5925 |
+
"speakers": 78357046,
|
| 5926 |
+
"language_name": "Korean",
|
| 5927 |
+
"autonym": "한국어",
|
| 5928 |
+
"family": "Koreanic",
|
| 5929 |
+
"flores_path": "kor_Hang",
|
| 5930 |
+
"fleurs_tag": "ko_kr",
|
| 5931 |
+
"commonvoice_hours": 1.7,
|
| 5932 |
+
"commonvoice_locale": "ko",
|
| 5933 |
+
"in_benchmark": true,
|
| 5934 |
+
"task": "translation",
|
| 5935 |
+
"metric": "chrf",
|
| 5936 |
+
"score": 0.4005255477730261,
|
| 5937 |
+
"model": 1.0
|
| 5938 |
},
|
| 5939 |
{
|
| 5940 |
"bcp_47": "koi",
|
|
|
|
| 6232 |
"family": "Indo-European",
|
| 6233 |
"flores_path": null,
|
| 6234 |
"fleurs_tag": null,
|
| 6235 |
+
"commonvoice_hours": 8.1,
|
| 6236 |
"commonvoice_locale": "kw",
|
| 6237 |
"in_benchmark": false,
|
| 6238 |
"task": null,
|
|
|
|
| 7352 |
"family": "Indo-European",
|
| 7353 |
"flores_path": "mkd_Cyrl",
|
| 7354 |
"fleurs_tag": "mk_mk",
|
| 7355 |
+
"commonvoice_hours": 19.0,
|
| 7356 |
"commonvoice_locale": "mk",
|
| 7357 |
"in_benchmark": true,
|
| 7358 |
"task": null,
|
|
|
|
| 7499 |
"commonvoice_hours": 20.0,
|
| 7500 |
"commonvoice_locale": "mr",
|
| 7501 |
"in_benchmark": true,
|
| 7502 |
+
"task": "classification",
|
| 7503 |
+
"metric": "accuracy",
|
| 7504 |
+
"score": 0.6333333333333333,
|
| 7505 |
+
"model": 1.0
|
| 7506 |
+
},
|
| 7507 |
+
{
|
| 7508 |
+
"bcp_47": "mr",
|
| 7509 |
+
"speakers": 92826300,
|
| 7510 |
+
"language_name": "Marathi",
|
| 7511 |
+
"autonym": "मराठी",
|
| 7512 |
+
"family": "Indo-European",
|
| 7513 |
+
"flores_path": "mar_Deva",
|
| 7514 |
+
"fleurs_tag": "mr_in",
|
| 7515 |
+
"commonvoice_hours": 20.0,
|
| 7516 |
+
"commonvoice_locale": "mr",
|
| 7517 |
+
"in_benchmark": true,
|
| 7518 |
+
"task": "language_modeling",
|
| 7519 |
+
"metric": "chrf",
|
| 7520 |
+
"score": 0.9440892312053646,
|
| 7521 |
+
"model": 1.0
|
| 7522 |
+
},
|
| 7523 |
+
{
|
| 7524 |
+
"bcp_47": "mr",
|
| 7525 |
+
"speakers": 92826300,
|
| 7526 |
+
"language_name": "Marathi",
|
| 7527 |
+
"autonym": "मराठी",
|
| 7528 |
+
"family": "Indo-European",
|
| 7529 |
+
"flores_path": "mar_Deva",
|
| 7530 |
+
"fleurs_tag": "mr_in",
|
| 7531 |
+
"commonvoice_hours": 20.0,
|
| 7532 |
+
"commonvoice_locale": "mr",
|
| 7533 |
+
"in_benchmark": true,
|
| 7534 |
+
"task": "translation",
|
| 7535 |
+
"metric": "bleu",
|
| 7536 |
+
"score": 0.24903049799655144,
|
| 7537 |
+
"model": 1.0
|
| 7538 |
+
},
|
| 7539 |
+
{
|
| 7540 |
+
"bcp_47": "mr",
|
| 7541 |
+
"speakers": 92826300,
|
| 7542 |
+
"language_name": "Marathi",
|
| 7543 |
+
"autonym": "मराठी",
|
| 7544 |
+
"family": "Indo-European",
|
| 7545 |
+
"flores_path": "mar_Deva",
|
| 7546 |
+
"fleurs_tag": "mr_in",
|
| 7547 |
+
"commonvoice_hours": 20.0,
|
| 7548 |
+
"commonvoice_locale": "mr",
|
| 7549 |
+
"in_benchmark": true,
|
| 7550 |
+
"task": "translation",
|
| 7551 |
+
"metric": "chrf",
|
| 7552 |
+
"score": 0.42489125861884175,
|
| 7553 |
+
"model": 1.0
|
| 7554 |
},
|
| 7555 |
{
|
| 7556 |
"bcp_47": "mrd",
|
|
|
|
| 8504 |
"family": "Indo-European",
|
| 8505 |
"flores_path": null,
|
| 8506 |
"fleurs_tag": null,
|
| 8507 |
+
"commonvoice_hours": 0.8,
|
| 8508 |
"commonvoice_locale": "os",
|
| 8509 |
"in_benchmark": false,
|
| 8510 |
"task": null,
|
|
|
|
| 8557 |
"in_benchmark": true,
|
| 8558 |
"task": "language_modeling",
|
| 8559 |
"metric": "chrf",
|
| 8560 |
+
"score": 0.9025298113664532,
|
| 8561 |
"model": 1.0
|
| 8562 |
},
|
| 8563 |
{
|
|
|
|
| 8925 |
"in_benchmark": true,
|
| 8926 |
"task": "language_modeling",
|
| 8927 |
"metric": "chrf",
|
| 8928 |
+
"score": 0.9641423549595803,
|
| 8929 |
"model": 1.0
|
| 8930 |
},
|
| 8931 |
{
|
|
|
|
| 9352 |
"family": "Indo-European",
|
| 9353 |
"flores_path": "rus_Cyrl",
|
| 9354 |
"fleurs_tag": "ru_ru",
|
| 9355 |
+
"commonvoice_hours": 243.0,
|
| 9356 |
"commonvoice_locale": "ru",
|
| 9357 |
"in_benchmark": true,
|
| 9358 |
+
"task": "classification",
|
| 9359 |
+
"metric": "accuracy",
|
| 9360 |
+
"score": 0.5666666666666667,
|
| 9361 |
+
"model": 1.0
|
| 9362 |
+
},
|
| 9363 |
+
{
|
| 9364 |
+
"bcp_47": "ru",
|
| 9365 |
+
"speakers": 195841151,
|
| 9366 |
+
"language_name": "Russian",
|
| 9367 |
+
"autonym": "Русский",
|
| 9368 |
+
"family": "Indo-European",
|
| 9369 |
+
"flores_path": "rus_Cyrl",
|
| 9370 |
+
"fleurs_tag": "ru_ru",
|
| 9371 |
+
"commonvoice_hours": 243.0,
|
| 9372 |
+
"commonvoice_locale": "ru",
|
| 9373 |
+
"in_benchmark": true,
|
| 9374 |
+
"task": "language_modeling",
|
| 9375 |
+
"metric": "chrf",
|
| 9376 |
+
"score": 0.9663696817874857,
|
| 9377 |
+
"model": 1.0
|
| 9378 |
+
},
|
| 9379 |
+
{
|
| 9380 |
+
"bcp_47": "ru",
|
| 9381 |
+
"speakers": 195841151,
|
| 9382 |
+
"language_name": "Russian",
|
| 9383 |
+
"autonym": "Русский",
|
| 9384 |
+
"family": "Indo-European",
|
| 9385 |
+
"flores_path": "rus_Cyrl",
|
| 9386 |
+
"fleurs_tag": "ru_ru",
|
| 9387 |
+
"commonvoice_hours": 243.0,
|
| 9388 |
+
"commonvoice_locale": "ru",
|
| 9389 |
+
"in_benchmark": true,
|
| 9390 |
+
"task": "translation",
|
| 9391 |
+
"metric": "bleu",
|
| 9392 |
+
"score": 0.26015179309825326,
|
| 9393 |
+
"model": 1.0
|
| 9394 |
+
},
|
| 9395 |
+
{
|
| 9396 |
+
"bcp_47": "ru",
|
| 9397 |
+
"speakers": 195841151,
|
| 9398 |
+
"language_name": "Russian",
|
| 9399 |
+
"autonym": "Русский",
|
| 9400 |
+
"family": "Indo-European",
|
| 9401 |
+
"flores_path": "rus_Cyrl",
|
| 9402 |
+
"fleurs_tag": "ru_ru",
|
| 9403 |
+
"commonvoice_hours": 243.0,
|
| 9404 |
+
"commonvoice_locale": "ru",
|
| 9405 |
+
"in_benchmark": true,
|
| 9406 |
+
"task": "translation",
|
| 9407 |
+
"metric": "chrf",
|
| 9408 |
+
"score": 0.4525762744858351,
|
| 9409 |
+
"model": 1.0
|
| 9410 |
},
|
| 9411 |
{
|
| 9412 |
"bcp_47": "rue",
|
|
|
|
| 9800 |
"family": null,
|
| 9801 |
"flores_path": null,
|
| 9802 |
"fleurs_tag": null,
|
| 9803 |
+
"commonvoice_hours": 2.5,
|
| 9804 |
"commonvoice_locale": "sei",
|
| 9805 |
"in_benchmark": false,
|
| 9806 |
"task": null,
|
|
|
|
| 10379 |
"commonvoice_hours": 411.0,
|
| 10380 |
"commonvoice_locale": "sw",
|
| 10381 |
"in_benchmark": true,
|
| 10382 |
+
"task": "classification",
|
| 10383 |
+
"metric": "accuracy",
|
| 10384 |
+
"score": 0.5666666666666667,
|
| 10385 |
+
"model": 1.0
|
| 10386 |
},
|
| 10387 |
{
|
| 10388 |
+
"bcp_47": "sw",
|
| 10389 |
+
"speakers": 171610296,
|
| 10390 |
+
"language_name": "Swahili",
|
| 10391 |
+
"autonym": "Kiswahili",
|
| 10392 |
"family": "Atlantic-Congo",
|
| 10393 |
+
"flores_path": "swh_Latn",
|
| 10394 |
+
"fleurs_tag": "sw_ke",
|
| 10395 |
+
"commonvoice_hours": 411.0,
|
| 10396 |
+
"commonvoice_locale": "sw",
|
| 10397 |
+
"in_benchmark": true,
|
| 10398 |
+
"task": "language_modeling",
|
| 10399 |
+
"metric": "chrf",
|
| 10400 |
+
"score": 0.9401745263817055,
|
| 10401 |
+
"model": 1.0
|
| 10402 |
},
|
| 10403 |
{
|
| 10404 |
+
"bcp_47": "sw",
|
| 10405 |
+
"speakers": 171610296,
|
| 10406 |
+
"language_name": "Swahili",
|
| 10407 |
+
"autonym": "Kiswahili",
|
| 10408 |
+
"family": "Atlantic-Congo",
|
| 10409 |
+
"flores_path": "swh_Latn",
|
| 10410 |
+
"fleurs_tag": "sw_ke",
|
| 10411 |
+
"commonvoice_hours": 411.0,
|
| 10412 |
+
"commonvoice_locale": "sw",
|
| 10413 |
+
"in_benchmark": true,
|
| 10414 |
+
"task": "translation",
|
| 10415 |
+
"metric": "bleu",
|
| 10416 |
+
"score": 0.30022614000139736,
|
| 10417 |
+
"model": 1.0
|
| 10418 |
+
},
|
| 10419 |
+
{
|
| 10420 |
+
"bcp_47": "sw",
|
| 10421 |
+
"speakers": 171610296,
|
| 10422 |
+
"language_name": "Swahili",
|
| 10423 |
+
"autonym": "Kiswahili",
|
| 10424 |
+
"family": "Atlantic-Congo",
|
| 10425 |
+
"flores_path": "swh_Latn",
|
| 10426 |
+
"fleurs_tag": "sw_ke",
|
| 10427 |
+
"commonvoice_hours": 411.0,
|
| 10428 |
+
"commonvoice_locale": "sw",
|
| 10429 |
+
"in_benchmark": true,
|
| 10430 |
+
"task": "translation",
|
| 10431 |
+
"metric": "chrf",
|
| 10432 |
+
"score": 0.46620999112028233,
|
| 10433 |
+
"model": 1.0
|
| 10434 |
+
},
|
| 10435 |
+
{
|
| 10436 |
+
"bcp_47": "swb",
|
| 10437 |
+
"speakers": 170720,
|
| 10438 |
+
"language_name": "Comorian",
|
| 10439 |
+
"autonym": "Comorian",
|
| 10440 |
+
"family": "Atlantic-Congo",
|
| 10441 |
+
"flores_path": null,
|
| 10442 |
+
"fleurs_tag": null,
|
| 10443 |
+
"commonvoice_hours": null,
|
| 10444 |
+
"commonvoice_locale": null,
|
| 10445 |
+
"in_benchmark": false,
|
| 10446 |
+
"task": null,
|
| 10447 |
+
"metric": null,
|
| 10448 |
+
"score": null,
|
| 10449 |
+
"model": null
|
| 10450 |
+
},
|
| 10451 |
+
{
|
| 10452 |
+
"bcp_47": "swg",
|
| 10453 |
+
"speakers": 801597,
|
| 10454 |
+
"language_name": "Swabian",
|
| 10455 |
+
"autonym": "Swabian",
|
| 10456 |
"family": "Indo-European",
|
| 10457 |
"flores_path": null,
|
| 10458 |
"fleurs_tag": null,
|
|
|
|
| 10555 |
"commonvoice_hours": 234.0,
|
| 10556 |
"commonvoice_locale": "ta",
|
| 10557 |
"in_benchmark": true,
|
| 10558 |
+
"task": "classification",
|
| 10559 |
+
"metric": "accuracy",
|
| 10560 |
+
"score": 0.43333333333333335,
|
| 10561 |
+
"model": 1.0
|
| 10562 |
+
},
|
| 10563 |
+
{
|
| 10564 |
+
"bcp_47": "ta",
|
| 10565 |
+
"speakers": 85616159,
|
| 10566 |
+
"language_name": "Tamil",
|
| 10567 |
+
"autonym": "தமிழ்",
|
| 10568 |
+
"family": "Dravidian",
|
| 10569 |
+
"flores_path": "tam_Taml",
|
| 10570 |
+
"fleurs_tag": "ta_in",
|
| 10571 |
+
"commonvoice_hours": 234.0,
|
| 10572 |
+
"commonvoice_locale": "ta",
|
| 10573 |
+
"in_benchmark": true,
|
| 10574 |
+
"task": "language_modeling",
|
| 10575 |
+
"metric": "chrf",
|
| 10576 |
+
"score": 0.9641464401452432,
|
| 10577 |
+
"model": 1.0
|
| 10578 |
+
},
|
| 10579 |
+
{
|
| 10580 |
+
"bcp_47": "ta",
|
| 10581 |
+
"speakers": 85616159,
|
| 10582 |
+
"language_name": "Tamil",
|
| 10583 |
+
"autonym": "தமிழ்",
|
| 10584 |
+
"family": "Dravidian",
|
| 10585 |
+
"flores_path": "tam_Taml",
|
| 10586 |
+
"fleurs_tag": "ta_in",
|
| 10587 |
+
"commonvoice_hours": 234.0,
|
| 10588 |
+
"commonvoice_locale": "ta",
|
| 10589 |
+
"in_benchmark": true,
|
| 10590 |
+
"task": "translation",
|
| 10591 |
+
"metric": "bleu",
|
| 10592 |
+
"score": 0.2528104486727614,
|
| 10593 |
+
"model": 1.0
|
| 10594 |
+
},
|
| 10595 |
+
{
|
| 10596 |
+
"bcp_47": "ta",
|
| 10597 |
+
"speakers": 85616159,
|
| 10598 |
+
"language_name": "Tamil",
|
| 10599 |
+
"autonym": "தமிழ்",
|
| 10600 |
+
"family": "Dravidian",
|
| 10601 |
+
"flores_path": "tam_Taml",
|
| 10602 |
+
"fleurs_tag": "ta_in",
|
| 10603 |
+
"commonvoice_hours": 234.0,
|
| 10604 |
+
"commonvoice_locale": "ta",
|
| 10605 |
+
"in_benchmark": true,
|
| 10606 |
+
"task": "translation",
|
| 10607 |
+
"metric": "chrf",
|
| 10608 |
+
"score": 0.42077045938882934,
|
| 10609 |
+
"model": 1.0
|
| 10610 |
},
|
| 10611 |
{
|
| 10612 |
"bcp_47": "taj",
|
|
|
|
| 10715 |
"commonvoice_hours": 0.3,
|
| 10716 |
"commonvoice_locale": "te",
|
| 10717 |
"in_benchmark": true,
|
| 10718 |
+
"task": "classification",
|
| 10719 |
+
"metric": "accuracy",
|
| 10720 |
+
"score": 0.36666666666666664,
|
| 10721 |
+
"model": 1.0
|
| 10722 |
+
},
|
| 10723 |
+
{
|
| 10724 |
+
"bcp_47": "te",
|
| 10725 |
+
"speakers": 95478480,
|
| 10726 |
+
"language_name": "Telugu",
|
| 10727 |
+
"autonym": "తెలుగు",
|
| 10728 |
+
"family": "Dravidian",
|
| 10729 |
+
"flores_path": "tel_Telu",
|
| 10730 |
+
"fleurs_tag": "te_in",
|
| 10731 |
+
"commonvoice_hours": 0.3,
|
| 10732 |
+
"commonvoice_locale": "te",
|
| 10733 |
+
"in_benchmark": true,
|
| 10734 |
+
"task": "language_modeling",
|
| 10735 |
+
"metric": "chrf",
|
| 10736 |
+
"score": 0.9513838296654142,
|
| 10737 |
+
"model": 1.0
|
| 10738 |
+
},
|
| 10739 |
+
{
|
| 10740 |
+
"bcp_47": "te",
|
| 10741 |
+
"speakers": 95478480,
|
| 10742 |
+
"language_name": "Telugu",
|
| 10743 |
+
"autonym": "తెలుగు",
|
| 10744 |
+
"family": "Dravidian",
|
| 10745 |
+
"flores_path": "tel_Telu",
|
| 10746 |
+
"fleurs_tag": "te_in",
|
| 10747 |
+
"commonvoice_hours": 0.3,
|
| 10748 |
+
"commonvoice_locale": "te",
|
| 10749 |
+
"in_benchmark": true,
|
| 10750 |
+
"task": "translation",
|
| 10751 |
+
"metric": "bleu",
|
| 10752 |
+
"score": 0.28338449781147135,
|
| 10753 |
+
"model": 1.0
|
| 10754 |
+
},
|
| 10755 |
+
{
|
| 10756 |
+
"bcp_47": "te",
|
| 10757 |
+
"speakers": 95478480,
|
| 10758 |
+
"language_name": "Telugu",
|
| 10759 |
+
"autonym": "తెలుగు",
|
| 10760 |
+
"family": "Dravidian",
|
| 10761 |
+
"flores_path": "tel_Telu",
|
| 10762 |
+
"fleurs_tag": "te_in",
|
| 10763 |
+
"commonvoice_hours": 0.3,
|
| 10764 |
+
"commonvoice_locale": "te",
|
| 10765 |
+
"in_benchmark": true,
|
| 10766 |
+
"task": "translation",
|
| 10767 |
+
"metric": "chrf",
|
| 10768 |
+
"score": 0.467003606031036,
|
| 10769 |
+
"model": 1.0
|
| 10770 |
},
|
| 10771 |
{
|
| 10772 |
"bcp_47": "tem",
|
|
|
|
| 11131 |
"commonvoice_hours": 128.0,
|
| 11132 |
"commonvoice_locale": "tr",
|
| 11133 |
"in_benchmark": true,
|
| 11134 |
+
"task": "classification",
|
| 11135 |
+
"metric": "accuracy",
|
| 11136 |
+
"score": 0.5333333333333333,
|
| 11137 |
+
"model": 1.0
|
| 11138 |
+
},
|
| 11139 |
+
{
|
| 11140 |
+
"bcp_47": "tr",
|
| 11141 |
+
"speakers": 80360704,
|
| 11142 |
+
"language_name": "Turkish",
|
| 11143 |
+
"autonym": "Türkçe",
|
| 11144 |
+
"family": "Turkic",
|
| 11145 |
+
"flores_path": "tur_Latn",
|
| 11146 |
+
"fleurs_tag": "tr_tr",
|
| 11147 |
+
"commonvoice_hours": 128.0,
|
| 11148 |
+
"commonvoice_locale": "tr",
|
| 11149 |
+
"in_benchmark": true,
|
| 11150 |
+
"task": "language_modeling",
|
| 11151 |
+
"metric": "chrf",
|
| 11152 |
+
"score": 0.9446670623712353,
|
| 11153 |
+
"model": 1.0
|
| 11154 |
+
},
|
| 11155 |
+
{
|
| 11156 |
+
"bcp_47": "tr",
|
| 11157 |
+
"speakers": 80360704,
|
| 11158 |
+
"language_name": "Turkish",
|
| 11159 |
+
"autonym": "Türkçe",
|
| 11160 |
+
"family": "Turkic",
|
| 11161 |
+
"flores_path": "tur_Latn",
|
| 11162 |
+
"fleurs_tag": "tr_tr",
|
| 11163 |
+
"commonvoice_hours": 128.0,
|
| 11164 |
+
"commonvoice_locale": "tr",
|
| 11165 |
+
"in_benchmark": true,
|
| 11166 |
+
"task": "translation",
|
| 11167 |
+
"metric": "bleu",
|
| 11168 |
+
"score": 0.2844596261435892,
|
| 11169 |
+
"model": 1.0
|
| 11170 |
+
},
|
| 11171 |
+
{
|
| 11172 |
+
"bcp_47": "tr",
|
| 11173 |
+
"speakers": 80360704,
|
| 11174 |
+
"language_name": "Turkish",
|
| 11175 |
+
"autonym": "Türkçe",
|
| 11176 |
+
"family": "Turkic",
|
| 11177 |
+
"flores_path": "tur_Latn",
|
| 11178 |
+
"fleurs_tag": "tr_tr",
|
| 11179 |
+
"commonvoice_hours": 128.0,
|
| 11180 |
+
"commonvoice_locale": "tr",
|
| 11181 |
+
"in_benchmark": true,
|
| 11182 |
+
"task": "translation",
|
| 11183 |
+
"metric": "chrf",
|
| 11184 |
+
"score": 0.4525478264239361,
|
| 11185 |
+
"model": 1.0
|
| 11186 |
},
|
| 11187 |
{
|
| 11188 |
"bcp_47": "tru",
|
|
|
|
| 11597 |
"in_benchmark": true,
|
| 11598 |
"task": "language_modeling",
|
| 11599 |
"metric": "chrf",
|
| 11600 |
+
"score": 0.9182703887696211,
|
| 11601 |
"model": 1.0
|
| 11602 |
},
|
| 11603 |
{
|
|
|
|
| 11613 |
"in_benchmark": true,
|
| 11614 |
"task": "translation",
|
| 11615 |
"metric": "bleu",
|
| 11616 |
+
"score": 0.2434522914619727,
|
| 11617 |
"model": 1.0
|
| 11618 |
},
|
| 11619 |
{
|
|
|
|
| 11723 |
"commonvoice_hours": 6.0,
|
| 11724 |
"commonvoice_locale": "vi",
|
| 11725 |
"in_benchmark": true,
|
| 11726 |
+
"task": "classification",
|
| 11727 |
+
"metric": "accuracy",
|
| 11728 |
+
"score": 0.6,
|
| 11729 |
+
"model": 1.0
|
| 11730 |
},
|
| 11731 |
{
|
| 11732 |
+
"bcp_47": "vi",
|
| 11733 |
+
"speakers": 86222962,
|
| 11734 |
+
"language_name": "Vietnamese",
|
| 11735 |
+
"autonym": "Tiếng Việt",
|
| 11736 |
+
"family": "Austroasiatic",
|
| 11737 |
+
"flores_path": "vie_Latn",
|
| 11738 |
+
"fleurs_tag": "vi_vn",
|
| 11739 |
+
"commonvoice_hours": 6.0,
|
| 11740 |
+
"commonvoice_locale": "vi",
|
| 11741 |
+
"in_benchmark": true,
|
| 11742 |
+
"task": "language_modeling",
|
| 11743 |
+
"metric": "chrf",
|
| 11744 |
+
"score": 0.9580044761495575,
|
| 11745 |
+
"model": 1.0
|
| 11746 |
},
|
| 11747 |
{
|
| 11748 |
+
"bcp_47": "vi",
|
| 11749 |
+
"speakers": 86222962,
|
| 11750 |
+
"language_name": "Vietnamese",
|
| 11751 |
+
"autonym": "Tiếng Việt",
|
| 11752 |
+
"family": "Austroasiatic",
|
| 11753 |
+
"flores_path": "vie_Latn",
|
| 11754 |
+
"fleurs_tag": "vi_vn",
|
| 11755 |
+
"commonvoice_hours": 6.0,
|
| 11756 |
+
"commonvoice_locale": "vi",
|
| 11757 |
+
"in_benchmark": true,
|
| 11758 |
+
"task": "translation",
|
| 11759 |
+
"metric": "bleu",
|
| 11760 |
+
"score": 0.25541664062319624,
|
| 11761 |
+
"model": 1.0
|
| 11762 |
+
},
|
| 11763 |
+
{
|
| 11764 |
+
"bcp_47": "vi",
|
| 11765 |
+
"speakers": 86222962,
|
| 11766 |
+
"language_name": "Vietnamese",
|
| 11767 |
+
"autonym": "Tiếng Việt",
|
| 11768 |
+
"family": "Austroasiatic",
|
| 11769 |
+
"flores_path": "vie_Latn",
|
| 11770 |
+
"fleurs_tag": "vi_vn",
|
| 11771 |
+
"commonvoice_hours": 6.0,
|
| 11772 |
+
"commonvoice_locale": "vi",
|
| 11773 |
+
"in_benchmark": true,
|
| 11774 |
+
"task": "translation",
|
| 11775 |
+
"metric": "chrf",
|
| 11776 |
+
"score": 0.43688984396841446,
|
| 11777 |
+
"model": 1.0
|
| 11778 |
+
},
|
| 11779 |
+
{
|
| 11780 |
+
"bcp_47": "vic",
|
| 11781 |
+
"speakers": 3113,
|
| 11782 |
+
"language_name": "Virgin Islands Creole English",
|
| 11783 |
+
"autonym": "Virgin Islands Creole English",
|
| 11784 |
+
"family": "Indo-European",
|
| 11785 |
+
"flores_path": null,
|
| 11786 |
+
"fleurs_tag": null,
|
| 11787 |
+
"commonvoice_hours": null,
|
| 11788 |
+
"commonvoice_locale": null,
|
| 11789 |
+
"in_benchmark": false,
|
| 11790 |
+
"task": null,
|
| 11791 |
+
"metric": null,
|
| 11792 |
+
"score": null,
|
| 11793 |
+
"model": null
|
| 11794 |
+
},
|
| 11795 |
+
{
|
| 11796 |
+
"bcp_47": "vls",
|
| 11797 |
+
"speakers": 1172070,
|
| 11798 |
+
"language_name": "West Flemish",
|
| 11799 |
+
"autonym": "West Flemish",
|
| 11800 |
+
"family": "Indo-European",
|
| 11801 |
+
"flores_path": null,
|
| 11802 |
+
"fleurs_tag": null,
|
| 11803 |
+
"commonvoice_hours": null,
|
| 11804 |
+
"commonvoice_locale": null,
|
| 11805 |
+
"in_benchmark": false,
|
| 11806 |
+
"task": null,
|
| 11807 |
+
"metric": null,
|
| 11808 |
+
"score": null,
|
| 11809 |
+
"model": null
|
| 11810 |
},
|
| 11811 |
{
|
| 11812 |
"bcp_47": "vmf",
|
|
|
|
| 12315 |
"commonvoice_hours": 203.0,
|
| 12316 |
"commonvoice_locale": "yue",
|
| 12317 |
"in_benchmark": true,
|
| 12318 |
+
"task": "classification",
|
| 12319 |
+
"metric": "accuracy",
|
| 12320 |
+
"score": 0.43333333333333335,
|
| 12321 |
+
"model": 1.0
|
| 12322 |
+
},
|
| 12323 |
+
{
|
| 12324 |
+
"bcp_47": "yue",
|
| 12325 |
+
"speakers": 79654759,
|
| 12326 |
+
"language_name": "Cantonese",
|
| 12327 |
+
"autonym": "粵語",
|
| 12328 |
+
"family": "Sino-Tibetan",
|
| 12329 |
+
"flores_path": "yue_Hant",
|
| 12330 |
+
"fleurs_tag": "yue_hant_hk",
|
| 12331 |
+
"commonvoice_hours": 203.0,
|
| 12332 |
+
"commonvoice_locale": "yue",
|
| 12333 |
+
"in_benchmark": true,
|
| 12334 |
+
"task": "language_modeling",
|
| 12335 |
+
"metric": "chrf",
|
| 12336 |
+
"score": 0.9022415223117748,
|
| 12337 |
+
"model": 1.0
|
| 12338 |
+
},
|
| 12339 |
+
{
|
| 12340 |
+
"bcp_47": "yue",
|
| 12341 |
+
"speakers": 79654759,
|
| 12342 |
+
"language_name": "Cantonese",
|
| 12343 |
+
"autonym": "粵語",
|
| 12344 |
+
"family": "Sino-Tibetan",
|
| 12345 |
+
"flores_path": "yue_Hant",
|
| 12346 |
+
"fleurs_tag": "yue_hant_hk",
|
| 12347 |
+
"commonvoice_hours": 203.0,
|
| 12348 |
+
"commonvoice_locale": "yue",
|
| 12349 |
+
"in_benchmark": true,
|
| 12350 |
+
"task": "translation",
|
| 12351 |
+
"metric": "bleu",
|
| 12352 |
+
"score": 0.22628178945118504,
|
| 12353 |
+
"model": 1.0
|
| 12354 |
+
},
|
| 12355 |
+
{
|
| 12356 |
+
"bcp_47": "yue",
|
| 12357 |
+
"speakers": 79654759,
|
| 12358 |
+
"language_name": "Cantonese",
|
| 12359 |
+
"autonym": "粵語",
|
| 12360 |
+
"family": "Sino-Tibetan",
|
| 12361 |
+
"flores_path": "yue_Hant",
|
| 12362 |
+
"fleurs_tag": "yue_hant_hk",
|
| 12363 |
+
"commonvoice_hours": 203.0,
|
| 12364 |
+
"commonvoice_locale": "yue",
|
| 12365 |
+
"in_benchmark": true,
|
| 12366 |
+
"task": "translation",
|
| 12367 |
+
"metric": "chrf",
|
| 12368 |
+
"score": 0.4052050858435178,
|
| 12369 |
+
"model": 1.0
|
| 12370 |
},
|
| 12371 |
{
|
| 12372 |
"bcp_47": "za",
|
|
|
|
| 12477 |
"in_benchmark": true,
|
| 12478 |
"task": "language_modeling",
|
| 12479 |
"metric": "chrf",
|
| 12480 |
+
"score": 0.862116462347859,
|
| 12481 |
"model": 12.0
|
| 12482 |
},
|
| 12483 |
{
|
|
|
|
| 12575 |
"bcp_47": "en",
|
| 12576 |
"task": "language_modeling",
|
| 12577 |
"metric": "chrf",
|
| 12578 |
+
"score": 0.9596433057062642,
|
| 12579 |
"sentence_nr": 14.5
|
| 12580 |
},
|
| 12581 |
{
|
|
|
|
| 12607 |
"bcp_47": "zh",
|
| 12608 |
"task": "language_modeling",
|
| 12609 |
"metric": "chrf",
|
| 12610 |
+
"score": 0.9120424742302929,
|
| 12611 |
"sentence_nr": 14.5
|
| 12612 |
},
|
| 12613 |
{
|
|
|
|
| 12639 |
"bcp_47": "en",
|
| 12640 |
"task": "language_modeling",
|
| 12641 |
"metric": "chrf",
|
| 12642 |
+
"score": 0.9854618933889567,
|
| 12643 |
"sentence_nr": 14.5
|
| 12644 |
},
|
| 12645 |
{
|
|
|
|
| 12671 |
"bcp_47": "zh",
|
| 12672 |
"task": "language_modeling",
|
| 12673 |
"metric": "chrf",
|
| 12674 |
+
"score": 0.93160311345022,
|
| 12675 |
"sentence_nr": 14.5
|
| 12676 |
},
|
| 12677 |
{
|
|
|
|
| 12703 |
"bcp_47": "en",
|
| 12704 |
"task": "language_modeling",
|
| 12705 |
"metric": "chrf",
|
| 12706 |
+
"score": 0.9840731165453181,
|
| 12707 |
"sentence_nr": 14.5
|
| 12708 |
},
|
| 12709 |
{
|
|
|
|
| 12735 |
"bcp_47": "zh",
|
| 12736 |
"task": "language_modeling",
|
| 12737 |
"metric": "chrf",
|
| 12738 |
+
"score": 0.9308727688438002,
|
| 12739 |
"sentence_nr": 14.5
|
| 12740 |
},
|
| 12741 |
{
|
|
|
|
| 12767 |
"bcp_47": "en",
|
| 12768 |
"task": "language_modeling",
|
| 12769 |
"metric": "chrf",
|
| 12770 |
+
"score": 0.9705999747171945,
|
| 12771 |
"sentence_nr": 14.5
|
| 12772 |
},
|
| 12773 |
{
|
|
|
|
| 12799 |
"bcp_47": "zh",
|
| 12800 |
"task": "language_modeling",
|
| 12801 |
"metric": "chrf",
|
| 12802 |
+
"score": 0.9098214011017126,
|
| 12803 |
"sentence_nr": 14.5
|
| 12804 |
},
|
| 12805 |
{
|
|
|
|
| 12831 |
"bcp_47": "en",
|
| 12832 |
"task": "language_modeling",
|
| 12833 |
"metric": "chrf",
|
| 12834 |
+
"score": 0.9802918604410554,
|
| 12835 |
"sentence_nr": 14.5
|
| 12836 |
},
|
| 12837 |
{
|
|
|
|
| 12863 |
"bcp_47": "zh",
|
| 12864 |
"task": "language_modeling",
|
| 12865 |
"metric": "chrf",
|
| 12866 |
+
"score": 0.9309062045243536,
|
| 12867 |
"sentence_nr": 14.5
|
| 12868 |
},
|
| 12869 |
{
|
|
|
|
| 12895 |
"bcp_47": "en",
|
| 12896 |
"task": "language_modeling",
|
| 12897 |
"metric": "chrf",
|
| 12898 |
+
"score": 0.9683113542489836,
|
| 12899 |
"sentence_nr": 14.5
|
| 12900 |
},
|
| 12901 |
{
|
|
|
|
| 12903 |
"bcp_47": "en",
|
| 12904 |
"task": "translation",
|
| 12905 |
"metric": "bleu",
|
| 12906 |
+
"score": 0.444507882217401,
|
| 12907 |
"sentence_nr": 14.5
|
| 12908 |
},
|
| 12909 |
{
|
|
|
|
| 12927 |
"bcp_47": "zh",
|
| 12928 |
"task": "language_modeling",
|
| 12929 |
"metric": "chrf",
|
| 12930 |
+
"score": 0.9233418215760759,
|
| 12931 |
"sentence_nr": 14.5
|
| 12932 |
},
|
| 12933 |
{
|
|
|
|
| 12959 |
"bcp_47": "ar",
|
| 12960 |
"task": "language_modeling",
|
| 12961 |
"metric": "chrf",
|
| 12962 |
+
"score": 0.9392314289764625,
|
| 12963 |
"sentence_nr": 14.5
|
| 12964 |
},
|
| 12965 |
{
|
|
|
|
| 12978 |
"score": 0.4684314458952127,
|
| 12979 |
"sentence_nr": 14.5
|
| 12980 |
},
|
| 12981 |
+
{
|
| 12982 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12983 |
+
"bcp_47": "arz",
|
| 12984 |
+
"task": "classification",
|
| 12985 |
+
"metric": "accuracy",
|
| 12986 |
+
"score": 0.4,
|
| 12987 |
+
"sentence_nr": 14.5
|
| 12988 |
+
},
|
| 12989 |
+
{
|
| 12990 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12991 |
+
"bcp_47": "arz",
|
| 12992 |
+
"task": "language_modeling",
|
| 12993 |
+
"metric": "chrf",
|
| 12994 |
+
"score": 0.930329195667362,
|
| 12995 |
+
"sentence_nr": 14.5
|
| 12996 |
+
},
|
| 12997 |
+
{
|
| 12998 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 12999 |
+
"bcp_47": "arz",
|
| 13000 |
+
"task": "translation",
|
| 13001 |
+
"metric": "bleu",
|
| 13002 |
+
"score": 0.19793415292805128,
|
| 13003 |
+
"sentence_nr": 14.5
|
| 13004 |
+
},
|
| 13005 |
+
{
|
| 13006 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13007 |
+
"bcp_47": "arz",
|
| 13008 |
+
"task": "translation",
|
| 13009 |
+
"metric": "chrf",
|
| 13010 |
+
"score": 0.3881278724939126,
|
| 13011 |
+
"sentence_nr": 14.5
|
| 13012 |
+
},
|
| 13013 |
{
|
| 13014 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13015 |
"bcp_47": "bn",
|
|
|
|
| 13023 |
"bcp_47": "bn",
|
| 13024 |
"task": "language_modeling",
|
| 13025 |
"metric": "chrf",
|
| 13026 |
+
"score": 0.9097658392566466,
|
| 13027 |
"sentence_nr": 14.5
|
| 13028 |
},
|
| 13029 |
{
|
|
|
|
| 13042 |
"score": 0.4076175886917154,
|
| 13043 |
"sentence_nr": 14.5
|
| 13044 |
},
|
| 13045 |
+
{
|
| 13046 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13047 |
+
"bcp_47": "de",
|
| 13048 |
+
"task": "classification",
|
| 13049 |
+
"metric": "accuracy",
|
| 13050 |
+
"score": 0.6666666666666666,
|
| 13051 |
+
"sentence_nr": 14.5
|
| 13052 |
+
},
|
| 13053 |
+
{
|
| 13054 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13055 |
+
"bcp_47": "de",
|
| 13056 |
+
"task": "language_modeling",
|
| 13057 |
+
"metric": "chrf",
|
| 13058 |
+
"score": 0.9594656177914042,
|
| 13059 |
+
"sentence_nr": 14.5
|
| 13060 |
+
},
|
| 13061 |
+
{
|
| 13062 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13063 |
+
"bcp_47": "de",
|
| 13064 |
+
"task": "translation",
|
| 13065 |
+
"metric": "bleu",
|
| 13066 |
+
"score": 0.3207642359472324,
|
| 13067 |
+
"sentence_nr": 14.5
|
| 13068 |
+
},
|
| 13069 |
+
{
|
| 13070 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13071 |
+
"bcp_47": "de",
|
| 13072 |
+
"task": "translation",
|
| 13073 |
+
"metric": "chrf",
|
| 13074 |
+
"score": 0.49973270743869647,
|
| 13075 |
+
"sentence_nr": 14.5
|
| 13076 |
+
},
|
| 13077 |
{
|
| 13078 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13079 |
"bcp_47": "en",
|
|
|
|
| 13087 |
"bcp_47": "en",
|
| 13088 |
"task": "language_modeling",
|
| 13089 |
"metric": "chrf",
|
| 13090 |
+
"score": 0.9810108607325073,
|
| 13091 |
"sentence_nr": 14.5
|
| 13092 |
},
|
| 13093 |
{
|
|
|
|
| 13119 |
"bcp_47": "es",
|
| 13120 |
"task": "language_modeling",
|
| 13121 |
"metric": "chrf",
|
| 13122 |
+
"score": 0.9569342865902168,
|
| 13123 |
"sentence_nr": 14.5
|
| 13124 |
},
|
| 13125 |
{
|
|
|
|
| 13140 |
},
|
| 13141 |
{
|
| 13142 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13143 |
+
"bcp_47": "fa",
|
| 13144 |
"task": "classification",
|
| 13145 |
"metric": "accuracy",
|
| 13146 |
+
"score": 0.4,
|
| 13147 |
"sentence_nr": 14.5
|
| 13148 |
},
|
| 13149 |
{
|
| 13150 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13151 |
+
"bcp_47": "fa",
|
| 13152 |
"task": "language_modeling",
|
| 13153 |
"metric": "chrf",
|
| 13154 |
+
"score": 0.9414698824984596,
|
| 13155 |
"sentence_nr": 14.5
|
| 13156 |
},
|
| 13157 |
{
|
| 13158 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13159 |
+
"bcp_47": "fa",
|
| 13160 |
"task": "translation",
|
| 13161 |
"metric": "bleu",
|
| 13162 |
+
"score": 0.26232478733341374,
|
| 13163 |
"sentence_nr": 14.5
|
| 13164 |
},
|
| 13165 |
{
|
| 13166 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13167 |
+
"bcp_47": "fa",
|
| 13168 |
"task": "translation",
|
| 13169 |
"metric": "chrf",
|
| 13170 |
+
"score": 0.44641220608314985,
|
| 13171 |
"sentence_nr": 14.5
|
| 13172 |
},
|
| 13173 |
{
|
| 13174 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13175 |
+
"bcp_47": "fil",
|
| 13176 |
"task": "classification",
|
| 13177 |
"metric": "accuracy",
|
| 13178 |
+
"score": 0.43333333333333335,
|
| 13179 |
"sentence_nr": 14.5
|
| 13180 |
},
|
| 13181 |
{
|
| 13182 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13183 |
+
"bcp_47": "fil",
|
| 13184 |
"task": "language_modeling",
|
| 13185 |
"metric": "chrf",
|
| 13186 |
+
"score": 0.9402707475255596,
|
| 13187 |
"sentence_nr": 14.5
|
| 13188 |
},
|
| 13189 |
{
|
| 13190 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13191 |
+
"bcp_47": "fil",
|
| 13192 |
"task": "translation",
|
| 13193 |
"metric": "bleu",
|
| 13194 |
+
"score": 0.29097818784870333,
|
| 13195 |
"sentence_nr": 14.5
|
| 13196 |
},
|
| 13197 |
{
|
| 13198 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13199 |
+
"bcp_47": "fil",
|
| 13200 |
"task": "translation",
|
| 13201 |
"metric": "chrf",
|
| 13202 |
+
"score": 0.44978114149245985,
|
| 13203 |
"sentence_nr": 14.5
|
| 13204 |
},
|
| 13205 |
{
|
| 13206 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13207 |
+
"bcp_47": "fr",
|
| 13208 |
"task": "classification",
|
| 13209 |
"metric": "accuracy",
|
| 13210 |
+
"score": 0.5333333333333333,
|
| 13211 |
"sentence_nr": 14.5
|
| 13212 |
},
|
| 13213 |
{
|
| 13214 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13215 |
+
"bcp_47": "fr",
|
| 13216 |
"task": "language_modeling",
|
| 13217 |
"metric": "chrf",
|
| 13218 |
+
"score": 0.9815706066541411,
|
| 13219 |
"sentence_nr": 14.5
|
| 13220 |
},
|
| 13221 |
{
|
| 13222 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13223 |
+
"bcp_47": "fr",
|
| 13224 |
"task": "translation",
|
| 13225 |
"metric": "bleu",
|
| 13226 |
+
"score": 0.3193235920661593,
|
| 13227 |
"sentence_nr": 14.5
|
| 13228 |
},
|
| 13229 |
{
|
| 13230 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13231 |
+
"bcp_47": "fr",
|
| 13232 |
"task": "translation",
|
| 13233 |
"metric": "chrf",
|
| 13234 |
+
"score": 0.4875691290722964,
|
| 13235 |
"sentence_nr": 14.5
|
| 13236 |
},
|
| 13237 |
{
|
| 13238 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13239 |
+
"bcp_47": "gu",
|
| 13240 |
"task": "classification",
|
| 13241 |
"metric": "accuracy",
|
| 13242 |
+
"score": 0.43333333333333335,
|
| 13243 |
"sentence_nr": 14.5
|
| 13244 |
},
|
| 13245 |
{
|
| 13246 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13247 |
+
"bcp_47": "gu",
|
| 13248 |
"task": "language_modeling",
|
| 13249 |
"metric": "chrf",
|
| 13250 |
+
"score": 0.938086045460355,
|
| 13251 |
"sentence_nr": 14.5
|
| 13252 |
},
|
| 13253 |
{
|
| 13254 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13255 |
+
"bcp_47": "gu",
|
| 13256 |
"task": "translation",
|
| 13257 |
"metric": "bleu",
|
| 13258 |
+
"score": 0.26442484966880464,
|
| 13259 |
"sentence_nr": 14.5
|
| 13260 |
},
|
| 13261 |
{
|
| 13262 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13263 |
+
"bcp_47": "gu",
|
| 13264 |
"task": "translation",
|
| 13265 |
"metric": "chrf",
|
| 13266 |
+
"score": 0.44452182973195975,
|
| 13267 |
"sentence_nr": 14.5
|
| 13268 |
},
|
| 13269 |
{
|
| 13270 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13271 |
+
"bcp_47": "hi",
|
| 13272 |
"task": "classification",
|
| 13273 |
"metric": "accuracy",
|
| 13274 |
+
"score": 0.5333333333333333,
|
| 13275 |
"sentence_nr": 14.5
|
| 13276 |
},
|
| 13277 |
{
|
| 13278 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13279 |
+
"bcp_47": "hi",
|
| 13280 |
"task": "language_modeling",
|
| 13281 |
"metric": "chrf",
|
| 13282 |
+
"score": 0.9428185393832219,
|
| 13283 |
"sentence_nr": 14.5
|
| 13284 |
},
|
| 13285 |
{
|
| 13286 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13287 |
+
"bcp_47": "hi",
|
| 13288 |
"task": "translation",
|
| 13289 |
"metric": "bleu",
|
| 13290 |
+
"score": 0.31956422674397006,
|
| 13291 |
"sentence_nr": 14.5
|
| 13292 |
},
|
| 13293 |
{
|
| 13294 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13295 |
+
"bcp_47": "hi",
|
| 13296 |
"task": "translation",
|
| 13297 |
"metric": "chrf",
|
| 13298 |
+
"score": 0.4896277852320754,
|
| 13299 |
+
"sentence_nr": 14.5
|
| 13300 |
+
},
|
| 13301 |
+
{
|
| 13302 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13303 |
+
"bcp_47": "id",
|
| 13304 |
+
"task": "classification",
|
| 13305 |
+
"metric": "accuracy",
|
| 13306 |
+
"score": 0.6333333333333333,
|
| 13307 |
+
"sentence_nr": 14.5
|
| 13308 |
+
},
|
| 13309 |
+
{
|
| 13310 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13311 |
+
"bcp_47": "id",
|
| 13312 |
+
"task": "language_modeling",
|
| 13313 |
+
"metric": "chrf",
|
| 13314 |
+
"score": 0.9598314474300775,
|
| 13315 |
+
"sentence_nr": 14.5
|
| 13316 |
+
},
|
| 13317 |
+
{
|
| 13318 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13319 |
+
"bcp_47": "id",
|
| 13320 |
+
"task": "translation",
|
| 13321 |
+
"metric": "bleu",
|
| 13322 |
+
"score": 0.29354203311552335,
|
| 13323 |
+
"sentence_nr": 14.5
|
| 13324 |
+
},
|
| 13325 |
+
{
|
| 13326 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13327 |
+
"bcp_47": "id",
|
| 13328 |
+
"task": "translation",
|
| 13329 |
+
"metric": "chrf",
|
| 13330 |
+
"score": 0.4723493656022861,
|
| 13331 |
+
"sentence_nr": 14.5
|
| 13332 |
+
},
|
| 13333 |
+
{
|
| 13334 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13335 |
+
"bcp_47": "it",
|
| 13336 |
+
"task": "classification",
|
| 13337 |
+
"metric": "accuracy",
|
| 13338 |
+
"score": 0.6666666666666666,
|
| 13339 |
+
"sentence_nr": 14.5
|
| 13340 |
+
},
|
| 13341 |
+
{
|
| 13342 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13343 |
+
"bcp_47": "it",
|
| 13344 |
+
"task": "language_modeling",
|
| 13345 |
+
"metric": "chrf",
|
| 13346 |
+
"score": 0.9439490413212892,
|
| 13347 |
+
"sentence_nr": 14.5
|
| 13348 |
+
},
|
| 13349 |
+
{
|
| 13350 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13351 |
+
"bcp_47": "it",
|
| 13352 |
+
"task": "translation",
|
| 13353 |
+
"metric": "bleu",
|
| 13354 |
+
"score": 0.28142583904826096,
|
| 13355 |
+
"sentence_nr": 14.5
|
| 13356 |
+
},
|
| 13357 |
+
{
|
| 13358 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13359 |
+
"bcp_47": "it",
|
| 13360 |
+
"task": "translation",
|
| 13361 |
+
"metric": "chrf",
|
| 13362 |
+
"score": 0.4707591889357925,
|
| 13363 |
+
"sentence_nr": 14.5
|
| 13364 |
+
},
|
| 13365 |
+
{
|
| 13366 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13367 |
+
"bcp_47": "ja",
|
| 13368 |
+
"task": "classification",
|
| 13369 |
+
"metric": "accuracy",
|
| 13370 |
+
"score": 0.6333333333333333,
|
| 13371 |
+
"sentence_nr": 14.5
|
| 13372 |
+
},
|
| 13373 |
+
{
|
| 13374 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13375 |
+
"bcp_47": "ja",
|
| 13376 |
+
"task": "language_modeling",
|
| 13377 |
+
"metric": "chrf",
|
| 13378 |
+
"score": 0.9371132855221468,
|
| 13379 |
+
"sentence_nr": 14.5
|
| 13380 |
+
},
|
| 13381 |
+
{
|
| 13382 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13383 |
+
"bcp_47": "ja",
|
| 13384 |
+
"task": "translation",
|
| 13385 |
+
"metric": "bleu",
|
| 13386 |
+
"score": 0.2723410893967824,
|
| 13387 |
+
"sentence_nr": 14.5
|
| 13388 |
+
},
|
| 13389 |
+
{
|
| 13390 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13391 |
+
"bcp_47": "ja",
|
| 13392 |
+
"task": "translation",
|
| 13393 |
+
"metric": "chrf",
|
| 13394 |
+
"score": 0.43929453749366865,
|
| 13395 |
+
"sentence_nr": 14.5
|
| 13396 |
+
},
|
| 13397 |
+
{
|
| 13398 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13399 |
+
"bcp_47": "jv",
|
| 13400 |
+
"task": "classification",
|
| 13401 |
+
"metric": "accuracy",
|
| 13402 |
+
"score": 0.4666666666666667,
|
| 13403 |
+
"sentence_nr": 14.5
|
| 13404 |
+
},
|
| 13405 |
+
{
|
| 13406 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13407 |
+
"bcp_47": "jv",
|
| 13408 |
+
"task": "language_modeling",
|
| 13409 |
+
"metric": "chrf",
|
| 13410 |
+
"score": 0.9298143194922116,
|
| 13411 |
+
"sentence_nr": 14.5
|
| 13412 |
+
},
|
| 13413 |
+
{
|
| 13414 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13415 |
+
"bcp_47": "jv",
|
| 13416 |
+
"task": "translation",
|
| 13417 |
+
"metric": "bleu",
|
| 13418 |
+
"score": 0.23729186537968905,
|
| 13419 |
+
"sentence_nr": 14.5
|
| 13420 |
+
},
|
| 13421 |
+
{
|
| 13422 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13423 |
+
"bcp_47": "jv",
|
| 13424 |
+
"task": "translation",
|
| 13425 |
+
"metric": "chrf",
|
| 13426 |
+
"score": 0.4198940727847352,
|
| 13427 |
+
"sentence_nr": 14.5
|
| 13428 |
+
},
|
| 13429 |
+
{
|
| 13430 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13431 |
+
"bcp_47": "ko",
|
| 13432 |
+
"task": "classification",
|
| 13433 |
+
"metric": "accuracy",
|
| 13434 |
+
"score": 0.5333333333333333,
|
| 13435 |
+
"sentence_nr": 14.5
|
| 13436 |
+
},
|
| 13437 |
+
{
|
| 13438 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13439 |
+
"bcp_47": "ko",
|
| 13440 |
+
"task": "language_modeling",
|
| 13441 |
+
"metric": "chrf",
|
| 13442 |
+
"score": 0.9355445912073929,
|
| 13443 |
+
"sentence_nr": 14.5
|
| 13444 |
+
},
|
| 13445 |
+
{
|
| 13446 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13447 |
+
"bcp_47": "ko",
|
| 13448 |
+
"task": "translation",
|
| 13449 |
+
"metric": "bleu",
|
| 13450 |
+
"score": 0.20332074778330964,
|
| 13451 |
+
"sentence_nr": 14.5
|
| 13452 |
+
},
|
| 13453 |
+
{
|
| 13454 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13455 |
+
"bcp_47": "ko",
|
| 13456 |
+
"task": "translation",
|
| 13457 |
+
"metric": "chrf",
|
| 13458 |
+
"score": 0.4005255477730261,
|
| 13459 |
+
"sentence_nr": 14.5
|
| 13460 |
+
},
|
| 13461 |
+
{
|
| 13462 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13463 |
+
"bcp_47": "mr",
|
| 13464 |
+
"task": "classification",
|
| 13465 |
+
"metric": "accuracy",
|
| 13466 |
+
"score": 0.6333333333333333,
|
| 13467 |
+
"sentence_nr": 14.5
|
| 13468 |
+
},
|
| 13469 |
+
{
|
| 13470 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13471 |
+
"bcp_47": "mr",
|
| 13472 |
+
"task": "language_modeling",
|
| 13473 |
+
"metric": "chrf",
|
| 13474 |
+
"score": 0.9440892312053646,
|
| 13475 |
+
"sentence_nr": 14.5
|
| 13476 |
+
},
|
| 13477 |
+
{
|
| 13478 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13479 |
+
"bcp_47": "mr",
|
| 13480 |
+
"task": "translation",
|
| 13481 |
+
"metric": "bleu",
|
| 13482 |
+
"score": 0.24903049799655144,
|
| 13483 |
+
"sentence_nr": 14.5
|
| 13484 |
+
},
|
| 13485 |
+
{
|
| 13486 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13487 |
+
"bcp_47": "mr",
|
| 13488 |
+
"task": "translation",
|
| 13489 |
+
"metric": "chrf",
|
| 13490 |
+
"score": 0.42489125861884175,
|
| 13491 |
+
"sentence_nr": 14.5
|
| 13492 |
+
},
|
| 13493 |
+
{
|
| 13494 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13495 |
+
"bcp_47": "pa",
|
| 13496 |
+
"task": "classification",
|
| 13497 |
+
"metric": "accuracy",
|
| 13498 |
+
"score": 0.4,
|
| 13499 |
+
"sentence_nr": 14.5
|
| 13500 |
+
},
|
| 13501 |
+
{
|
| 13502 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13503 |
+
"bcp_47": "pa",
|
| 13504 |
+
"task": "language_modeling",
|
| 13505 |
+
"metric": "chrf",
|
| 13506 |
+
"score": 0.9025298113664532,
|
| 13507 |
+
"sentence_nr": 14.5
|
| 13508 |
+
},
|
| 13509 |
+
{
|
| 13510 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13511 |
+
"bcp_47": "pa",
|
| 13512 |
+
"task": "translation",
|
| 13513 |
+
"metric": "bleu",
|
| 13514 |
+
"score": 0.3368333727390049,
|
| 13515 |
+
"sentence_nr": 14.5
|
| 13516 |
+
},
|
| 13517 |
+
{
|
| 13518 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13519 |
+
"bcp_47": "pa",
|
| 13520 |
+
"task": "translation",
|
| 13521 |
+
"metric": "chrf",
|
| 13522 |
+
"score": 0.4873541452250132,
|
| 13523 |
+
"sentence_nr": 14.5
|
| 13524 |
+
},
|
| 13525 |
+
{
|
| 13526 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13527 |
+
"bcp_47": "pt",
|
| 13528 |
+
"task": "classification",
|
| 13529 |
+
"metric": "accuracy",
|
| 13530 |
+
"score": 0.5,
|
| 13531 |
+
"sentence_nr": 14.5
|
| 13532 |
+
},
|
| 13533 |
+
{
|
| 13534 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13535 |
+
"bcp_47": "pt",
|
| 13536 |
+
"task": "language_modeling",
|
| 13537 |
+
"metric": "chrf",
|
| 13538 |
+
"score": 0.9641423549595803,
|
| 13539 |
+
"sentence_nr": 14.5
|
| 13540 |
+
},
|
| 13541 |
+
{
|
| 13542 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13543 |
+
"bcp_47": "pt",
|
| 13544 |
+
"task": "translation",
|
| 13545 |
+
"metric": "bleu",
|
| 13546 |
+
"score": 0.3110105331834714,
|
| 13547 |
+
"sentence_nr": 14.5
|
| 13548 |
+
},
|
| 13549 |
+
{
|
| 13550 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13551 |
+
"bcp_47": "pt",
|
| 13552 |
+
"task": "translation",
|
| 13553 |
+
"metric": "chrf",
|
| 13554 |
+
"score": 0.49172080600981716,
|
| 13555 |
+
"sentence_nr": 14.5
|
| 13556 |
+
},
|
| 13557 |
+
{
|
| 13558 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13559 |
+
"bcp_47": "ru",
|
| 13560 |
+
"task": "classification",
|
| 13561 |
+
"metric": "accuracy",
|
| 13562 |
+
"score": 0.5666666666666667,
|
| 13563 |
+
"sentence_nr": 14.5
|
| 13564 |
+
},
|
| 13565 |
+
{
|
| 13566 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13567 |
+
"bcp_47": "ru",
|
| 13568 |
+
"task": "language_modeling",
|
| 13569 |
+
"metric": "chrf",
|
| 13570 |
+
"score": 0.9663696817874857,
|
| 13571 |
+
"sentence_nr": 14.5
|
| 13572 |
+
},
|
| 13573 |
+
{
|
| 13574 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13575 |
+
"bcp_47": "ru",
|
| 13576 |
+
"task": "translation",
|
| 13577 |
+
"metric": "bleu",
|
| 13578 |
+
"score": 0.26015179309825326,
|
| 13579 |
+
"sentence_nr": 14.5
|
| 13580 |
+
},
|
| 13581 |
+
{
|
| 13582 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13583 |
+
"bcp_47": "ru",
|
| 13584 |
+
"task": "translation",
|
| 13585 |
+
"metric": "chrf",
|
| 13586 |
+
"score": 0.4525762744858351,
|
| 13587 |
+
"sentence_nr": 14.5
|
| 13588 |
+
},
|
| 13589 |
+
{
|
| 13590 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13591 |
+
"bcp_47": "sw",
|
| 13592 |
+
"task": "classification",
|
| 13593 |
+
"metric": "accuracy",
|
| 13594 |
+
"score": 0.5666666666666667,
|
| 13595 |
+
"sentence_nr": 14.5
|
| 13596 |
+
},
|
| 13597 |
+
{
|
| 13598 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13599 |
+
"bcp_47": "sw",
|
| 13600 |
+
"task": "language_modeling",
|
| 13601 |
+
"metric": "chrf",
|
| 13602 |
+
"score": 0.9401745263817055,
|
| 13603 |
+
"sentence_nr": 14.5
|
| 13604 |
+
},
|
| 13605 |
+
{
|
| 13606 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13607 |
+
"bcp_47": "sw",
|
| 13608 |
+
"task": "translation",
|
| 13609 |
+
"metric": "bleu",
|
| 13610 |
+
"score": 0.30022614000139736,
|
| 13611 |
+
"sentence_nr": 14.5
|
| 13612 |
+
},
|
| 13613 |
+
{
|
| 13614 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13615 |
+
"bcp_47": "sw",
|
| 13616 |
+
"task": "translation",
|
| 13617 |
+
"metric": "chrf",
|
| 13618 |
+
"score": 0.46620999112028233,
|
| 13619 |
+
"sentence_nr": 14.5
|
| 13620 |
+
},
|
| 13621 |
+
{
|
| 13622 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13623 |
+
"bcp_47": "ta",
|
| 13624 |
+
"task": "classification",
|
| 13625 |
+
"metric": "accuracy",
|
| 13626 |
+
"score": 0.43333333333333335,
|
| 13627 |
+
"sentence_nr": 14.5
|
| 13628 |
+
},
|
| 13629 |
+
{
|
| 13630 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13631 |
+
"bcp_47": "ta",
|
| 13632 |
+
"task": "language_modeling",
|
| 13633 |
+
"metric": "chrf",
|
| 13634 |
+
"score": 0.9641464401452432,
|
| 13635 |
+
"sentence_nr": 14.5
|
| 13636 |
+
},
|
| 13637 |
+
{
|
| 13638 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13639 |
+
"bcp_47": "ta",
|
| 13640 |
+
"task": "translation",
|
| 13641 |
+
"metric": "bleu",
|
| 13642 |
+
"score": 0.2528104486727614,
|
| 13643 |
+
"sentence_nr": 14.5
|
| 13644 |
+
},
|
| 13645 |
+
{
|
| 13646 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13647 |
+
"bcp_47": "ta",
|
| 13648 |
+
"task": "translation",
|
| 13649 |
+
"metric": "chrf",
|
| 13650 |
+
"score": 0.42077045938882934,
|
| 13651 |
+
"sentence_nr": 14.5
|
| 13652 |
+
},
|
| 13653 |
+
{
|
| 13654 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13655 |
+
"bcp_47": "te",
|
| 13656 |
+
"task": "classification",
|
| 13657 |
+
"metric": "accuracy",
|
| 13658 |
+
"score": 0.36666666666666664,
|
| 13659 |
+
"sentence_nr": 14.5
|
| 13660 |
+
},
|
| 13661 |
+
{
|
| 13662 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13663 |
+
"bcp_47": "te",
|
| 13664 |
+
"task": "language_modeling",
|
| 13665 |
+
"metric": "chrf",
|
| 13666 |
+
"score": 0.9513838296654142,
|
| 13667 |
+
"sentence_nr": 14.5
|
| 13668 |
+
},
|
| 13669 |
+
{
|
| 13670 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13671 |
+
"bcp_47": "te",
|
| 13672 |
+
"task": "translation",
|
| 13673 |
+
"metric": "bleu",
|
| 13674 |
+
"score": 0.28338449781147135,
|
| 13675 |
+
"sentence_nr": 14.5
|
| 13676 |
+
},
|
| 13677 |
+
{
|
| 13678 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13679 |
+
"bcp_47": "te",
|
| 13680 |
+
"task": "translation",
|
| 13681 |
+
"metric": "chrf",
|
| 13682 |
+
"score": 0.467003606031036,
|
| 13683 |
+
"sentence_nr": 14.5
|
| 13684 |
+
},
|
| 13685 |
+
{
|
| 13686 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13687 |
+
"bcp_47": "tr",
|
| 13688 |
+
"task": "classification",
|
| 13689 |
+
"metric": "accuracy",
|
| 13690 |
+
"score": 0.5333333333333333,
|
| 13691 |
+
"sentence_nr": 14.5
|
| 13692 |
+
},
|
| 13693 |
+
{
|
| 13694 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13695 |
+
"bcp_47": "tr",
|
| 13696 |
+
"task": "language_modeling",
|
| 13697 |
+
"metric": "chrf",
|
| 13698 |
+
"score": 0.9446670623712353,
|
| 13699 |
+
"sentence_nr": 14.5
|
| 13700 |
+
},
|
| 13701 |
+
{
|
| 13702 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13703 |
+
"bcp_47": "tr",
|
| 13704 |
+
"task": "translation",
|
| 13705 |
+
"metric": "bleu",
|
| 13706 |
+
"score": 0.2844596261435892,
|
| 13707 |
+
"sentence_nr": 14.5
|
| 13708 |
+
},
|
| 13709 |
+
{
|
| 13710 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13711 |
+
"bcp_47": "tr",
|
| 13712 |
+
"task": "translation",
|
| 13713 |
+
"metric": "chrf",
|
| 13714 |
+
"score": 0.4525478264239361,
|
| 13715 |
+
"sentence_nr": 14.5
|
| 13716 |
+
},
|
| 13717 |
+
{
|
| 13718 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13719 |
+
"bcp_47": "ur",
|
| 13720 |
+
"task": "classification",
|
| 13721 |
+
"metric": "accuracy",
|
| 13722 |
+
"score": 0.5,
|
| 13723 |
+
"sentence_nr": 14.5
|
| 13724 |
+
},
|
| 13725 |
+
{
|
| 13726 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13727 |
+
"bcp_47": "ur",
|
| 13728 |
+
"task": "language_modeling",
|
| 13729 |
+
"metric": "chrf",
|
| 13730 |
+
"score": 0.9182703887696211,
|
| 13731 |
+
"sentence_nr": 14.5
|
| 13732 |
+
},
|
| 13733 |
+
{
|
| 13734 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13735 |
+
"bcp_47": "ur",
|
| 13736 |
+
"task": "translation",
|
| 13737 |
+
"metric": "bleu",
|
| 13738 |
+
"score": 0.2434522914619727,
|
| 13739 |
+
"sentence_nr": 14.5
|
| 13740 |
+
},
|
| 13741 |
+
{
|
| 13742 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13743 |
+
"bcp_47": "ur",
|
| 13744 |
+
"task": "translation",
|
| 13745 |
+
"metric": "chrf",
|
| 13746 |
+
"score": 0.42196914378741973,
|
| 13747 |
+
"sentence_nr": 14.5
|
| 13748 |
+
},
|
| 13749 |
+
{
|
| 13750 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13751 |
+
"bcp_47": "vi",
|
| 13752 |
+
"task": "classification",
|
| 13753 |
+
"metric": "accuracy",
|
| 13754 |
+
"score": 0.6,
|
| 13755 |
+
"sentence_nr": 14.5
|
| 13756 |
+
},
|
| 13757 |
+
{
|
| 13758 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13759 |
+
"bcp_47": "vi",
|
| 13760 |
+
"task": "language_modeling",
|
| 13761 |
+
"metric": "chrf",
|
| 13762 |
+
"score": 0.9580044761495575,
|
| 13763 |
+
"sentence_nr": 14.5
|
| 13764 |
+
},
|
| 13765 |
+
{
|
| 13766 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13767 |
+
"bcp_47": "vi",
|
| 13768 |
+
"task": "translation",
|
| 13769 |
+
"metric": "bleu",
|
| 13770 |
+
"score": 0.25541664062319624,
|
| 13771 |
+
"sentence_nr": 14.5
|
| 13772 |
+
},
|
| 13773 |
+
{
|
| 13774 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13775 |
+
"bcp_47": "vi",
|
| 13776 |
+
"task": "translation",
|
| 13777 |
+
"metric": "chrf",
|
| 13778 |
+
"score": 0.43688984396841446,
|
| 13779 |
+
"sentence_nr": 14.5
|
| 13780 |
+
},
|
| 13781 |
+
{
|
| 13782 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13783 |
+
"bcp_47": "yue",
|
| 13784 |
+
"task": "classification",
|
| 13785 |
+
"metric": "accuracy",
|
| 13786 |
+
"score": 0.43333333333333335,
|
| 13787 |
+
"sentence_nr": 14.5
|
| 13788 |
+
},
|
| 13789 |
+
{
|
| 13790 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13791 |
+
"bcp_47": "yue",
|
| 13792 |
+
"task": "language_modeling",
|
| 13793 |
+
"metric": "chrf",
|
| 13794 |
+
"score": 0.9022415223117748,
|
| 13795 |
+
"sentence_nr": 14.5
|
| 13796 |
+
},
|
| 13797 |
+
{
|
| 13798 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13799 |
+
"bcp_47": "yue",
|
| 13800 |
+
"task": "translation",
|
| 13801 |
+
"metric": "bleu",
|
| 13802 |
+
"score": 0.22628178945118504,
|
| 13803 |
+
"sentence_nr": 14.5
|
| 13804 |
+
},
|
| 13805 |
+
{
|
| 13806 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
| 13807 |
+
"bcp_47": "yue",
|
| 13808 |
+
"task": "translation",
|
| 13809 |
+
"metric": "chrf",
|
| 13810 |
+
"score": 0.4052050858435178,
|
| 13811 |
"sentence_nr": 14.5
|
| 13812 |
},
|
| 13813 |
{
|
|
|
|
| 13823 |
"bcp_47": "zh",
|
| 13824 |
"task": "language_modeling",
|
| 13825 |
"metric": "chrf",
|
| 13826 |
+
"score": 0.9003842558834025,
|
| 13827 |
"sentence_nr": 14.5
|
| 13828 |
},
|
| 13829 |
{
|
|
|
|
| 13855 |
"bcp_47": "en",
|
| 13856 |
"task": "language_modeling",
|
| 13857 |
"metric": "chrf",
|
| 13858 |
+
"score": 0.9312514772455793,
|
| 13859 |
"sentence_nr": 14.5
|
| 13860 |
},
|
| 13861 |
{
|
|
|
|
| 13887 |
"bcp_47": "zh",
|
| 13888 |
"task": "language_modeling",
|
| 13889 |
"metric": "chrf",
|
| 13890 |
+
"score": 0.831019102021034,
|
| 13891 |
"sentence_nr": 14.5
|
| 13892 |
},
|
| 13893 |
{
|
|
|
|
| 13919 |
"bcp_47": "en",
|
| 13920 |
"task": "language_modeling",
|
| 13921 |
"metric": "chrf",
|
| 13922 |
+
"score": 0.9126664788853867,
|
| 13923 |
"sentence_nr": 14.5
|
| 13924 |
},
|
| 13925 |
{
|
|
|
|
| 13951 |
"bcp_47": "zh",
|
| 13952 |
"task": "language_modeling",
|
| 13953 |
"metric": "chrf",
|
| 13954 |
+
"score": 0.8098290899553928,
|
| 13955 |
"sentence_nr": 14.5
|
| 13956 |
},
|
| 13957 |
{
|
|
|
|
| 13983 |
"bcp_47": "en",
|
| 13984 |
"task": "language_modeling",
|
| 13985 |
"metric": "chrf",
|
| 13986 |
+
"score": 0.8397325387031247,
|
| 13987 |
"sentence_nr": 14.5
|
| 13988 |
},
|
| 13989 |
{
|
|
|
|
| 14015 |
"bcp_47": "zh",
|
| 14016 |
"task": "language_modeling",
|
| 14017 |
"metric": "chrf",
|
| 14018 |
+
"score": 0.9167475699419941,
|
| 14019 |
"sentence_nr": 14.5
|
| 14020 |
},
|
| 14021 |
{
|
|
|
|
| 14047 |
"bcp_47": "en",
|
| 14048 |
"task": "language_modeling",
|
| 14049 |
"metric": "chrf",
|
| 14050 |
+
"score": 0.9807297060840695,
|
| 14051 |
"sentence_nr": 14.5
|
| 14052 |
},
|
| 14053 |
{
|
|
|
|
| 14079 |
"bcp_47": "zh",
|
| 14080 |
"task": "language_modeling",
|
| 14081 |
"metric": "chrf",
|
| 14082 |
+
"score": 0.9313441068235117,
|
| 14083 |
"sentence_nr": 14.5
|
| 14084 |
},
|
| 14085 |
{
|
|
|
|
| 14111 |
"bcp_47": "en",
|
| 14112 |
"task": "language_modeling",
|
| 14113 |
"metric": "chrf",
|
| 14114 |
+
"score": 0.5225508930892153,
|
| 14115 |
"sentence_nr": 14.5
|
| 14116 |
},
|
| 14117 |
{
|
|
|
|
| 14143 |
"bcp_47": "zh",
|
| 14144 |
"task": "language_modeling",
|
| 14145 |
"metric": "chrf",
|
| 14146 |
+
"score": 0.4174856398225174,
|
| 14147 |
"sentence_nr": 14.5
|
| 14148 |
},
|
| 14149 |
{
|