David Pomerenke
committed on
Commit
·
eaf2d97
1
Parent(s):
7cdde63
spBLEU tokenizer, run on more languages
Browse files
- bibliography.bib +16 -0
- data/INFO +1 -1
- evals/main.py +1 -1
- evals/tasks.py +3 -3
- frontend/public/{LICENSE → INFO} +0 -0
- frontend/public/results.json +371 -371
- results.json +1720 -280
bibliography.bib
CHANGED
@@ -209,6 +209,22 @@
|
|
209 |
keywords = {dataset,n=200}
|
210 |
}
|
211 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
212 |
@inproceedings{robinsonChatGPTMTCompetitive2023,
|
213 |
title = {{{ChatGPT MT}}: {{Competitive}} for {{High-}} (but {{Not Low-}}) {{Resource Languages}}},
|
214 |
shorttitle = {{{ChatGPT MT}}},
|
|
|
209 |
keywords = {dataset,n=200}
|
210 |
}
|
211 |
|
212 |
+
@misc{petrovLanguageModelTokenizers2023,
|
213 |
+
title = {Language {{Model Tokenizers Introduce Unfairness Between Languages}}},
|
214 |
+
author = {Petrov, Aleksandar and Malfa, Emanuele La and Torr, Philip H. S. and Bibi, Adel},
|
215 |
+
year = {2023},
|
216 |
+
month = oct,
|
217 |
+
number = {arXiv:2305.15425},
|
218 |
+
eprint = {2305.15425},
|
219 |
+
primaryclass = {cs},
|
220 |
+
publisher = {arXiv},
|
221 |
+
doi = {10.48550/arXiv.2305.15425},
|
222 |
+
urldate = {2025-03-24},
|
223 |
+
abstract = {Recent language models have shown impressive multilingual performance, even when not explicitly trained for it. Despite this, there are concerns about the quality of their outputs across different languages. In this paper, we show how disparity in the treatment of different languages arises at the tokenization stage, well before a model is even invoked. The same text translated into different languages can have drastically different tokenization lengths, with differences up to 15 times in some cases. These disparities persist even for tokenizers that are intentionally trained for multilingual support. Character-level and byte-level models also exhibit over 4 times the difference in the encoding length for some language pairs. This induces unfair treatment for some language communities in regard to the cost of accessing commercial language services, the processing time and latency, as well as the amount of content that can be provided as context to the models. Therefore, we make the case that we should train future language models using multilingually fair subword tokenizers.},
|
224 |
+
archiveprefix = {arXiv},
|
225 |
+
file = {/Users/david/Zotero/storage/NX3DT98Z/Petrov et al. - 2023 - Language Model Tokenizers Introduce Unfairness Between Languages.pdf;/Users/david/Zotero/storage/FKJQP22D/2305.html}
|
226 |
+
}
|
227 |
+
|
228 |
@inproceedings{robinsonChatGPTMTCompetitive2023,
|
229 |
title = {{{ChatGPT MT}}: {{Competitive}} for {{High-}} (but {{Not Low-}}) {{Resource Languages}}},
|
230 |
shorttitle = {{{ChatGPT MT}}},
|
data/INFO
CHANGED
@@ -2,4 +2,4 @@ fleurs: https://huggingface.co/datasets/google/fleurs via eval.py
|
|
2 |
floresp-v2.0-rc.3: https://github.com/openlanguagedata/flores
|
3 |
glottolog_languoid.csv: https://glottolog.org/meta/downloads
|
4 |
ScriptCodes.csv: https://www.unicode.org/iso15924/iso15924-codes.html
|
5 |
-
spbleu: https://github.com/facebookresearch/flores/tree/main
|
|
|
2 |
floresp-v2.0-rc.3: https://github.com/openlanguagedata/flores
|
3 |
glottolog_languoid.csv: https://glottolog.org/meta/downloads
|
4 |
ScriptCodes.csv: https://www.unicode.org/iso15924/iso15924-codes.html
|
5 |
+
spbleu: https://github.com/facebookresearch/flores/tree/main/flores200#spm-and-dictionary
|
evals/main.py
CHANGED
@@ -13,7 +13,7 @@ from tqdm.asyncio import tqdm_asyncio
|
|
13 |
# ===== config =====
|
14 |
|
15 |
n_sentences = 30
|
16 |
-
langs_eval = languages.iloc[:
|
17 |
langs_eval_detailed = languages.iloc[:2]
|
18 |
transcription_langs_eval = languages.iloc[:10]
|
19 |
transcription_langs_eval_detailed = languages.iloc[:5]
|
|
|
13 |
# ===== config =====
|
14 |
|
15 |
n_sentences = 30
|
16 |
+
langs_eval = languages.iloc[:30]
|
17 |
langs_eval_detailed = languages.iloc[:2]
|
18 |
transcription_langs_eval = languages.iloc[:10]
|
19 |
transcription_langs_eval_detailed = languages.iloc[:5]
|
evals/tasks.py
CHANGED
@@ -3,16 +3,16 @@ import random
|
|
3 |
import evaluate
|
4 |
import pandas as pd
|
5 |
from joblib.memory import Memory
|
6 |
-
from transformers import NllbTokenizer
|
7 |
from languages import languages, script_name
|
8 |
from datasets_.flores import flores_sentences
|
9 |
from models import complete, transcribe
|
|
|
|
|
10 |
cache = Memory(location=".cache", verbose=0).cache
|
11 |
bleu = evaluate.load("bleu")
|
12 |
chrf = evaluate.load("chrf")
|
13 |
wer = evaluate.load("wer")
|
14 |
-
tokenizer =
|
15 |
-
|
16 |
|
17 |
# sample languages to translate to
|
18 |
target_languages = languages[languages["in_benchmark"]].sample(
|
|
|
3 |
import evaluate
|
4 |
import pandas as pd
|
5 |
from joblib.memory import Memory
|
|
|
6 |
from languages import languages, script_name
|
7 |
from datasets_.flores import flores_sentences
|
8 |
from models import complete, transcribe
|
9 |
+
import sentencepiece as spm
|
10 |
+
|
11 |
cache = Memory(location=".cache", verbose=0).cache
|
12 |
bleu = evaluate.load("bleu")
|
13 |
chrf = evaluate.load("chrf")
|
14 |
wer = evaluate.load("wer")
|
15 |
+
tokenizer = spm.SentencePieceProcessor(model_file="data/spbleu/flores200_sacrebleu_tokenizer_spm.model")
|
|
|
16 |
|
17 |
# sample languages to translate to
|
18 |
target_languages = languages[languages["in_benchmark"]].sample(
|
frontend/public/{LICENSE → INFO}
RENAMED
File without changes
|
frontend/public/results.json
CHANGED
@@ -26,7 +26,7 @@
|
|
26 |
"license": null,
|
27 |
"average": 0.66,
|
28 |
"classification_accuracy": 0.73,
|
29 |
-
"language_modeling_chrf": 0.
|
30 |
"translation_bleu": 0.4,
|
31 |
"translation_chrf": 0.54
|
32 |
},
|
@@ -39,9 +39,9 @@
|
|
39 |
"size": 27432406640.0,
|
40 |
"type": "Open",
|
41 |
"license": "Gemma",
|
42 |
-
"average": 0.
|
43 |
"classification_accuracy": 0.72,
|
44 |
-
"language_modeling_chrf": 0.
|
45 |
"translation_bleu": 0.37,
|
46 |
"translation_chrf": 0.54
|
47 |
},
|
@@ -54,41 +54,41 @@
|
|
54 |
"size": 70553706496.0,
|
55 |
"type": "Open",
|
56 |
"license": "Llama3.1",
|
57 |
-
"average": 0.
|
58 |
"classification_accuracy": 0.57,
|
59 |
-
"language_modeling_chrf": 0.
|
60 |
"translation_bleu": 0.43,
|
61 |
"translation_chrf": 0.57
|
62 |
},
|
63 |
{
|
64 |
"rank": 5,
|
65 |
-
"provider": "
|
66 |
-
"model": "
|
67 |
"hf_id": null,
|
68 |
"creation_date": null,
|
69 |
"size": null,
|
70 |
"type": "Commercial",
|
71 |
"license": null,
|
72 |
"average": 0.61,
|
73 |
-
"classification_accuracy": 0.
|
74 |
-
"language_modeling_chrf": 0.
|
75 |
-
"translation_bleu": 0.
|
76 |
-
"translation_chrf": 0.
|
77 |
},
|
78 |
{
|
79 |
"rank": 6,
|
80 |
-
"provider": "
|
81 |
-
"model": "
|
82 |
"hf_id": null,
|
83 |
"creation_date": null,
|
84 |
"size": null,
|
85 |
"type": "Commercial",
|
86 |
"license": null,
|
87 |
-
"average": 0.
|
88 |
-
"classification_accuracy": 0.
|
89 |
-
"language_modeling_chrf": 0.
|
90 |
-
"translation_bleu": 0.
|
91 |
-
"translation_chrf": 0.
|
92 |
},
|
93 |
{
|
94 |
"rank": 7,
|
@@ -101,7 +101,7 @@
|
|
101 |
"license": null,
|
102 |
"average": 0.6,
|
103 |
"classification_accuracy": 0.52,
|
104 |
-
"language_modeling_chrf": 0.
|
105 |
"translation_bleu": 0.39,
|
106 |
"translation_chrf": 0.55
|
107 |
},
|
@@ -116,7 +116,7 @@
|
|
116 |
"license": "Apache 2.0",
|
117 |
"average": 0.58,
|
118 |
"classification_accuracy": 0.55,
|
119 |
-
"language_modeling_chrf": 0.
|
120 |
"translation_bleu": 0.38,
|
121 |
"translation_chrf": 0.52
|
122 |
},
|
@@ -129,11 +129,11 @@
|
|
129 |
"size": 70553706496.0,
|
130 |
"type": "Open",
|
131 |
"license": "Llama3.3",
|
132 |
-
"average": 0.
|
133 |
-
"classification_accuracy": 0.
|
134 |
"language_modeling_chrf": 0.94,
|
135 |
-
"translation_bleu": 0.
|
136 |
-
"translation_chrf": 0.
|
137 |
},
|
138 |
{
|
139 |
"rank": 10,
|
@@ -144,9 +144,9 @@
|
|
144 |
"size": null,
|
145 |
"type": "Commercial",
|
146 |
"license": null,
|
147 |
-
"average": 0.
|
148 |
"classification_accuracy": 0.5,
|
149 |
-
"language_modeling_chrf": 0.
|
150 |
"translation_bleu": 0.32,
|
151 |
"translation_chrf": 0.49
|
152 |
},
|
@@ -161,7 +161,7 @@
|
|
161 |
"license": "Mit",
|
162 |
"average": 0.52,
|
163 |
"classification_accuracy": 0.42,
|
164 |
-
"language_modeling_chrf": 0.
|
165 |
"translation_bleu": 0.32,
|
166 |
"translation_chrf": 0.46
|
167 |
},
|
@@ -176,7 +176,7 @@
|
|
176 |
"license": "Apache 2.0",
|
177 |
"average": 0.25,
|
178 |
"classification_accuracy": 0.0,
|
179 |
-
"language_modeling_chrf": 0.
|
180 |
"translation_bleu": 0.21,
|
181 |
"translation_chrf": 0.3
|
182 |
}
|
@@ -220,7 +220,7 @@
|
|
220 |
"in_benchmark": true,
|
221 |
"NaN": 0.0,
|
222 |
"classification_accuracy": 0.53,
|
223 |
-
"language_modeling_chrf": 0.
|
224 |
"translation_bleu": 0.32,
|
225 |
"translation_chrf": 0.49
|
226 |
},
|
@@ -248,7 +248,7 @@
|
|
248 |
"in_benchmark": true,
|
249 |
"NaN": 0.0,
|
250 |
"classification_accuracy": 0.43,
|
251 |
-
"language_modeling_chrf": 0.
|
252 |
"translation_bleu": 0.28,
|
253 |
"translation_chrf": 0.47
|
254 |
},
|
@@ -262,7 +262,7 @@
|
|
262 |
"in_benchmark": true,
|
263 |
"NaN": 0.0,
|
264 |
"classification_accuracy": 0.5,
|
265 |
-
"language_modeling_chrf": 0.
|
266 |
"translation_bleu": 0.24,
|
267 |
"translation_chrf": 0.42
|
268 |
},
|
@@ -290,7 +290,7 @@
|
|
290 |
"in_benchmark": true,
|
291 |
"NaN": 0.0,
|
292 |
"classification_accuracy": 0.4,
|
293 |
-
"language_modeling_chrf": 0.
|
294 |
"translation_bleu": 0.2,
|
295 |
"translation_chrf": 0.41
|
296 |
},
|
@@ -300,11 +300,11 @@
|
|
300 |
"autonym": "Português",
|
301 |
"speakers": 237496885,
|
302 |
"family": "Indo-European",
|
303 |
-
"average": 0.
|
304 |
"in_benchmark": true,
|
305 |
"NaN": 0.0,
|
306 |
"classification_accuracy": 0.5,
|
307 |
-
"language_modeling_chrf": 0.
|
308 |
"translation_bleu": 0.31,
|
309 |
"translation_chrf": 0.49
|
310 |
},
|
@@ -314,11 +314,11 @@
|
|
314 |
"autonym": "ਪੰਜਾਬੀ",
|
315 |
"speakers": 203571210,
|
316 |
"family": "Indo-European",
|
317 |
-
"average": 0.
|
318 |
"in_benchmark": true,
|
319 |
"NaN": 0.0,
|
320 |
"classification_accuracy": 0.4,
|
321 |
-
"language_modeling_chrf": 0.
|
322 |
"translation_bleu": 0.34,
|
323 |
"translation_chrf": 0.49
|
324 |
},
|
@@ -328,13 +328,13 @@
|
|
328 |
"autonym": "Русский",
|
329 |
"speakers": 195841151,
|
330 |
"family": "Indo-European",
|
331 |
-
"average": 0.
|
332 |
"in_benchmark": true,
|
333 |
"NaN": 0.0,
|
334 |
-
"classification_accuracy": 0.
|
335 |
-
"language_modeling_chrf": 0.
|
336 |
-
"translation_bleu": 0.
|
337 |
-
"translation_chrf": 0.
|
338 |
},
|
339 |
{
|
340 |
"bcp_47": "sw",
|
@@ -342,13 +342,13 @@
|
|
342 |
"autonym": "Kiswahili",
|
343 |
"speakers": 171610296,
|
344 |
"family": "Atlantic-Congo",
|
345 |
-
"average": 0.
|
346 |
"in_benchmark": true,
|
347 |
"NaN": 0.0,
|
348 |
-
"classification_accuracy": 0.
|
349 |
-
"language_modeling_chrf": 0.
|
350 |
-
"translation_bleu": 0.
|
351 |
-
"translation_chrf": 0.
|
352 |
},
|
353 |
{
|
354 |
"bcp_47": "id",
|
@@ -356,13 +356,13 @@
|
|
356 |
"autonym": "Bahasa Indonesia",
|
357 |
"speakers": 171207687,
|
358 |
"family": "Austronesian",
|
359 |
-
"average": 0.
|
360 |
"in_benchmark": true,
|
361 |
"NaN": 0.0,
|
362 |
-
"classification_accuracy": 0.
|
363 |
-
"language_modeling_chrf": 0.
|
364 |
-
"translation_bleu": 0.
|
365 |
-
"translation_chrf": 0.
|
366 |
},
|
367 |
{
|
368 |
"bcp_47": "de",
|
@@ -370,13 +370,13 @@
|
|
370 |
"autonym": "Deutsch",
|
371 |
"speakers": 136350226,
|
372 |
"family": "Indo-European",
|
373 |
-
"average": 0.
|
374 |
"in_benchmark": true,
|
375 |
"NaN": 0.0,
|
376 |
-
"classification_accuracy": 0.
|
377 |
-
"language_modeling_chrf": 0.
|
378 |
-
"translation_bleu": 0.
|
379 |
-
"translation_chrf": 0.
|
380 |
},
|
381 |
{
|
382 |
"bcp_47": "ja",
|
@@ -384,13 +384,13 @@
|
|
384 |
"autonym": "日本語",
|
385 |
"speakers": 119729026,
|
386 |
"family": "Japonic",
|
387 |
-
"average": 0.
|
388 |
"in_benchmark": true,
|
389 |
"NaN": 0.0,
|
390 |
-
"classification_accuracy": 0.
|
391 |
-
"language_modeling_chrf": 0.
|
392 |
-
"translation_bleu": 0.
|
393 |
-
"translation_chrf": 0.
|
394 |
},
|
395 |
{
|
396 |
"bcp_47": "te",
|
@@ -398,13 +398,13 @@
|
|
398 |
"autonym": "తెలుగు",
|
399 |
"speakers": 95478480,
|
400 |
"family": "Dravidian",
|
401 |
-
"average": 0.
|
402 |
"in_benchmark": true,
|
403 |
"NaN": 0.0,
|
404 |
-
"classification_accuracy": 0.
|
405 |
-
"language_modeling_chrf": 0.
|
406 |
-
"translation_bleu": 0.
|
407 |
-
"translation_chrf": 0.
|
408 |
},
|
409 |
{
|
410 |
"bcp_47": "lah",
|
@@ -426,13 +426,13 @@
|
|
426 |
"autonym": "मराठी",
|
427 |
"speakers": 92826300,
|
428 |
"family": "Indo-European",
|
429 |
-
"average": 0.
|
430 |
"in_benchmark": true,
|
431 |
"NaN": 0.0,
|
432 |
-
"classification_accuracy": 0.
|
433 |
-
"language_modeling_chrf": 0.
|
434 |
-
"translation_bleu": 0.
|
435 |
-
"translation_chrf": 0.
|
436 |
},
|
437 |
{
|
438 |
"bcp_47": "jv",
|
@@ -440,13 +440,13 @@
|
|
440 |
"autonym": "Jawa",
|
441 |
"speakers": 91180665,
|
442 |
"family": "Austronesian",
|
443 |
-
"average": 0.
|
444 |
"in_benchmark": true,
|
445 |
"NaN": 0.0,
|
446 |
-
"classification_accuracy": 0.
|
447 |
-
"language_modeling_chrf": 0.
|
448 |
-
"translation_bleu": 0.
|
449 |
-
"translation_chrf": 0.
|
450 |
},
|
451 |
{
|
452 |
"bcp_47": "vi",
|
@@ -454,13 +454,13 @@
|
|
454 |
"autonym": "Tiếng Việt",
|
455 |
"speakers": 86222962,
|
456 |
"family": "Austroasiatic",
|
457 |
-
"average": 0.
|
458 |
"in_benchmark": true,
|
459 |
"NaN": 0.0,
|
460 |
-
"classification_accuracy": 0.
|
461 |
-
"language_modeling_chrf": 0.
|
462 |
-
"translation_bleu": 0.
|
463 |
-
"translation_chrf": 0.
|
464 |
},
|
465 |
{
|
466 |
"bcp_47": "ta",
|
@@ -468,13 +468,13 @@
|
|
468 |
"autonym": "தமிழ்",
|
469 |
"speakers": 85616159,
|
470 |
"family": "Dravidian",
|
471 |
-
"average": 0.
|
472 |
"in_benchmark": true,
|
473 |
"NaN": 0.0,
|
474 |
-
"classification_accuracy": 0.
|
475 |
-
"language_modeling_chrf": 0.
|
476 |
-
"translation_bleu": 0.
|
477 |
-
"translation_chrf": 0.
|
478 |
},
|
479 |
{
|
480 |
"bcp_47": "fa",
|
@@ -482,13 +482,13 @@
|
|
482 |
"autonym": "فارسی",
|
483 |
"speakers": 84710459,
|
484 |
"family": "Indo-European",
|
485 |
-
"average": 0.
|
486 |
"in_benchmark": true,
|
487 |
"NaN": 0.0,
|
488 |
-
"classification_accuracy": 0.
|
489 |
-
"language_modeling_chrf": 0.
|
490 |
-
"translation_bleu": 0.
|
491 |
-
"translation_chrf": 0.
|
492 |
},
|
493 |
{
|
494 |
"bcp_47": "wuu",
|
@@ -510,13 +510,13 @@
|
|
510 |
"autonym": "Türkçe",
|
511 |
"speakers": 80360704,
|
512 |
"family": "Turkic",
|
513 |
-
"average": 0.
|
514 |
"in_benchmark": true,
|
515 |
"NaN": 0.0,
|
516 |
-
"classification_accuracy": 0.
|
517 |
-
"language_modeling_chrf": 0.
|
518 |
-
"translation_bleu": 0.
|
519 |
-
"translation_chrf": 0.
|
520 |
},
|
521 |
{
|
522 |
"bcp_47": "yue",
|
@@ -524,13 +524,13 @@
|
|
524 |
"autonym": "粵語",
|
525 |
"speakers": 79654759,
|
526 |
"family": "Sino-Tibetan",
|
527 |
-
"average": 0.
|
528 |
"in_benchmark": true,
|
529 |
"NaN": 0.0,
|
530 |
-
"classification_accuracy": 0.
|
531 |
-
"language_modeling_chrf": 0.
|
532 |
-
"translation_bleu": 0.
|
533 |
-
"translation_chrf": 0.
|
534 |
},
|
535 |
{
|
536 |
"bcp_47": "ko",
|
@@ -538,13 +538,13 @@
|
|
538 |
"autonym": "한국어",
|
539 |
"speakers": 78357046,
|
540 |
"family": "Koreanic",
|
541 |
-
"average": 0.
|
542 |
"in_benchmark": true,
|
543 |
"NaN": 0.0,
|
544 |
-
"classification_accuracy": 0.
|
545 |
-
"language_modeling_chrf": 0.
|
546 |
-
"translation_bleu": 0.
|
547 |
-
"translation_chrf": 0.
|
548 |
},
|
549 |
{
|
550 |
"bcp_47": "it",
|
@@ -552,13 +552,13 @@
|
|
552 |
"autonym": "Italiano",
|
553 |
"speakers": 70247060,
|
554 |
"family": "Indo-European",
|
555 |
-
"average": 0.
|
556 |
"in_benchmark": true,
|
557 |
"NaN": 0.0,
|
558 |
-
"classification_accuracy": 0.
|
559 |
-
"language_modeling_chrf": 0.
|
560 |
-
"translation_bleu": 0.
|
561 |
-
"translation_chrf": 0.
|
562 |
},
|
563 |
{
|
564 |
"bcp_47": "fil",
|
@@ -566,13 +566,13 @@
|
|
566 |
"autonym": "Filipino",
|
567 |
"speakers": 67471096,
|
568 |
"family": "Austronesian",
|
569 |
-
"average": 0.
|
570 |
"in_benchmark": true,
|
571 |
"NaN": 0.0,
|
572 |
-
"classification_accuracy": 0.
|
573 |
-
"language_modeling_chrf": 0.
|
574 |
-
"translation_bleu": 0.
|
575 |
-
"translation_chrf": 0.
|
576 |
},
|
577 |
{
|
578 |
"bcp_47": "arz",
|
@@ -580,13 +580,13 @@
|
|
580 |
"autonym": "Egyptian Arabic",
|
581 |
"speakers": 66639360,
|
582 |
"family": "Afro-Asiatic",
|
583 |
-
"average": 0.
|
584 |
"in_benchmark": true,
|
585 |
"NaN": 0.0,
|
586 |
-
"classification_accuracy": 0.
|
587 |
-
"language_modeling_chrf": 0.
|
588 |
-
"translation_bleu": 0.
|
589 |
-
"translation_chrf": 0.
|
590 |
},
|
591 |
{
|
592 |
"bcp_47": "gu",
|
@@ -594,13 +594,13 @@
|
|
594 |
"autonym": "ગુજરાતી",
|
595 |
"speakers": 61721799,
|
596 |
"family": "Indo-European",
|
597 |
-
"average": 0.
|
598 |
"in_benchmark": true,
|
599 |
"NaN": 0.0,
|
600 |
-
"classification_accuracy": 0.
|
601 |
-
"language_modeling_chrf": 0.
|
602 |
-
"translation_bleu": 0.
|
603 |
-
"translation_chrf": 0.
|
604 |
},
|
605 |
{
|
606 |
"bcp_47": "th",
|
@@ -10164,7 +10164,7 @@
|
|
10164 |
]
|
10165 |
},
|
10166 |
"AE": {
|
10167 |
-
"score": 0.
|
10168 |
"languages": [
|
10169 |
{
|
10170 |
"name": "English",
|
@@ -10182,7 +10182,7 @@
|
|
10182 |
"name": "Persian",
|
10183 |
"bcp_47": "fa",
|
10184 |
"population": 189850,
|
10185 |
-
"score": 0.
|
10186 |
},
|
10187 |
{
|
10188 |
"name": "Pashto",
|
@@ -10205,7 +10205,7 @@
|
|
10205 |
]
|
10206 |
},
|
10207 |
"AG": {
|
10208 |
-
"score": 0.
|
10209 |
"languages": [
|
10210 |
{
|
10211 |
"name": "English",
|
@@ -10217,7 +10217,7 @@
|
|
10217 |
"name": "Portuguese",
|
10218 |
"bcp_47": "pt",
|
10219 |
"population": 1571,
|
10220 |
-
"score": 0.
|
10221 |
}
|
10222 |
]
|
10223 |
},
|
@@ -10290,7 +10290,7 @@
|
|
10290 |
]
|
10291 |
},
|
10292 |
"AT": {
|
10293 |
-
"score": 0.
|
10294 |
"languages": [
|
10295 |
{
|
10296 |
"name": "English",
|
@@ -10308,13 +10308,13 @@
|
|
10308 |
"name": "German",
|
10309 |
"bcp_47": "de",
|
10310 |
"population": 8593666,
|
10311 |
-
"score": 0.
|
10312 |
},
|
10313 |
{
|
10314 |
"name": "Italian",
|
10315 |
"bcp_47": "it",
|
10316 |
"population": 797350,
|
10317 |
-
"score": 0.
|
10318 |
},
|
10319 |
{
|
10320 |
"name": "Bavarian",
|
@@ -10343,7 +10343,7 @@
|
|
10343 |
]
|
10344 |
},
|
10345 |
"AU": {
|
10346 |
-
"score": 0.
|
10347 |
"languages": [
|
10348 |
{
|
10349 |
"name": "English",
|
@@ -10361,7 +10361,7 @@
|
|
10361 |
"name": "Italian",
|
10362 |
"bcp_47": "it",
|
10363 |
"population": 483864,
|
10364 |
-
"score": 0.
|
10365 |
},
|
10366 |
{
|
10367 |
"name": "Hmong Njua",
|
@@ -10506,7 +10506,7 @@
|
|
10506 |
]
|
10507 |
},
|
10508 |
"BE": {
|
10509 |
-
"score": 0.
|
10510 |
"languages": [
|
10511 |
{
|
10512 |
"name": "English",
|
@@ -10524,7 +10524,7 @@
|
|
10524 |
"name": "German",
|
10525 |
"bcp_47": "de",
|
10526 |
"population": 2578554,
|
10527 |
-
"score": 0.
|
10528 |
},
|
10529 |
{
|
10530 |
"name": "Dutch",
|
@@ -10547,7 +10547,7 @@
|
|
10547 |
]
|
10548 |
},
|
10549 |
"BG": {
|
10550 |
-
"score": 0.
|
10551 |
"languages": [
|
10552 |
{
|
10553 |
"name": "English",
|
@@ -10559,19 +10559,19 @@
|
|
10559 |
"name": "Russian",
|
10560 |
"bcp_47": "ru",
|
10561 |
"population": 1602387,
|
10562 |
-
"score": 0.
|
10563 |
},
|
10564 |
{
|
10565 |
"name": "German",
|
10566 |
"bcp_47": "de",
|
10567 |
"population": 557352,
|
10568 |
-
"score": 0.
|
10569 |
},
|
10570 |
{
|
10571 |
"name": "Turkish",
|
10572 |
"bcp_47": "tr",
|
10573 |
"population": 766359,
|
10574 |
-
"score": 0.
|
10575 |
},
|
10576 |
{
|
10577 |
"name": "Bulgarian",
|
@@ -10582,7 +10582,7 @@
|
|
10582 |
]
|
10583 |
},
|
10584 |
"BI": {
|
10585 |
-
"score": 0.
|
10586 |
"languages": [
|
10587 |
{
|
10588 |
"name": "English",
|
@@ -10600,7 +10600,7 @@
|
|
10600 |
"name": "Swahili",
|
10601 |
"bcp_47": "sw",
|
10602 |
"population": 6408,
|
10603 |
-
"score": 0.
|
10604 |
},
|
10605 |
{
|
10606 |
"name": "Rundi",
|
@@ -10645,7 +10645,7 @@
|
|
10645 |
]
|
10646 |
},
|
10647 |
"BR": {
|
10648 |
-
"score": 0.
|
10649 |
"languages": [
|
10650 |
{
|
10651 |
"name": "English",
|
@@ -10663,31 +10663,31 @@
|
|
10663 |
"name": "Portuguese",
|
10664 |
"bcp_47": "pt",
|
10665 |
"population": 192661560,
|
10666 |
-
"score": 0.
|
10667 |
},
|
10668 |
{
|
10669 |
"name": "German",
|
10670 |
"bcp_47": "de",
|
10671 |
"population": 1778414,
|
10672 |
-
"score": 0.
|
10673 |
},
|
10674 |
{
|
10675 |
"name": "Japanese",
|
10676 |
"bcp_47": "ja",
|
10677 |
"population": 444604,
|
10678 |
-
"score": 0.
|
10679 |
},
|
10680 |
{
|
10681 |
"name": "Korean",
|
10682 |
"bcp_47": "ko",
|
10683 |
"population": 44460,
|
10684 |
-
"score": 0.
|
10685 |
},
|
10686 |
{
|
10687 |
"name": "Italian",
|
10688 |
"bcp_47": "it",
|
10689 |
"population": 592805,
|
10690 |
-
"score": 0.
|
10691 |
},
|
10692 |
{
|
10693 |
"name": "Venetian",
|
@@ -10819,7 +10819,7 @@
|
|
10819 |
]
|
10820 |
},
|
10821 |
"CA": {
|
10822 |
-
"score": 0.
|
10823 |
"languages": [
|
10824 |
{
|
10825 |
"name": "English",
|
@@ -10873,85 +10873,85 @@
|
|
10873 |
"name": "Portuguese",
|
10874 |
"bcp_47": "pt",
|
10875 |
"population": 229934,
|
10876 |
-
"score": 0.
|
10877 |
},
|
10878 |
{
|
10879 |
"name": "Punjabi",
|
10880 |
"bcp_47": "pa",
|
10881 |
"population": 603106,
|
10882 |
-
"score": 0.
|
10883 |
},
|
10884 |
{
|
10885 |
"name": "Russian",
|
10886 |
"bcp_47": "ru",
|
10887 |
"population": 211087,
|
10888 |
-
"score": 0.
|
10889 |
},
|
10890 |
{
|
10891 |
"name": "German",
|
10892 |
"bcp_47": "de",
|
10893 |
"population": 294014,
|
10894 |
-
"score": 0.
|
10895 |
},
|
10896 |
{
|
10897 |
"name": "Japanese",
|
10898 |
"bcp_47": "ja",
|
10899 |
"population": 52772,
|
10900 |
-
"score": 0.
|
10901 |
},
|
10902 |
{
|
10903 |
"name": "Vietnamese",
|
10904 |
"bcp_47": "vi",
|
10905 |
"population": 184701,
|
10906 |
-
"score": 0.
|
10907 |
},
|
10908 |
{
|
10909 |
"name": "Tamil",
|
10910 |
"bcp_47": "ta",
|
10911 |
"population": 184701,
|
10912 |
-
"score": 0.
|
10913 |
},
|
10914 |
{
|
10915 |
"name": "Persian",
|
10916 |
"bcp_47": "fa",
|
10917 |
"population": 245012,
|
10918 |
-
"score": 0.
|
10919 |
},
|
10920 |
{
|
10921 |
"name": "Turkish",
|
10922 |
"bcp_47": "tr",
|
10923 |
"population": 37694,
|
10924 |
-
"score": 0.
|
10925 |
},
|
10926 |
{
|
10927 |
"name": "Cantonese",
|
10928 |
"bcp_47": "yue",
|
10929 |
"population": 640800,
|
10930 |
-
"score": 0.
|
10931 |
},
|
10932 |
{
|
10933 |
"name": "Korean",
|
10934 |
"bcp_47": "ko",
|
10935 |
"population": 169623,
|
10936 |
-
"score": 0.
|
10937 |
},
|
10938 |
{
|
10939 |
"name": "Italian",
|
10940 |
"bcp_47": "it",
|
10941 |
"population": 343016,
|
10942 |
-
"score": 0.
|
10943 |
},
|
10944 |
{
|
10945 |
"name": "Filipino",
|
10946 |
"bcp_47": "fil",
|
10947 |
"population": 565412,
|
10948 |
-
"score": 0.
|
10949 |
},
|
10950 |
{
|
10951 |
"name": "Gujarati",
|
10952 |
"bcp_47": "gu",
|
10953 |
"population": 135699,
|
10954 |
-
"score": 0.
|
10955 |
},
|
10956 |
{
|
10957 |
"name": "Polish",
|
@@ -11189,7 +11189,7 @@
|
|
11189 |
]
|
11190 |
},
|
11191 |
"CH": {
|
11192 |
-
"score": 0.
|
11193 |
"languages": [
|
11194 |
{
|
11195 |
"name": "English",
|
@@ -11207,19 +11207,19 @@
|
|
11207 |
"name": "Portuguese",
|
11208 |
"bcp_47": "pt",
|
11209 |
"population": 285736,
|
11210 |
-
"score": 0.
|
11211 |
},
|
11212 |
{
|
11213 |
"name": "German",
|
11214 |
"bcp_47": "de",
|
11215 |
"population": 6134913,
|
11216 |
-
"score": 0.
|
11217 |
},
|
11218 |
{
|
11219 |
"name": "Italian",
|
11220 |
"bcp_47": "it",
|
11221 |
"population": 361372,
|
11222 |
-
"score": 0.
|
11223 |
},
|
11224 |
{
|
11225 |
"name": "Swiss German",
|
@@ -11455,7 +11455,7 @@
|
|
11455 |
]
|
11456 |
},
|
11457 |
"CN": {
|
11458 |
-
"score": 0.
|
11459 |
"languages": [
|
11460 |
{
|
11461 |
"name": "English",
|
@@ -11473,13 +11473,13 @@
|
|
11473 |
"name": "Russian",
|
11474 |
"bcp_47": "ru",
|
11475 |
"population": 13940,
|
11476 |
-
"score": 0.
|
11477 |
},
|
11478 |
{
|
11479 |
"name": "Vietnamese",
|
11480 |
"bcp_47": "vi",
|
11481 |
"population": 6970,
|
11482 |
-
"score": 0.
|
11483 |
},
|
11484 |
{
|
11485 |
"name": "Wu Chinese",
|
@@ -11491,13 +11491,13 @@
|
|
11491 |
"name": "Cantonese",
|
11492 |
"bcp_47": "yue",
|
11493 |
"population": 72489040,
|
11494 |
-
"score": 0.
|
11495 |
},
|
11496 |
{
|
11497 |
"name": "Korean",
|
11498 |
"bcp_47": "ko",
|
11499 |
"population": 2091030,
|
11500 |
-
"score": 0.
|
11501 |
},
|
11502 |
{
|
11503 |
"name": "Xiang Chinese",
|
@@ -11649,7 +11649,7 @@
|
|
11649 |
]
|
11650 |
},
|
11651 |
"CY": {
|
11652 |
-
"score": 0.
|
11653 |
"languages": [
|
11654 |
{
|
11655 |
"name": "English",
|
@@ -11673,7 +11673,7 @@
|
|
11673 |
"name": "Turkish",
|
11674 |
"bcp_47": "tr",
|
11675 |
"population": 291336,
|
11676 |
-
"score": 0.
|
11677 |
},
|
11678 |
{
|
11679 |
"name": "Greek",
|
@@ -11690,7 +11690,7 @@
|
|
11690 |
]
|
11691 |
},
|
11692 |
"CZ": {
|
11693 |
-
"score": 0.
|
11694 |
"languages": [
|
11695 |
{
|
11696 |
"name": "English",
|
@@ -11702,7 +11702,7 @@
|
|
11702 |
"name": "German",
|
11703 |
"bcp_47": "de",
|
11704 |
"population": 1605375,
|
11705 |
-
"score": 0.
|
11706 |
},
|
11707 |
{
|
11708 |
"name": "Polish",
|
@@ -11725,7 +11725,7 @@
|
|
11725 |
]
|
11726 |
},
|
11727 |
"DE": {
|
11728 |
-
"score": 0.
|
11729 |
"languages": [
|
11730 |
{
|
11731 |
"name": "English",
|
@@ -11749,25 +11749,25 @@
|
|
11749 |
"name": "Russian",
|
11750 |
"bcp_47": "ru",
|
11751 |
"population": 4809582,
|
11752 |
-
"score": 0.
|
11753 |
},
|
11754 |
{
|
11755 |
"name": "German",
|
11756 |
"bcp_47": "de",
|
11757 |
"population": 72945327,
|
11758 |
-
"score": 0.
|
11759 |
},
|
11760 |
{
|
11761 |
"name": "Turkish",
|
11762 |
"bcp_47": "tr",
|
11763 |
"population": 2003992,
|
11764 |
-
"score": 0.
|
11765 |
},
|
11766 |
{
|
11767 |
"name": "Italian",
|
11768 |
"bcp_47": "it",
|
11769 |
"population": 5611179,
|
11770 |
-
"score": 0.
|
11771 |
},
|
11772 |
{
|
11773 |
"name": "Polish",
|
@@ -11891,7 +11891,7 @@
|
|
11891 |
]
|
11892 |
},
|
11893 |
"DK": {
|
11894 |
-
"score": 0.
|
11895 |
"languages": [
|
11896 |
{
|
11897 |
"name": "English",
|
@@ -11903,7 +11903,7 @@
|
|
11903 |
"name": "German",
|
11904 |
"bcp_47": "de",
|
11905 |
"population": 2758623,
|
11906 |
-
"score": 0.
|
11907 |
},
|
11908 |
{
|
11909 |
"name": "Swedish",
|
@@ -12001,7 +12001,7 @@
|
|
12001 |
]
|
12002 |
},
|
12003 |
"EE": {
|
12004 |
-
"score": 0.
|
12005 |
"languages": [
|
12006 |
{
|
12007 |
"name": "English",
|
@@ -12013,7 +12013,7 @@
|
|
12013 |
"name": "Russian",
|
12014 |
"bcp_47": "ru",
|
12015 |
"population": 688027,
|
12016 |
-
"score": 0.
|
12017 |
},
|
12018 |
{
|
12019 |
"name": "Finnish",
|
@@ -12042,7 +12042,7 @@
|
|
12042 |
]
|
12043 |
},
|
12044 |
"EG": {
|
12045 |
-
"score": 0.
|
12046 |
"languages": [
|
12047 |
{
|
12048 |
"name": "English",
|
@@ -12060,7 +12060,7 @@
|
|
12060 |
"name": "Egyptian Arabic",
|
12061 |
"bcp_47": "arz",
|
12062 |
"population": 66639360,
|
12063 |
-
"score": 0.
|
12064 |
},
|
12065 |
{
|
12066 |
"name": "Greek",
|
@@ -12236,7 +12236,7 @@
|
|
12236 |
]
|
12237 |
},
|
12238 |
"FI": {
|
12239 |
-
"score": 0.
|
12240 |
"languages": [
|
12241 |
{
|
12242 |
"name": "English",
|
@@ -12248,13 +12248,13 @@
|
|
12248 |
"name": "Russian",
|
12249 |
"bcp_47": "ru",
|
12250 |
"population": 45131,
|
12251 |
-
"score": 0.
|
12252 |
},
|
12253 |
{
|
12254 |
"name": "German",
|
12255 |
"bcp_47": "de",
|
12256 |
"population": 1002901,
|
12257 |
-
"score": 0.
|
12258 |
},
|
12259 |
{
|
12260 |
"name": "Swedish",
|
@@ -12388,7 +12388,7 @@
|
|
12388 |
]
|
12389 |
},
|
12390 |
"FR": {
|
12391 |
-
"score": 0.
|
12392 |
"languages": [
|
12393 |
{
|
12394 |
"name": "English",
|
@@ -12412,19 +12412,19 @@
|
|
12412 |
"name": "Portuguese",
|
12413 |
"bcp_47": "pt",
|
12414 |
"population": 882027,
|
12415 |
-
"score": 0.
|
12416 |
},
|
12417 |
{
|
12418 |
"name": "German",
|
12419 |
"bcp_47": "de",
|
12420 |
"population": 3392410,
|
12421 |
-
"score": 0.
|
12422 |
},
|
12423 |
{
|
12424 |
"name": "Italian",
|
12425 |
"bcp_47": "it",
|
12426 |
"population": 1153419,
|
12427 |
-
"score": 0.
|
12428 |
},
|
12429 |
{
|
12430 |
"name": "Dutch",
|
@@ -12495,7 +12495,7 @@
|
|
12495 |
]
|
12496 |
},
|
12497 |
"GB": {
|
12498 |
-
"score": 0.
|
12499 |
"languages": [
|
12500 |
{
|
12501 |
"name": "English",
|
@@ -12543,43 +12543,43 @@
|
|
12543 |
"name": "Portuguese",
|
12544 |
"bcp_47": "pt",
|
12545 |
"population": 131522,
|
12546 |
-
"score": 0.
|
12547 |
},
|
12548 |
{
|
12549 |
"name": "Punjabi",
|
12550 |
"bcp_47": "pa",
|
12551 |
"population": 2367400,
|
12552 |
-
"score": 0.
|
12553 |
},
|
12554 |
{
|
12555 |
"name": "German",
|
12556 |
"bcp_47": "de",
|
12557 |
"population": 5918499,
|
12558 |
-
"score": 0.
|
12559 |
},
|
12560 |
{
|
12561 |
"name": "Tamil",
|
12562 |
"bcp_47": "ta",
|
12563 |
"population": 2104355,
|
12564 |
-
"score": 0.
|
12565 |
},
|
12566 |
{
|
12567 |
"name": "Turkish",
|
12568 |
"bcp_47": "tr",
|
12569 |
"population": 131522,
|
12570 |
-
"score": 0.
|
12571 |
},
|
12572 |
{
|
12573 |
"name": "Italian",
|
12574 |
"bcp_47": "it",
|
12575 |
"population": 131522,
|
12576 |
-
"score": 0.
|
12577 |
},
|
12578 |
{
|
12579 |
"name": "Gujarati",
|
12580 |
"bcp_47": "gu",
|
12581 |
"population": 1907072,
|
12582 |
-
"score": 0.
|
12583 |
},
|
12584 |
{
|
12585 |
"name": "Polish",
|
@@ -12765,7 +12765,7 @@
|
|
12765 |
]
|
12766 |
},
|
12767 |
"GR": {
|
12768 |
-
"score": 0.
|
12769 |
"languages": [
|
12770 |
{
|
12771 |
"name": "English",
|
@@ -12783,13 +12783,13 @@
|
|
12783 |
"name": "German",
|
12784 |
"bcp_47": "de",
|
12785 |
"population": 530355,
|
12786 |
-
"score": 0.
|
12787 |
},
|
12788 |
{
|
12789 |
"name": "Turkish",
|
12790 |
"bcp_47": "tr",
|
12791 |
"population": 127285,
|
12792 |
-
"score": 0.
|
12793 |
},
|
12794 |
{
|
12795 |
"name": "Greek",
|
@@ -12869,7 +12869,7 @@
|
|
12869 |
]
|
12870 |
},
|
12871 |
"HK": {
|
12872 |
-
"score": 0.
|
12873 |
"languages": [
|
12874 |
{
|
12875 |
"name": "English",
|
@@ -12887,7 +12887,7 @@
|
|
12887 |
"name": "Cantonese",
|
12888 |
"bcp_47": "yue",
|
12889 |
"population": 6524919,
|
12890 |
-
"score": 0.
|
12891 |
}
|
12892 |
]
|
12893 |
},
|
@@ -12920,7 +12920,7 @@
|
|
12920 |
]
|
12921 |
},
|
12922 |
"HR": {
|
12923 |
-
"score": 0.
|
12924 |
"languages": [
|
12925 |
{
|
12926 |
"name": "English",
|
@@ -12932,7 +12932,7 @@
|
|
12932 |
"name": "Italian",
|
12933 |
"bcp_47": "it",
|
12934 |
"population": 67644,
|
12935 |
-
"score": 0.
|
12936 |
},
|
12937 |
{
|
12938 |
"name": "Croatian",
|
@@ -12949,7 +12949,7 @@
|
|
12949 |
]
|
12950 |
},
|
12951 |
"HU": {
|
12952 |
-
"score": 0.
|
12953 |
"languages": [
|
12954 |
{
|
12955 |
"name": "English",
|
@@ -12967,7 +12967,7 @@
|
|
12967 |
"name": "German",
|
12968 |
"bcp_47": "de",
|
12969 |
"population": 1758929,
|
12970 |
-
"score": 0.
|
12971 |
},
|
12972 |
{
|
12973 |
"name": "Romanian",
|
@@ -13025,7 +13025,7 @@
|
|
13025 |
]
|
13026 |
},
|
13027 |
"IL": {
|
13028 |
-
"score": 0.
|
13029 |
"languages": [
|
13030 |
{
|
13031 |
"name": "English",
|
@@ -13043,7 +13043,7 @@
|
|
13043 |
"name": "Russian",
|
13044 |
"bcp_47": "ru",
|
13045 |
"population": 954303,
|
13046 |
-
"score": 0.
|
13047 |
},
|
13048 |
{
|
13049 |
"name": "Malayalam",
|
@@ -13125,7 +13125,7 @@
|
|
13125 |
]
|
13126 |
},
|
13127 |
"IN": {
|
13128 |
-
"score": 0.
|
13129 |
"languages": [
|
13130 |
{
|
13131 |
"name": "English",
|
@@ -13155,13 +13155,13 @@
|
|
13155 |
"name": "Punjabi",
|
13156 |
"bcp_47": "pa",
|
13157 |
"population": 37130520,
|
13158 |
-
"score": 0.
|
13159 |
},
|
13160 |
{
|
13161 |
"name": "Telugu",
|
13162 |
"bcp_47": "te",
|
13163 |
"population": 95478480,
|
13164 |
-
"score": 0.
|
13165 |
},
|
13166 |
{
|
13167 |
"name": "Western Panjabi",
|
@@ -13173,19 +13173,19 @@
|
|
13173 |
"name": "Marathi",
|
13174 |
"bcp_47": "mr",
|
13175 |
"population": 92826300,
|
13176 |
-
"score": 0.
|
13177 |
},
|
13178 |
{
|
13179 |
"name": "Tamil",
|
13180 |
"bcp_47": "ta",
|
13181 |
"population": 78239310,
|
13182 |
-
"score": 0.
|
13183 |
},
|
13184 |
{
|
13185 |
"name": "Gujarati",
|
13186 |
"bcp_47": "gu",
|
13187 |
"population": 59674050,
|
13188 |
-
"score": 0.
|
13189 |
},
|
13190 |
{
|
13191 |
"name": "Kannada",
|
@@ -13603,7 +13603,7 @@
|
|
13603 |
]
|
13604 |
},
|
13605 |
"IQ": {
|
13606 |
-
"score": 0.
|
13607 |
"languages": [
|
13608 |
{
|
13609 |
"name": "English",
|
@@ -13621,7 +13621,7 @@
|
|
13621 |
"name": "Persian",
|
13622 |
"bcp_47": "fa",
|
13623 |
"population": 338192,
|
13624 |
-
"score": 0.
|
13625 |
},
|
13626 |
{
|
13627 |
"name": "Azerbaijani",
|
@@ -13650,7 +13650,7 @@
|
|
13650 |
]
|
13651 |
},
|
13652 |
"IT": {
|
13653 |
-
"score": 0.
|
13654 |
"languages": [
|
13655 |
{
|
13656 |
"name": "English",
|
@@ -13668,13 +13668,13 @@
|
|
13668 |
"name": "German",
|
13669 |
"bcp_47": "de",
|
13670 |
"population": 998443,
|
13671 |
-
"score": 0.
|
13672 |
},
|
13673 |
{
|
13674 |
"name": "Italian",
|
13675 |
"bcp_47": "it",
|
13676 |
"population": 59282565,
|
13677 |
-
"score": 0.
|
13678 |
},
|
13679 |
{
|
13680 |
"name": "Greek",
|
@@ -13820,7 +13820,7 @@
|
|
13820 |
]
|
13821 |
},
|
13822 |
"KE": {
|
13823 |
-
"score": 0.
|
13824 |
"languages": [
|
13825 |
{
|
13826 |
"name": "English",
|
@@ -13838,19 +13838,19 @@
|
|
13838 |
"name": "Punjabi",
|
13839 |
"bcp_47": "pa",
|
13840 |
"population": 10170,
|
13841 |
-
"score": 0.
|
13842 |
},
|
13843 |
{
|
13844 |
"name": "Swahili",
|
13845 |
"bcp_47": "sw",
|
13846 |
"population": 35328414,
|
13847 |
-
"score": 0.
|
13848 |
},
|
13849 |
{
|
13850 |
"name": "Gujarati",
|
13851 |
"bcp_47": "gu",
|
13852 |
"population": 4978,
|
13853 |
-
"score": 0.
|
13854 |
},
|
13855 |
{
|
13856 |
"name": "Oromo",
|
@@ -13984,7 +13984,7 @@
|
|
13984 |
]
|
13985 |
},
|
13986 |
"KZ": {
|
13987 |
-
"score": 0.
|
13988 |
"languages": [
|
13989 |
{
|
13990 |
"name": "English",
|
@@ -13996,13 +13996,13 @@
|
|
13996 |
"name": "Russian",
|
13997 |
"bcp_47": "ru",
|
13998 |
"population": 13746168,
|
13999 |
-
"score": 0.
|
14000 |
},
|
14001 |
{
|
14002 |
"name": "German",
|
14003 |
"bcp_47": "de",
|
14004 |
"population": 1221882,
|
14005 |
-
"score": 0.
|
14006 |
},
|
14007 |
{
|
14008 |
"name": "Kazakh",
|
@@ -14071,7 +14071,7 @@
|
|
14071 |
]
|
14072 |
},
|
14073 |
"LK": {
|
14074 |
-
"score": 0.
|
14075 |
"languages": [
|
14076 |
{
|
14077 |
"name": "English",
|
@@ -14083,7 +14083,7 @@
|
|
14083 |
"name": "Tamil",
|
14084 |
"bcp_47": "ta",
|
14085 |
"population": 3433380,
|
14086 |
-
"score": 0.
|
14087 |
},
|
14088 |
{
|
14089 |
"name": "Sinhala",
|
@@ -14164,7 +14164,7 @@
|
|
14164 |
]
|
14165 |
},
|
14166 |
"LT": {
|
14167 |
-
"score": 0.
|
14168 |
"languages": [
|
14169 |
{
|
14170 |
"name": "English",
|
@@ -14176,13 +14176,13 @@
|
|
14176 |
"name": "Russian",
|
14177 |
"bcp_47": "ru",
|
14178 |
"population": 2185168,
|
14179 |
-
"score": 0.
|
14180 |
},
|
14181 |
{
|
14182 |
"name": "German",
|
14183 |
"bcp_47": "de",
|
14184 |
"population": 382404,
|
14185 |
-
"score": 0.
|
14186 |
},
|
14187 |
{
|
14188 |
"name": "Lithuanian",
|
@@ -14199,7 +14199,7 @@
|
|
14199 |
]
|
14200 |
},
|
14201 |
"LU": {
|
14202 |
-
"score": 0.
|
14203 |
"languages": [
|
14204 |
{
|
14205 |
"name": "English",
|
@@ -14217,13 +14217,13 @@
|
|
14217 |
"name": "Portuguese",
|
14218 |
"bcp_47": "pt",
|
14219 |
"population": 100541,
|
14220 |
-
"score": 0.
|
14221 |
},
|
14222 |
{
|
14223 |
"name": "German",
|
14224 |
"bcp_47": "de",
|
14225 |
"population": 395880,
|
14226 |
-
"score": 0.
|
14227 |
},
|
14228 |
{
|
14229 |
"name": "Luxembourgish",
|
@@ -14234,7 +14234,7 @@
|
|
14234 |
]
|
14235 |
},
|
14236 |
"LV": {
|
14237 |
-
"score": 0.
|
14238 |
"languages": [
|
14239 |
{
|
14240 |
"name": "English",
|
@@ -14246,7 +14246,7 @@
|
|
14246 |
"name": "Russian",
|
14247 |
"bcp_47": "ru",
|
14248 |
"population": 714867,
|
14249 |
-
"score": 0.
|
14250 |
},
|
14251 |
{
|
14252 |
"name": "Latvian",
|
@@ -14362,7 +14362,7 @@
|
|
14362 |
]
|
14363 |
},
|
14364 |
"MO": {
|
14365 |
-
"score": 0.
|
14366 |
"languages": [
|
14367 |
{
|
14368 |
"name": "English",
|
@@ -14380,7 +14380,7 @@
|
|
14380 |
"name": "Portuguese",
|
14381 |
"bcp_47": "pt",
|
14382 |
"population": 30723,
|
14383 |
-
"score": 0.
|
14384 |
}
|
14385 |
]
|
14386 |
},
|
@@ -14413,7 +14413,7 @@
|
|
14413 |
]
|
14414 |
},
|
14415 |
"MT": {
|
14416 |
-
"score": 0.
|
14417 |
"languages": [
|
14418 |
{
|
14419 |
"name": "English",
|
@@ -14431,7 +14431,7 @@
|
|
14431 |
"name": "Italian",
|
14432 |
"bcp_47": "it",
|
14433 |
"population": 256070,
|
14434 |
-
"score": 0.
|
14435 |
},
|
14436 |
{
|
14437 |
"name": "Maltese",
|
@@ -14442,7 +14442,7 @@
|
|
14442 |
]
|
14443 |
},
|
14444 |
"MU": {
|
14445 |
-
"score": 0.
|
14446 |
"languages": [
|
14447 |
{
|
14448 |
"name": "English",
|
@@ -14466,7 +14466,7 @@
|
|
14466 |
"name": "Tamil",
|
14467 |
"bcp_47": "ta",
|
14468 |
"population": 34484,
|
14469 |
-
"score": 0.
|
14470 |
},
|
14471 |
{
|
14472 |
"name": "Bhojpuri",
|
@@ -14594,7 +14594,7 @@
|
|
14594 |
]
|
14595 |
},
|
14596 |
"MY": {
|
14597 |
-
"score": 0.
|
14598 |
"languages": [
|
14599 |
{
|
14600 |
"name": "English",
|
@@ -14612,13 +14612,13 @@
|
|
14612 |
"name": "Javanese",
|
14613 |
"bcp_47": "jv",
|
14614 |
"population": 391825,
|
14615 |
-
"score": 0.
|
14616 |
},
|
14617 |
{
|
14618 |
"name": "Tamil",
|
14619 |
"bcp_47": "ta",
|
14620 |
"population": 1371388,
|
14621 |
-
"score": 0.
|
14622 |
},
|
14623 |
{
|
14624 |
"name": "Malayalam",
|
@@ -14665,7 +14665,7 @@
|
|
14665 |
]
|
14666 |
},
|
14667 |
"NA": {
|
14668 |
-
"score": 0.
|
14669 |
"languages": [
|
14670 |
{
|
14671 |
"name": "English",
|
@@ -14677,7 +14677,7 @@
|
|
14677 |
"name": "German",
|
14678 |
"bcp_47": "de",
|
14679 |
"population": 23671,
|
14680 |
-
"score": 0.
|
14681 |
},
|
14682 |
{
|
14683 |
"name": "Afrikaans",
|
@@ -14836,7 +14836,7 @@
|
|
14836 |
]
|
14837 |
},
|
14838 |
"NL": {
|
14839 |
-
"score": 0.
|
14840 |
"languages": [
|
14841 |
{
|
14842 |
"name": "English",
|
@@ -14854,19 +14854,19 @@
|
|
14854 |
"name": "Indonesian",
|
14855 |
"bcp_47": "id",
|
14856 |
"population": 311047,
|
14857 |
-
"score": 0.
|
14858 |
},
|
14859 |
{
|
14860 |
"name": "German",
|
14861 |
"bcp_47": "de",
|
14862 |
"population": 12269084,
|
14863 |
-
"score": 0.
|
14864 |
},
|
14865 |
{
|
14866 |
"name": "Turkish",
|
14867 |
"bcp_47": "tr",
|
14868 |
"population": 207365,
|
14869 |
-
"score": 0.
|
14870 |
},
|
14871 |
{
|
14872 |
"name": "Dutch",
|
@@ -15183,7 +15183,7 @@
|
|
15183 |
]
|
15184 |
},
|
15185 |
"PH": {
|
15186 |
-
"score": 0.
|
15187 |
"languages": [
|
15188 |
{
|
15189 |
"name": "English",
|
@@ -15207,7 +15207,7 @@
|
|
15207 |
"name": "Filipino",
|
15208 |
"bcp_47": "fil",
|
15209 |
"population": 65508600,
|
15210 |
-
"score": 0.
|
15211 |
},
|
15212 |
{
|
15213 |
"name": "Cebuano",
|
@@ -15308,7 +15308,7 @@
|
|
15308 |
]
|
15309 |
},
|
15310 |
"PK": {
|
15311 |
-
"score": 0.
|
15312 |
"languages": [
|
15313 |
{
|
15314 |
"name": "English",
|
@@ -15326,7 +15326,7 @@
|
|
15326 |
"name": "Punjabi",
|
15327 |
"bcp_47": "pa",
|
15328 |
"population": 163450700,
|
15329 |
-
"score": 0.
|
15330 |
},
|
15331 |
{
|
15332 |
"name": "Western Panjabi",
|
@@ -15338,7 +15338,7 @@
|
|
15338 |
"name": "Persian",
|
15339 |
"bcp_47": "fa",
|
15340 |
"population": 1541107,
|
15341 |
-
"score": 0.
|
15342 |
},
|
15343 |
{
|
15344 |
"name": "Pashto",
|
@@ -15457,7 +15457,7 @@
|
|
15457 |
]
|
15458 |
},
|
15459 |
"PL": {
|
15460 |
-
"score": 0.
|
15461 |
"languages": [
|
15462 |
{
|
15463 |
"name": "English",
|
@@ -15469,13 +15469,13 @@
|
|
15469 |
"name": "Russian",
|
15470 |
"bcp_47": "ru",
|
15471 |
"population": 6890814,
|
15472 |
-
"score": 0.
|
15473 |
},
|
15474 |
{
|
15475 |
"name": "German",
|
15476 |
"bcp_47": "de",
|
15477 |
"population": 7273637,
|
15478 |
-
"score": 0.
|
15479 |
},
|
15480 |
{
|
15481 |
"name": "Polish",
|
@@ -15573,7 +15573,7 @@
|
|
15573 |
]
|
15574 |
},
|
15575 |
"PT": {
|
15576 |
-
"score": 0.
|
15577 |
"languages": [
|
15578 |
{
|
15579 |
"name": "English",
|
@@ -15597,7 +15597,7 @@
|
|
15597 |
"name": "Portuguese",
|
15598 |
"bcp_47": "pt",
|
15599 |
"population": 9890592,
|
15600 |
-
"score": 0.
|
15601 |
},
|
15602 |
{
|
15603 |
"name": "Galician",
|
@@ -15625,7 +15625,7 @@
|
|
15625 |
]
|
15626 |
},
|
15627 |
"RO": {
|
15628 |
-
"score": 0.
|
15629 |
"languages": [
|
15630 |
{
|
15631 |
"name": "English",
|
@@ -15649,13 +15649,13 @@
|
|
15649 |
"name": "German",
|
15650 |
"bcp_47": "de",
|
15651 |
"population": 44736,
|
15652 |
-
"score": 0.
|
15653 |
},
|
15654 |
{
|
15655 |
"name": "Turkish",
|
15656 |
"bcp_47": "tr",
|
15657 |
"population": 27694,
|
15658 |
-
"score": 0.
|
15659 |
},
|
15660 |
{
|
15661 |
"name": "Polish",
|
@@ -15883,7 +15883,7 @@
|
|
15883 |
]
|
15884 |
},
|
15885 |
"SG": {
|
15886 |
-
"score": 0.
|
15887 |
"languages": [
|
15888 |
{
|
15889 |
"name": "English",
|
@@ -15901,13 +15901,13 @@
|
|
15901 |
"name": "Punjabi",
|
15902 |
"bcp_47": "pa",
|
15903 |
"population": 9314,
|
15904 |
-
"score": 0.
|
15905 |
},
|
15906 |
{
|
15907 |
"name": "Tamil",
|
15908 |
"bcp_47": "ta",
|
15909 |
"population": 130403,
|
15910 |
-
"score": 0.
|
15911 |
},
|
15912 |
{
|
15913 |
"name": "Malayalam",
|
@@ -15935,7 +15935,7 @@
|
|
15935 |
]
|
15936 |
},
|
15937 |
"SI": {
|
15938 |
-
"score": 0.
|
15939 |
"languages": [
|
15940 |
{
|
15941 |
"name": "English",
|
@@ -15947,13 +15947,13 @@
|
|
15947 |
"name": "German",
|
15948 |
"bcp_47": "de",
|
15949 |
"population": 883126,
|
15950 |
-
"score": 0.
|
15951 |
},
|
15952 |
{
|
15953 |
"name": "Italian",
|
15954 |
"bcp_47": "it",
|
15955 |
"population": 3995,
|
15956 |
-
"score": 0.
|
15957 |
},
|
15958 |
{
|
15959 |
"name": "Hungarian",
|
@@ -15982,7 +15982,7 @@
|
|
15982 |
]
|
15983 |
},
|
15984 |
"SK": {
|
15985 |
-
"score": 0.
|
15986 |
"languages": [
|
15987 |
{
|
15988 |
"name": "English",
|
@@ -15994,7 +15994,7 @@
|
|
15994 |
"name": "German",
|
15995 |
"bcp_47": "de",
|
15996 |
"population": 1196932,
|
15997 |
-
"score": 0.
|
15998 |
},
|
15999 |
{
|
16000 |
"name": "Polish",
|
@@ -16290,7 +16290,7 @@
|
|
16290 |
]
|
16291 |
},
|
16292 |
"TR": {
|
16293 |
-
"score": 0.
|
16294 |
"languages": [
|
16295 |
{
|
16296 |
"name": "English",
|
@@ -16308,7 +16308,7 @@
|
|
16308 |
"name": "Turkish",
|
16309 |
"bcp_47": "tr",
|
16310 |
"population": 76276275,
|
16311 |
-
"score": 0.
|
16312 |
},
|
16313 |
{
|
16314 |
"name": "North Levantine Arabic",
|
@@ -16467,7 +16467,7 @@
|
|
16467 |
]
|
16468 |
},
|
16469 |
"TZ": {
|
16470 |
-
"score": 0.
|
16471 |
"languages": [
|
16472 |
{
|
16473 |
"name": "English",
|
@@ -16479,7 +16479,7 @@
|
|
16479 |
"name": "Swahili",
|
16480 |
"bcp_47": "sw",
|
16481 |
"population": 52697520,
|
16482 |
-
"score": 0.
|
16483 |
},
|
16484 |
{
|
16485 |
"name": "Sukuma",
|
@@ -16568,7 +16568,7 @@
|
|
16568 |
]
|
16569 |
},
|
16570 |
"UG": {
|
16571 |
-
"score": 0.
|
16572 |
"languages": [
|
16573 |
{
|
16574 |
"name": "English",
|
@@ -16586,7 +16586,7 @@
|
|
16586 |
"name": "Swahili",
|
16587 |
"bcp_47": "sw",
|
16588 |
"population": 32439750,
|
16589 |
-
"score": 0.
|
16590 |
},
|
16591 |
{
|
16592 |
"name": "Kinyarwanda",
|
@@ -16662,7 +16662,7 @@
|
|
16662 |
]
|
16663 |
},
|
16664 |
"US": {
|
16665 |
-
"score": 0.
|
16666 |
"languages": [
|
16667 |
{
|
16668 |
"name": "English",
|
@@ -16692,37 +16692,37 @@
|
|
16692 |
"name": "Russian",
|
16693 |
"bcp_47": "ru",
|
16694 |
"population": 798334,
|
16695 |
-
"score": 0.
|
16696 |
},
|
16697 |
{
|
16698 |
"name": "German",
|
16699 |
"bcp_47": "de",
|
16700 |
"population": 1563403,
|
16701 |
-
"score": 0.
|
16702 |
},
|
16703 |
{
|
16704 |
"name": "Vietnamese",
|
16705 |
"bcp_47": "vi",
|
16706 |
"population": 1130973,
|
16707 |
-
"score": 0.
|
16708 |
},
|
16709 |
{
|
16710 |
"name": "Korean",
|
16711 |
"bcp_47": "ko",
|
16712 |
"population": 997917,
|
16713 |
-
"score": 0.
|
16714 |
},
|
16715 |
{
|
16716 |
"name": "Italian",
|
16717 |
"bcp_47": "it",
|
16718 |
"population": 1130973,
|
16719 |
-
"score": 0.
|
16720 |
},
|
16721 |
{
|
16722 |
"name": "Filipino",
|
16723 |
"bcp_47": "fil",
|
16724 |
"population": 1397084,
|
16725 |
-
"score": 0.
|
16726 |
},
|
16727 |
{
|
16728 |
"name": "Yiddish",
|
@@ -16925,7 +16925,7 @@
|
|
16925 |
]
|
16926 |
},
|
16927 |
"ZA": {
|
16928 |
-
"score": 0.
|
16929 |
"languages": [
|
16930 |
{
|
16931 |
"name": "English",
|
@@ -16943,7 +16943,7 @@
|
|
16943 |
"name": "Swahili",
|
16944 |
"bcp_47": "sw",
|
16945 |
"population": 1016,
|
16946 |
-
"score": 0.
|
16947 |
},
|
16948 |
{
|
16949 |
"name": "Zulu",
|
@@ -17125,7 +17125,7 @@
|
|
17125 |
]
|
17126 |
},
|
17127 |
"ID": {
|
17128 |
-
"score": 0.
|
17129 |
"languages": [
|
17130 |
{
|
17131 |
"name": "Chinese",
|
@@ -17137,13 +17137,13 @@
|
|
17137 |
"name": "Indonesian",
|
17138 |
"bcp_47": "id",
|
17139 |
"population": 170896640,
|
17140 |
-
"score": 0.
|
17141 |
},
|
17142 |
{
|
17143 |
"name": "Javanese",
|
17144 |
"bcp_47": "jv",
|
17145 |
"population": 90788840,
|
17146 |
-
"score": 0.
|
17147 |
},
|
17148 |
{
|
17149 |
"name": "Malay",
|
@@ -17304,7 +17304,7 @@
|
|
17304 |
]
|
17305 |
},
|
17306 |
"MN": {
|
17307 |
-
"score": 0.
|
17308 |
"languages": [
|
17309 |
{
|
17310 |
"name": "Chinese",
|
@@ -17316,7 +17316,7 @@
|
|
17316 |
"name": "Russian",
|
17317 |
"bcp_47": "ru",
|
17318 |
"population": 4118,
|
17319 |
-
"score": 0.
|
17320 |
},
|
17321 |
{
|
17322 |
"name": "Kazakh",
|
@@ -17408,7 +17408,7 @@
|
|
17408 |
]
|
17409 |
},
|
17410 |
"VN": {
|
17411 |
-
"score": 0.
|
17412 |
"languages": [
|
17413 |
{
|
17414 |
"name": "Chinese",
|
@@ -17420,7 +17420,7 @@
|
|
17420 |
"name": "Vietnamese",
|
17421 |
"bcp_47": "vi",
|
17422 |
"population": 84900318,
|
17423 |
-
"score": 0.
|
17424 |
},
|
17425 |
{
|
17426 |
"name": "Hmong Njua",
|
@@ -17603,7 +17603,7 @@
|
|
17603 |
]
|
17604 |
},
|
17605 |
"GQ": {
|
17606 |
-
"score": 0.
|
17607 |
"languages": [
|
17608 |
{
|
17609 |
"name": "Spanish",
|
@@ -17621,7 +17621,7 @@
|
|
17621 |
"name": "Portuguese",
|
17622 |
"bcp_47": "pt",
|
17623 |
"population": 1,
|
17624 |
-
"score": 0.
|
17625 |
},
|
17626 |
{
|
17627 |
"name": "Fang",
|
@@ -17700,7 +17700,7 @@
|
|
17700 |
]
|
17701 |
},
|
17702 |
"PY": {
|
17703 |
-
"score": 0.
|
17704 |
"languages": [
|
17705 |
{
|
17706 |
"name": "Spanish",
|
@@ -17712,7 +17712,7 @@
|
|
17712 |
"name": "German",
|
17713 |
"bcp_47": "de",
|
17714 |
"population": 208559,
|
17715 |
-
"score": 0.
|
17716 |
},
|
17717 |
{
|
17718 |
"name": "Guarani",
|
@@ -17819,7 +17819,7 @@
|
|
17819 |
]
|
17820 |
},
|
17821 |
"IR": {
|
17822 |
-
"score": 0.
|
17823 |
"languages": [
|
17824 |
{
|
17825 |
"name": "Arabic",
|
@@ -17831,7 +17831,7 @@
|
|
17831 |
"name": "Persian",
|
17832 |
"bcp_47": "fa",
|
17833 |
"population": 63692475,
|
17834 |
-
"score": 0.
|
17835 |
},
|
17836 |
{
|
17837 |
"name": "Pashto",
|
@@ -18166,7 +18166,7 @@
|
|
18166 |
]
|
18167 |
},
|
18168 |
"OM": {
|
18169 |
-
"score": 0.
|
18170 |
"languages": [
|
18171 |
{
|
18172 |
"name": "Arabic",
|
@@ -18178,7 +18178,7 @@
|
|
18178 |
"name": "Persian",
|
18179 |
"bcp_47": "fa",
|
18180 |
"population": 43849,
|
18181 |
-
"score": 0.
|
18182 |
},
|
18183 |
{
|
18184 |
"name": "Baluchi",
|
@@ -18206,7 +18206,7 @@
|
|
18206 |
]
|
18207 |
},
|
18208 |
"QA": {
|
18209 |
-
"score": 0.
|
18210 |
"languages": [
|
18211 |
{
|
18212 |
"name": "Arabic",
|
@@ -18218,7 +18218,7 @@
|
|
18218 |
"name": "Persian",
|
18219 |
"bcp_47": "fa",
|
18220 |
"population": 268859,
|
18221 |
-
"score": 0.
|
18222 |
},
|
18223 |
{
|
18224 |
"name": "Malayalam",
|
@@ -18246,7 +18246,7 @@
|
|
18246 |
]
|
18247 |
},
|
18248 |
"SO": {
|
18249 |
-
"score": 0.
|
18250 |
"languages": [
|
18251 |
{
|
18252 |
"name": "Arabic",
|
@@ -18258,7 +18258,7 @@
|
|
18258 |
"name": "Swahili",
|
18259 |
"bcp_47": "sw",
|
18260 |
"population": 235142,
|
18261 |
-
"score": 0.
|
18262 |
},
|
18263 |
{
|
18264 |
"name": "Oromo",
|
@@ -18333,7 +18333,7 @@
|
|
18333 |
]
|
18334 |
},
|
18335 |
"TJ": {
|
18336 |
-
"score":
|
18337 |
"languages": [
|
18338 |
{
|
18339 |
"name": "Arabic",
|
@@ -18345,13 +18345,13 @@
|
|
18345 |
"name": "Russian",
|
18346 |
"bcp_47": "ru",
|
18347 |
"population": 1064840,
|
18348 |
-
"score": 0.
|
18349 |
},
|
18350 |
{
|
18351 |
"name": "Persian",
|
18352 |
"bcp_47": "fa",
|
18353 |
"population": 69215,
|
18354 |
-
"score": 0.
|
18355 |
},
|
18356 |
{
|
18357 |
"name": "Tajik",
|
@@ -18454,7 +18454,7 @@
|
|
18454 |
]
|
18455 |
},
|
18456 |
"CD": {
|
18457 |
-
"score": 0.
|
18458 |
"languages": [
|
18459 |
{
|
18460 |
"name": "French",
|
@@ -18466,7 +18466,7 @@
|
|
18466 |
"name": "Swahili",
|
18467 |
"bcp_47": "sw",
|
18468 |
"population": 50890000,
|
18469 |
-
"score": 0.
|
18470 |
},
|
18471 |
{
|
18472 |
"name": "Kinyarwanda",
|
@@ -18718,7 +18718,7 @@
|
|
18718 |
]
|
18719 |
},
|
18720 |
"RE": {
|
18721 |
-
"score": 0.
|
18722 |
"languages": [
|
18723 |
{
|
18724 |
"name": "French",
|
@@ -18730,7 +18730,7 @@
|
|
18730 |
"name": "Tamil",
|
18731 |
"bcp_47": "ta",
|
18732 |
"population": 118138,
|
18733 |
-
"score": 0.
|
18734 |
},
|
18735 |
{
|
18736 |
"name": "Réunion Creole French",
|
@@ -18887,7 +18887,7 @@
|
|
18887 |
]
|
18888 |
},
|
18889 |
"YT": {
|
18890 |
-
"score": 0.
|
18891 |
"languages": [
|
18892 |
{
|
18893 |
"name": "French",
|
@@ -18899,7 +18899,7 @@
|
|
18899 |
"name": "Swahili",
|
18900 |
"bcp_47": "sw",
|
18901 |
"population": 2716,
|
18902 |
-
"score": 0.
|
18903 |
},
|
18904 |
{
|
18905 |
"name": "Comorian",
|
@@ -18916,13 +18916,13 @@
|
|
18916 |
]
|
18917 |
},
|
18918 |
"AO": {
|
18919 |
-
"score": 0.
|
18920 |
"languages": [
|
18921 |
{
|
18922 |
"name": "Portuguese",
|
18923 |
"bcp_47": "pt",
|
18924 |
"population": 21789941,
|
18925 |
-
"score": 0.
|
18926 |
},
|
18927 |
{
|
18928 |
"name": "Umbundu",
|
@@ -18945,13 +18945,13 @@
|
|
18945 |
]
|
18946 |
},
|
18947 |
"CV": {
|
18948 |
-
"score": 0.
|
18949 |
"languages": [
|
18950 |
{
|
18951 |
"name": "Portuguese",
|
18952 |
"bcp_47": "pt",
|
18953 |
"population": 443274,
|
18954 |
-
"score": 0.
|
18955 |
},
|
18956 |
{
|
18957 |
"name": "Kabuverdianu",
|
@@ -18962,13 +18962,13 @@
|
|
18962 |
]
|
18963 |
},
|
18964 |
"GW": {
|
18965 |
-
"score": 0.
|
18966 |
"languages": [
|
18967 |
{
|
18968 |
"name": "Portuguese",
|
18969 |
"bcp_47": "pt",
|
18970 |
"population": 1927100,
|
18971 |
-
"score": 0.
|
18972 |
},
|
18973 |
{
|
18974 |
"name": "Fula",
|
@@ -18985,19 +18985,19 @@
|
|
18985 |
]
|
18986 |
},
|
18987 |
"MZ": {
|
18988 |
-
"score": 0.
|
18989 |
"languages": [
|
18990 |
{
|
18991 |
"name": "Portuguese",
|
18992 |
"bcp_47": "pt",
|
18993 |
"population": 8126514,
|
18994 |
-
"score": 0.
|
18995 |
},
|
18996 |
{
|
18997 |
"name": "Swahili",
|
18998 |
"bcp_47": "sw",
|
18999 |
"population": 9330,
|
19000 |
-
"score": 0.
|
19001 |
},
|
19002 |
{
|
19003 |
"name": "Nyanja",
|
@@ -19062,24 +19062,24 @@
|
|
19062 |
]
|
19063 |
},
|
19064 |
"ST": {
|
19065 |
-
"score": 0.
|
19066 |
"languages": [
|
19067 |
{
|
19068 |
"name": "Portuguese",
|
19069 |
"bcp_47": "pt",
|
19070 |
"population": 179454,
|
19071 |
-
"score": 0.
|
19072 |
}
|
19073 |
]
|
19074 |
},
|
19075 |
"TL": {
|
19076 |
-
"score": 0.
|
19077 |
"languages": [
|
19078 |
{
|
19079 |
"name": "Portuguese",
|
19080 |
"bcp_47": "pt",
|
19081 |
"population": 816395,
|
19082 |
-
"score": 0.
|
19083 |
},
|
19084 |
{
|
19085 |
"name": "Tetum",
|
@@ -19090,13 +19090,13 @@
|
|
19090 |
]
|
19091 |
},
|
19092 |
"BY": {
|
19093 |
-
"score": 0.
|
19094 |
"languages": [
|
19095 |
{
|
19096 |
"name": "Russian",
|
19097 |
"bcp_47": "ru",
|
19098 |
"population": 1137350,
|
19099 |
-
"score": 0.
|
19100 |
},
|
19101 |
{
|
19102 |
"name": "Belarusian",
|
@@ -19107,13 +19107,13 @@
|
|
19107 |
]
|
19108 |
},
|
19109 |
"GE": {
|
19110 |
-
"score": 0.
|
19111 |
"languages": [
|
19112 |
{
|
19113 |
"name": "Russian",
|
19114 |
"bcp_47": "ru",
|
19115 |
"population": 359730,
|
19116 |
-
"score": 0.
|
19117 |
},
|
19118 |
{
|
19119 |
"name": "Kurdish",
|
@@ -19154,13 +19154,13 @@
|
|
19154 |
]
|
19155 |
},
|
19156 |
"KG": {
|
19157 |
-
"score": 0.
|
19158 |
"languages": [
|
19159 |
{
|
19160 |
"name": "Russian",
|
19161 |
"bcp_47": "ru",
|
19162 |
"population": 2147364,
|
19163 |
-
"score": 0.
|
19164 |
},
|
19165 |
{
|
19166 |
"name": "Kyrgyz",
|
@@ -19171,13 +19171,13 @@
|
|
19171 |
]
|
19172 |
},
|
19173 |
"MD": {
|
19174 |
-
"score": 0.
|
19175 |
"languages": [
|
19176 |
{
|
19177 |
"name": "Russian",
|
19178 |
"bcp_47": "ru",
|
19179 |
"population": 100935,
|
19180 |
-
"score": 0.
|
19181 |
},
|
19182 |
{
|
19183 |
"name": "Ukrainian",
|
@@ -19206,13 +19206,13 @@
|
|
19206 |
]
|
19207 |
},
|
19208 |
"RU": {
|
19209 |
-
"score": 0.
|
19210 |
"languages": [
|
19211 |
{
|
19212 |
"name": "Russian",
|
19213 |
"bcp_47": "ru",
|
19214 |
"population": 133218680,
|
19215 |
-
"score": 0.
|
19216 |
},
|
19217 |
{
|
19218 |
"name": "Azerbaijani",
|
@@ -19427,13 +19427,13 @@
|
|
19427 |
]
|
19428 |
},
|
19429 |
"SJ": {
|
19430 |
-
"score": 0.
|
19431 |
"languages": [
|
19432 |
{
|
19433 |
"name": "Russian",
|
19434 |
"bcp_47": "ru",
|
19435 |
"population": 1200,
|
19436 |
-
"score": 0.
|
19437 |
},
|
19438 |
{
|
19439 |
"name": "Norwegian Bokmål",
|
@@ -19444,13 +19444,13 @@
|
|
19444 |
]
|
19445 |
},
|
19446 |
"TM": {
|
19447 |
-
"score": 0.
|
19448 |
"languages": [
|
19449 |
{
|
19450 |
"name": "Russian",
|
19451 |
"bcp_47": "ru",
|
19452 |
"population": 663436,
|
19453 |
-
"score": 0.
|
19454 |
},
|
19455 |
{
|
19456 |
"name": "Uzbek",
|
@@ -19473,19 +19473,19 @@
|
|
19473 |
]
|
19474 |
},
|
19475 |
"UA": {
|
19476 |
-
"score": 0.
|
19477 |
"languages": [
|
19478 |
{
|
19479 |
"name": "Russian",
|
19480 |
"bcp_47": "ru",
|
19481 |
"population": 20204534,
|
19482 |
-
"score": 0.
|
19483 |
},
|
19484 |
{
|
19485 |
"name": "Turkish",
|
19486 |
"bcp_47": "tr",
|
19487 |
"population": 184476,
|
19488 |
-
"score": 0.
|
19489 |
},
|
19490 |
{
|
19491 |
"name": "Polish",
|
@@ -19550,19 +19550,19 @@
|
|
19550 |
]
|
19551 |
},
|
19552 |
"UZ": {
|
19553 |
-
"score": 0.
|
19554 |
"languages": [
|
19555 |
{
|
19556 |
"name": "Russian",
|
19557 |
"bcp_47": "ru",
|
19558 |
"population": 4279156,
|
19559 |
-
"score": 0.
|
19560 |
},
|
19561 |
{
|
19562 |
"name": "Turkish",
|
19563 |
"bcp_47": "tr",
|
19564 |
"population": 232297,
|
19565 |
-
"score": 0.
|
19566 |
},
|
19567 |
{
|
19568 |
"name": "Uzbek",
|
@@ -19579,13 +19579,13 @@
|
|
19579 |
]
|
19580 |
},
|
19581 |
"LI": {
|
19582 |
-
"score": 0.
|
19583 |
"languages": [
|
19584 |
{
|
19585 |
"name": "German",
|
19586 |
"bcp_47": "de",
|
19587 |
"population": 39137,
|
19588 |
-
"score": 0.
|
19589 |
},
|
19590 |
{
|
19591 |
"name": "Swiss German",
|
@@ -19602,19 +19602,19 @@
|
|
19602 |
]
|
19603 |
},
|
19604 |
"JP": {
|
19605 |
-
"score": 0.
|
19606 |
"languages": [
|
19607 |
{
|
19608 |
"name": "Japanese",
|
19609 |
"bcp_47": "ja",
|
19610 |
"population": 119231650,
|
19611 |
-
"score": 0.
|
19612 |
},
|
19613 |
{
|
19614 |
"name": "Korean",
|
19615 |
"bcp_47": "ko",
|
19616 |
"population": 652636,
|
19617 |
-
"score": 0.
|
19618 |
},
|
19619 |
{
|
19620 |
"name": "Central Okinawan",
|
@@ -19625,13 +19625,13 @@
|
|
19625 |
]
|
19626 |
},
|
19627 |
"AF": {
|
19628 |
-
"score": 0.
|
19629 |
"languages": [
|
19630 |
{
|
19631 |
"name": "Persian",
|
19632 |
"bcp_47": "fa",
|
19633 |
"population": 18321900,
|
19634 |
-
"score": 0.
|
19635 |
},
|
19636 |
{
|
19637 |
"name": "Pashto",
|
@@ -19684,13 +19684,13 @@
|
|
19684 |
]
|
19685 |
},
|
19686 |
"MK": {
|
19687 |
-
"score": 0.
|
19688 |
"languages": [
|
19689 |
{
|
19690 |
"name": "Turkish",
|
19691 |
"bcp_47": "tr",
|
19692 |
"population": 74409,
|
19693 |
-
"score": 0.
|
19694 |
},
|
19695 |
{
|
19696 |
"name": "Albanian",
|
@@ -19707,35 +19707,35 @@
|
|
19707 |
]
|
19708 |
},
|
19709 |
"KP": {
|
19710 |
-
"score": 0.
|
19711 |
"languages": [
|
19712 |
{
|
19713 |
"name": "Korean",
|
19714 |
"bcp_47": "ko",
|
19715 |
"population": 22566280,
|
19716 |
-
"score": 0.
|
19717 |
}
|
19718 |
]
|
19719 |
},
|
19720 |
"KR": {
|
19721 |
-
"score": 0.
|
19722 |
"languages": [
|
19723 |
{
|
19724 |
"name": "Korean",
|
19725 |
"bcp_47": "ko",
|
19726 |
"population": 51835100,
|
19727 |
-
"score": 0.
|
19728 |
}
|
19729 |
]
|
19730 |
},
|
19731 |
"SM": {
|
19732 |
-
"score": 0.
|
19733 |
"languages": [
|
19734 |
{
|
19735 |
"name": "Italian",
|
19736 |
"bcp_47": "it",
|
19737 |
"population": 30466,
|
19738 |
-
"score": 0.
|
19739 |
},
|
19740 |
{
|
19741 |
"name": "Esperanto",
|
@@ -19746,13 +19746,13 @@
|
|
19746 |
]
|
19747 |
},
|
19748 |
"VA": {
|
19749 |
-
"score": 0.
|
19750 |
"languages": [
|
19751 |
{
|
19752 |
"name": "Italian",
|
19753 |
"bcp_47": "it",
|
19754 |
"population": 820,
|
19755 |
-
"score": 0.
|
19756 |
},
|
19757 |
{
|
19758 |
"name": "Latin",
|
|
|
26 |
"license": null,
|
27 |
"average": 0.66,
|
28 |
"classification_accuracy": 0.73,
|
29 |
+
"language_modeling_chrf": 0.96,
|
30 |
"translation_bleu": 0.4,
|
31 |
"translation_chrf": 0.54
|
32 |
},
|
|
|
39 |
"size": 27432406640.0,
|
40 |
"type": "Open",
|
41 |
"license": "Gemma",
|
42 |
+
"average": 0.64,
|
43 |
"classification_accuracy": 0.72,
|
44 |
+
"language_modeling_chrf": 0.94,
|
45 |
"translation_bleu": 0.37,
|
46 |
"translation_chrf": 0.54
|
47 |
},
|
|
|
54 |
"size": 70553706496.0,
|
55 |
"type": "Open",
|
56 |
"license": "Llama3.1",
|
57 |
+
"average": 0.63,
|
58 |
"classification_accuracy": 0.57,
|
59 |
+
"language_modeling_chrf": 0.95,
|
60 |
"translation_bleu": 0.43,
|
61 |
"translation_chrf": 0.57
|
62 |
},
|
63 |
{
|
64 |
"rank": 5,
|
65 |
+
"provider": "Meta Llama",
|
66 |
+
"model": "Llama 3 70b Instruct",
|
67 |
"hf_id": null,
|
68 |
"creation_date": null,
|
69 |
"size": null,
|
70 |
"type": "Commercial",
|
71 |
"license": null,
|
72 |
"average": 0.61,
|
73 |
+
"classification_accuracy": 0.8,
|
74 |
+
"language_modeling_chrf": 0.96,
|
75 |
+
"translation_bleu": 0.25,
|
76 |
+
"translation_chrf": 0.43
|
77 |
},
|
78 |
{
|
79 |
"rank": 6,
|
80 |
+
"provider": "Amazon",
|
81 |
+
"model": "Nova Micro V1",
|
82 |
"hf_id": null,
|
83 |
"creation_date": null,
|
84 |
"size": null,
|
85 |
"type": "Commercial",
|
86 |
"license": null,
|
87 |
+
"average": 0.6,
|
88 |
+
"classification_accuracy": 0.52,
|
89 |
+
"language_modeling_chrf": 0.94,
|
90 |
+
"translation_bleu": 0.4,
|
91 |
+
"translation_chrf": 0.56
|
92 |
},
|
93 |
{
|
94 |
"rank": 7,
|
|
|
101 |
"license": null,
|
102 |
"average": 0.6,
|
103 |
"classification_accuracy": 0.52,
|
104 |
+
"language_modeling_chrf": 0.96,
|
105 |
"translation_bleu": 0.39,
|
106 |
"translation_chrf": 0.55
|
107 |
},
|
|
|
116 |
"license": "Apache 2.0",
|
117 |
"average": 0.58,
|
118 |
"classification_accuracy": 0.55,
|
119 |
+
"language_modeling_chrf": 0.88,
|
120 |
"translation_bleu": 0.38,
|
121 |
"translation_chrf": 0.52
|
122 |
},
|
|
|
129 |
"size": 70553706496.0,
|
130 |
"type": "Open",
|
131 |
"license": "Llama3.3",
|
132 |
+
"average": 0.55,
|
133 |
+
"classification_accuracy": 0.51,
|
134 |
"language_modeling_chrf": 0.94,
|
135 |
+
"translation_bleu": 0.28,
|
136 |
+
"translation_chrf": 0.46
|
137 |
},
|
138 |
{
|
139 |
"rank": 10,
|
|
|
144 |
"size": null,
|
145 |
"type": "Commercial",
|
146 |
"license": null,
|
147 |
+
"average": 0.54,
|
148 |
"classification_accuracy": 0.5,
|
149 |
+
"language_modeling_chrf": 0.86,
|
150 |
"translation_bleu": 0.32,
|
151 |
"translation_chrf": 0.49
|
152 |
},
|
|
|
161 |
"license": "Mit",
|
162 |
"average": 0.52,
|
163 |
"classification_accuracy": 0.42,
|
164 |
+
"language_modeling_chrf": 0.88,
|
165 |
"translation_bleu": 0.32,
|
166 |
"translation_chrf": 0.46
|
167 |
},
|
|
|
176 |
"license": "Apache 2.0",
|
177 |
"average": 0.25,
|
178 |
"classification_accuracy": 0.0,
|
179 |
+
"language_modeling_chrf": 0.47,
|
180 |
"translation_bleu": 0.21,
|
181 |
"translation_chrf": 0.3
|
182 |
}
|
|
|
220 |
"in_benchmark": true,
|
221 |
"NaN": 0.0,
|
222 |
"classification_accuracy": 0.53,
|
223 |
+
"language_modeling_chrf": 0.94,
|
224 |
"translation_bleu": 0.32,
|
225 |
"translation_chrf": 0.49
|
226 |
},
|
|
|
248 |
"in_benchmark": true,
|
249 |
"NaN": 0.0,
|
250 |
"classification_accuracy": 0.43,
|
251 |
+
"language_modeling_chrf": 0.94,
|
252 |
"translation_bleu": 0.28,
|
253 |
"translation_chrf": 0.47
|
254 |
},
|
|
|
262 |
"in_benchmark": true,
|
263 |
"NaN": 0.0,
|
264 |
"classification_accuracy": 0.5,
|
265 |
+
"language_modeling_chrf": 0.92,
|
266 |
"translation_bleu": 0.24,
|
267 |
"translation_chrf": 0.42
|
268 |
},
|
|
|
290 |
"in_benchmark": true,
|
291 |
"NaN": 0.0,
|
292 |
"classification_accuracy": 0.4,
|
293 |
+
"language_modeling_chrf": 0.91,
|
294 |
"translation_bleu": 0.2,
|
295 |
"translation_chrf": 0.41
|
296 |
},
|
|
|
300 |
"autonym": "Português",
|
301 |
"speakers": 237496885,
|
302 |
"family": "Indo-European",
|
303 |
+
"average": 0.45,
|
304 |
"in_benchmark": true,
|
305 |
"NaN": 0.0,
|
306 |
"classification_accuracy": 0.5,
|
307 |
+
"language_modeling_chrf": 0.96,
|
308 |
"translation_bleu": 0.31,
|
309 |
"translation_chrf": 0.49
|
310 |
},
|
|
|
314 |
"autonym": "ਪੰਜਾਬੀ",
|
315 |
"speakers": 203571210,
|
316 |
"family": "Indo-European",
|
317 |
+
"average": 0.43,
|
318 |
"in_benchmark": true,
|
319 |
"NaN": 0.0,
|
320 |
"classification_accuracy": 0.4,
|
321 |
+
"language_modeling_chrf": 0.9,
|
322 |
"translation_bleu": 0.34,
|
323 |
"translation_chrf": 0.49
|
324 |
},
|
|
|
328 |
"autonym": "Русский",
|
329 |
"speakers": 195841151,
|
330 |
"family": "Indo-European",
|
331 |
+
"average": 0.45,
|
332 |
"in_benchmark": true,
|
333 |
"NaN": 0.0,
|
334 |
+
"classification_accuracy": 0.57,
|
335 |
+
"language_modeling_chrf": 0.97,
|
336 |
+
"translation_bleu": 0.26,
|
337 |
+
"translation_chrf": 0.45
|
338 |
},
|
339 |
{
|
340 |
"bcp_47": "sw",
|
|
|
342 |
"autonym": "Kiswahili",
|
343 |
"speakers": 171610296,
|
344 |
"family": "Atlantic-Congo",
|
345 |
+
"average": 0.45,
|
346 |
"in_benchmark": true,
|
347 |
"NaN": 0.0,
|
348 |
+
"classification_accuracy": 0.57,
|
349 |
+
"language_modeling_chrf": 0.94,
|
350 |
+
"translation_bleu": 0.3,
|
351 |
+
"translation_chrf": 0.47
|
352 |
},
|
353 |
{
|
354 |
"bcp_47": "id",
|
|
|
356 |
"autonym": "Bahasa Indonesia",
|
357 |
"speakers": 171207687,
|
358 |
"family": "Austronesian",
|
359 |
+
"average": 0.47,
|
360 |
"in_benchmark": true,
|
361 |
"NaN": 0.0,
|
362 |
+
"classification_accuracy": 0.63,
|
363 |
+
"language_modeling_chrf": 0.96,
|
364 |
+
"translation_bleu": 0.29,
|
365 |
+
"translation_chrf": 0.47
|
366 |
},
|
367 |
{
|
368 |
"bcp_47": "de",
|
|
|
370 |
"autonym": "Deutsch",
|
371 |
"speakers": 136350226,
|
372 |
"family": "Indo-European",
|
373 |
+
"average": 0.49,
|
374 |
"in_benchmark": true,
|
375 |
"NaN": 0.0,
|
376 |
+
"classification_accuracy": 0.67,
|
377 |
+
"language_modeling_chrf": 0.96,
|
378 |
+
"translation_bleu": 0.32,
|
379 |
+
"translation_chrf": 0.5
|
380 |
},
|
381 |
{
|
382 |
"bcp_47": "ja",
|
|
|
384 |
"autonym": "日本語",
|
385 |
"speakers": 119729026,
|
386 |
"family": "Japonic",
|
387 |
+
"average": 0.46,
|
388 |
"in_benchmark": true,
|
389 |
"NaN": 0.0,
|
390 |
+
"classification_accuracy": 0.63,
|
391 |
+
"language_modeling_chrf": 0.94,
|
392 |
+
"translation_bleu": 0.27,
|
393 |
+
"translation_chrf": 0.44
|
394 |
},
|
395 |
{
|
396 |
"bcp_47": "te",
|
|
|
398 |
"autonym": "తెలుగు",
|
399 |
"speakers": 95478480,
|
400 |
"family": "Dravidian",
|
401 |
+
"average": 0.41,
|
402 |
"in_benchmark": true,
|
403 |
"NaN": 0.0,
|
404 |
+
"classification_accuracy": 0.37,
|
405 |
+
"language_modeling_chrf": 0.95,
|
406 |
+
"translation_bleu": 0.28,
|
407 |
+
"translation_chrf": 0.47
|
408 |
},
|
409 |
{
|
410 |
"bcp_47": "lah",
|
|
|
426 |
"autonym": "मराठी",
|
427 |
"speakers": 92826300,
|
428 |
"family": "Indo-European",
|
429 |
+
"average": 0.45,
|
430 |
"in_benchmark": true,
|
431 |
"NaN": 0.0,
|
432 |
+
"classification_accuracy": 0.63,
|
433 |
+
"language_modeling_chrf": 0.94,
|
434 |
+
"translation_bleu": 0.25,
|
435 |
+
"translation_chrf": 0.42
|
436 |
},
|
437 |
{
|
438 |
"bcp_47": "jv",
|
|
|
440 |
"autonym": "Jawa",
|
441 |
"speakers": 91180665,
|
442 |
"family": "Austronesian",
|
443 |
+
"average": 0.41,
|
444 |
"in_benchmark": true,
|
445 |
"NaN": 0.0,
|
446 |
+
"classification_accuracy": 0.47,
|
447 |
+
"language_modeling_chrf": 0.93,
|
448 |
+
"translation_bleu": 0.24,
|
449 |
+
"translation_chrf": 0.42
|
450 |
},
|
451 |
{
|
452 |
"bcp_47": "vi",
|
|
|
454 |
"autonym": "Tiếng Việt",
|
455 |
"speakers": 86222962,
|
456 |
"family": "Austroasiatic",
|
457 |
+
"average": 0.45,
|
458 |
"in_benchmark": true,
|
459 |
"NaN": 0.0,
|
460 |
+
"classification_accuracy": 0.6,
|
461 |
+
"language_modeling_chrf": 0.96,
|
462 |
+
"translation_bleu": 0.26,
|
463 |
+
"translation_chrf": 0.44
|
464 |
},
|
465 |
{
|
466 |
"bcp_47": "ta",
|
|
|
468 |
"autonym": "தமிழ்",
|
469 |
"speakers": 85616159,
|
470 |
"family": "Dravidian",
|
471 |
+
"average": 0.41,
|
472 |
"in_benchmark": true,
|
473 |
"NaN": 0.0,
|
474 |
+
"classification_accuracy": 0.43,
|
475 |
+
"language_modeling_chrf": 0.96,
|
476 |
+
"translation_bleu": 0.25,
|
477 |
+
"translation_chrf": 0.42
|
478 |
},
|
479 |
{
|
480 |
"bcp_47": "fa",
|
|
|
482 |
"autonym": "فارسی",
|
483 |
"speakers": 84710459,
|
484 |
"family": "Indo-European",
|
485 |
+
"average": 0.41,
|
486 |
"in_benchmark": true,
|
487 |
"NaN": 0.0,
|
488 |
+
"classification_accuracy": 0.4,
|
489 |
+
"language_modeling_chrf": 0.94,
|
490 |
+
"translation_bleu": 0.26,
|
491 |
+
"translation_chrf": 0.45
|
492 |
},
|
493 |
{
|
494 |
"bcp_47": "wuu",
|
|
|
510 |
"autonym": "Türkçe",
|
511 |
"speakers": 80360704,
|
512 |
"family": "Turkic",
|
513 |
+
"average": 0.44,
|
514 |
"in_benchmark": true,
|
515 |
"NaN": 0.0,
|
516 |
+
"classification_accuracy": 0.53,
|
517 |
+
"language_modeling_chrf": 0.94,
|
518 |
+
"translation_bleu": 0.28,
|
519 |
+
"translation_chrf": 0.45
|
520 |
},
|
521 |
{
|
522 |
"bcp_47": "yue",
|
|
|
524 |
"autonym": "粵語",
|
525 |
"speakers": 79654759,
|
526 |
"family": "Sino-Tibetan",
|
527 |
+
"average": 0.39,
|
528 |
"in_benchmark": true,
|
529 |
"NaN": 0.0,
|
530 |
+
"classification_accuracy": 0.43,
|
531 |
+
"language_modeling_chrf": 0.9,
|
532 |
+
"translation_bleu": 0.23,
|
533 |
+
"translation_chrf": 0.41
|
534 |
},
|
535 |
{
|
536 |
"bcp_47": "ko",
|
|
|
538 |
"autonym": "한국어",
|
539 |
"speakers": 78357046,
|
540 |
"family": "Koreanic",
|
541 |
+
"average": 0.41,
|
542 |
"in_benchmark": true,
|
543 |
"NaN": 0.0,
|
544 |
+
"classification_accuracy": 0.53,
|
545 |
+
"language_modeling_chrf": 0.94,
|
546 |
+
"translation_bleu": 0.2,
|
547 |
+
"translation_chrf": 0.4
|
548 |
},
|
549 |
{
|
550 |
"bcp_47": "it",
|
|
|
552 |
"autonym": "Italiano",
|
553 |
"speakers": 70247060,
|
554 |
"family": "Indo-European",
|
555 |
+
"average": 0.47,
|
556 |
"in_benchmark": true,
|
557 |
"NaN": 0.0,
|
558 |
+
"classification_accuracy": 0.67,
|
559 |
+
"language_modeling_chrf": 0.94,
|
560 |
+
"translation_bleu": 0.28,
|
561 |
+
"translation_chrf": 0.47
|
562 |
},
|
563 |
{
|
564 |
"bcp_47": "fil",
|
|
|
566 |
"autonym": "Filipino",
|
567 |
"speakers": 67471096,
|
568 |
"family": "Austronesian",
|
569 |
+
"average": 0.42,
|
570 |
"in_benchmark": true,
|
571 |
"NaN": 0.0,
|
572 |
+
"classification_accuracy": 0.43,
|
573 |
+
"language_modeling_chrf": 0.94,
|
574 |
+
"translation_bleu": 0.29,
|
575 |
+
"translation_chrf": 0.45
|
576 |
},
|
577 |
{
|
578 |
"bcp_47": "arz",
|
|
|
580 |
"autonym": "Egyptian Arabic",
|
581 |
"speakers": 66639360,
|
582 |
"family": "Afro-Asiatic",
|
583 |
+
"average": 0.38,
|
584 |
"in_benchmark": true,
|
585 |
"NaN": 0.0,
|
586 |
+
"classification_accuracy": 0.4,
|
587 |
+
"language_modeling_chrf": 0.93,
|
588 |
+
"translation_bleu": 0.2,
|
589 |
+
"translation_chrf": 0.39
|
590 |
},
|
591 |
{
|
592 |
"bcp_47": "gu",
|
|
|
594 |
"autonym": "ગુજરાતી",
|
595 |
"speakers": 61721799,
|
596 |
"family": "Indo-European",
|
597 |
+
"average": 0.42,
|
598 |
"in_benchmark": true,
|
599 |
"NaN": 0.0,
|
600 |
+
"classification_accuracy": 0.43,
|
601 |
+
"language_modeling_chrf": 0.94,
|
602 |
+
"translation_bleu": 0.26,
|
603 |
+
"translation_chrf": 0.44
|
604 |
},
|
605 |
{
|
606 |
"bcp_47": "th",
|
|
|
10164 |
]
|
10165 |
},
|
10166 |
"AE": {
|
10167 |
+
"score": 0.40140041521976655,
|
10168 |
"languages": [
|
10169 |
{
|
10170 |
"name": "English",
|
|
|
10182 |
"name": "Persian",
|
10183 |
"bcp_47": "fa",
|
10184 |
"population": 189850,
|
10185 |
+
"score": 0.41
|
10186 |
},
|
10187 |
{
|
10188 |
"name": "Pashto",
|
|
|
10205 |
]
|
10206 |
},
|
10207 |
"AG": {
|
10208 |
+
"score": 0.4696346724027672,
|
10209 |
"languages": [
|
10210 |
{
|
10211 |
"name": "English",
|
|
|
10217 |
"name": "Portuguese",
|
10218 |
"bcp_47": "pt",
|
10219 |
"population": 1571,
|
10220 |
+
"score": 0.45
|
10221 |
}
|
10222 |
]
|
10223 |
},
|
|
|
10290 |
]
|
10291 |
},
|
10292 |
"AT": {
|
10293 |
+
"score": 0.31771431191158667,
|
10294 |
"languages": [
|
10295 |
{
|
10296 |
"name": "English",
|
|
|
10308 |
"name": "German",
|
10309 |
"bcp_47": "de",
|
10310 |
"population": 8593666,
|
10311 |
+
"score": 0.49
|
10312 |
},
|
10313 |
{
|
10314 |
"name": "Italian",
|
10315 |
"bcp_47": "it",
|
10316 |
"population": 797350,
|
10317 |
+
"score": 0.47
|
10318 |
},
|
10319 |
{
|
10320 |
"name": "Bavarian",
|
|
|
10343 |
]
|
10344 |
},
|
10345 |
"AU": {
|
10346 |
+
"score": 0.46970357171432847,
|
10347 |
"languages": [
|
10348 |
{
|
10349 |
"name": "English",
|
|
|
10361 |
"name": "Italian",
|
10362 |
"bcp_47": "it",
|
10363 |
"population": 483864,
|
10364 |
+
"score": 0.47
|
10365 |
},
|
10366 |
{
|
10367 |
"name": "Hmong Njua",
|
|
|
10506 |
]
|
10507 |
},
|
10508 |
"BE": {
|
10509 |
+
"score": 0.29499472599184506,
|
10510 |
"languages": [
|
10511 |
{
|
10512 |
"name": "English",
|
|
|
10524 |
"name": "German",
|
10525 |
"bcp_47": "de",
|
10526 |
"population": 2578554,
|
10527 |
+
"score": 0.49
|
10528 |
},
|
10529 |
{
|
10530 |
"name": "Dutch",
|
|
|
10547 |
]
|
10548 |
},
|
10549 |
"BG": {
|
10550 |
+
"score": 0.18479041916167663,
|
10551 |
"languages": [
|
10552 |
{
|
10553 |
"name": "English",
|
|
|
10559 |
"name": "Russian",
|
10560 |
"bcp_47": "ru",
|
10561 |
"population": 1602387,
|
10562 |
+
"score": 0.45
|
10563 |
},
|
10564 |
{
|
10565 |
"name": "German",
|
10566 |
"bcp_47": "de",
|
10567 |
"population": 557352,
|
10568 |
+
"score": 0.49
|
10569 |
},
|
10570 |
{
|
10571 |
"name": "Turkish",
|
10572 |
"bcp_47": "tr",
|
10573 |
"population": 766359,
|
10574 |
+
"score": 0.44
|
10575 |
},
|
10576 |
{
|
10577 |
"name": "Bulgarian",
|
|
|
10582 |
]
|
10583 |
},
|
10584 |
"BI": {
|
10585 |
+
"score": 0.2226670965568091,
|
10586 |
"languages": [
|
10587 |
{
|
10588 |
"name": "English",
|
|
|
10600 |
"name": "Swahili",
|
10601 |
"bcp_47": "sw",
|
10602 |
"population": 6408,
|
10603 |
+
"score": 0.45
|
10604 |
},
|
10605 |
{
|
10606 |
"name": "Rundi",
|
|
|
10645 |
]
|
10646 |
},
|
10647 |
"BR": {
|
10648 |
+
"score": 0.45070787745315494,
|
10649 |
"languages": [
|
10650 |
{
|
10651 |
"name": "English",
|
|
|
10663 |
"name": "Portuguese",
|
10664 |
"bcp_47": "pt",
|
10665 |
"population": 192661560,
|
10666 |
+
"score": 0.45
|
10667 |
},
|
10668 |
{
|
10669 |
"name": "German",
|
10670 |
"bcp_47": "de",
|
10671 |
"population": 1778414,
|
10672 |
+
"score": 0.49
|
10673 |
},
|
10674 |
{
|
10675 |
"name": "Japanese",
|
10676 |
"bcp_47": "ja",
|
10677 |
"population": 444604,
|
10678 |
+
"score": 0.46
|
10679 |
},
|
10680 |
{
|
10681 |
"name": "Korean",
|
10682 |
"bcp_47": "ko",
|
10683 |
"population": 44460,
|
10684 |
+
"score": 0.41
|
10685 |
},
|
10686 |
{
|
10687 |
"name": "Italian",
|
10688 |
"bcp_47": "it",
|
10689 |
"population": 592805,
|
10690 |
+
"score": 0.47
|
10691 |
},
|
10692 |
{
|
10693 |
"name": "Venetian",
|
|
|
10819 |
]
|
10820 |
},
|
10821 |
"CA": {
|
10822 |
+
"score": 0.4538591979207903,
|
10823 |
"languages": [
|
10824 |
{
|
10825 |
"name": "English",
|
|
|
10873 |
"name": "Portuguese",
|
10874 |
"bcp_47": "pt",
|
10875 |
"population": 229934,
|
10876 |
+
"score": 0.45
|
10877 |
},
|
10878 |
{
|
10879 |
"name": "Punjabi",
|
10880 |
"bcp_47": "pa",
|
10881 |
"population": 603106,
|
10882 |
+
"score": 0.43
|
10883 |
},
|
10884 |
{
|
10885 |
"name": "Russian",
|
10886 |
"bcp_47": "ru",
|
10887 |
"population": 211087,
|
10888 |
+
"score": 0.45
|
10889 |
},
|
10890 |
{
|
10891 |
"name": "German",
|
10892 |
"bcp_47": "de",
|
10893 |
"population": 294014,
|
10894 |
+
"score": 0.49
|
10895 |
},
|
10896 |
{
|
10897 |
"name": "Japanese",
|
10898 |
"bcp_47": "ja",
|
10899 |
"population": 52772,
|
10900 |
+
"score": 0.46
|
10901 |
},
|
10902 |
{
|
10903 |
"name": "Vietnamese",
|
10904 |
"bcp_47": "vi",
|
10905 |
"population": 184701,
|
10906 |
+
"score": 0.45
|
10907 |
},
|
10908 |
{
|
10909 |
"name": "Tamil",
|
10910 |
"bcp_47": "ta",
|
10911 |
"population": 184701,
|
10912 |
+
"score": 0.41
|
10913 |
},
|
10914 |
{
|
10915 |
"name": "Persian",
|
10916 |
"bcp_47": "fa",
|
10917 |
"population": 245012,
|
10918 |
+
"score": 0.41
|
10919 |
},
|
10920 |
{
|
10921 |
"name": "Turkish",
|
10922 |
"bcp_47": "tr",
|
10923 |
"population": 37694,
|
10924 |
+
"score": 0.44
|
10925 |
},
|
10926 |
{
|
10927 |
"name": "Cantonese",
|
10928 |
"bcp_47": "yue",
|
10929 |
"population": 640800,
|
10930 |
+
"score": 0.39
|
10931 |
},
|
10932 |
{
|
10933 |
"name": "Korean",
|
10934 |
"bcp_47": "ko",
|
10935 |
"population": 169623,
|
10936 |
+
"score": 0.41
|
10937 |
},
|
10938 |
{
|
10939 |
"name": "Italian",
|
10940 |
"bcp_47": "it",
|
10941 |
"population": 343016,
|
10942 |
+
"score": 0.47
|
10943 |
},
|
10944 |
{
|
10945 |
"name": "Filipino",
|
10946 |
"bcp_47": "fil",
|
10947 |
"population": 565412,
|
10948 |
+
"score": 0.42
|
10949 |
},
|
10950 |
{
|
10951 |
"name": "Gujarati",
|
10952 |
"bcp_47": "gu",
|
10953 |
"population": 135699,
|
10954 |
+
"score": 0.42
|
10955 |
},
|
10956 |
{
|
10957 |
"name": "Polish",
|
|
|
11189 |
]
|
11190 |
},
|
11191 |
"CH": {
|
11192 |
+
"score": 0.33368138748580556,
|
11193 |
"languages": [
|
11194 |
{
|
11195 |
"name": "English",
|
|
|
11207 |
"name": "Portuguese",
|
11208 |
"bcp_47": "pt",
|
11209 |
"population": 285736,
|
11210 |
+
"score": 0.45
|
11211 |
},
|
11212 |
{
|
11213 |
"name": "German",
|
11214 |
"bcp_47": "de",
|
11215 |
"population": 6134913,
|
11216 |
+
"score": 0.49
|
11217 |
},
|
11218 |
{
|
11219 |
"name": "Italian",
|
11220 |
"bcp_47": "it",
|
11221 |
"population": 361372,
|
11222 |
+
"score": 0.47
|
11223 |
},
|
11224 |
{
|
11225 |
"name": "Swiss German",
|
|
|
11455 |
]
|
11456 |
},
|
11457 |
"CN": {
|
11458 |
+
"score": 0.38724457341349466,
|
11459 |
"languages": [
|
11460 |
{
|
11461 |
"name": "English",
|
|
|
11473 |
"name": "Russian",
|
11474 |
"bcp_47": "ru",
|
11475 |
"population": 13940,
|
11476 |
+
"score": 0.45
|
11477 |
},
|
11478 |
{
|
11479 |
"name": "Vietnamese",
|
11480 |
"bcp_47": "vi",
|
11481 |
"population": 6970,
|
11482 |
+
"score": 0.45
|
11483 |
},
|
11484 |
{
|
11485 |
"name": "Wu Chinese",
|
|
|
11491 |
"name": "Cantonese",
|
11492 |
"bcp_47": "yue",
|
11493 |
"population": 72489040,
|
11494 |
+
"score": 0.39
|
11495 |
},
|
11496 |
{
|
11497 |
"name": "Korean",
|
11498 |
"bcp_47": "ko",
|
11499 |
"population": 2091030,
|
11500 |
+
"score": 0.41
|
11501 |
},
|
11502 |
{
|
11503 |
"name": "Xiang Chinese",
|
|
|
11649 |
]
|
11650 |
},
|
11651 |
"CY": {
|
11652 |
+
"score": 0.2404799926753925,
|
11653 |
"languages": [
|
11654 |
{
|
11655 |
"name": "English",
|
|
|
11673 |
"name": "Turkish",
|
11674 |
"bcp_47": "tr",
|
11675 |
"population": 291336,
|
11676 |
+
"score": 0.44
|
11677 |
},
|
11678 |
{
|
11679 |
"name": "Greek",
|
|
|
11690 |
]
|
11691 |
},
|
11692 |
"CZ": {
|
11693 |
+
"score": 0.12805930282531847,
|
11694 |
"languages": [
|
11695 |
{
|
11696 |
"name": "English",
|
|
|
11702 |
"name": "German",
|
11703 |
"bcp_47": "de",
|
11704 |
"population": 1605375,
|
11705 |
+
"score": 0.49
|
11706 |
},
|
11707 |
{
|
11708 |
"name": "Polish",
|
|
|
11725 |
]
|
11726 |
},
|
11727 |
"DE": {
|
11728 |
+
"score": 0.3765932308207555,
|
11729 |
"languages": [
|
11730 |
{
|
11731 |
"name": "English",
|
|
|
11749 |
"name": "Russian",
|
11750 |
"bcp_47": "ru",
|
11751 |
"population": 4809582,
|
11752 |
+
"score": 0.45
|
11753 |
},
|
11754 |
{
|
11755 |
"name": "German",
|
11756 |
"bcp_47": "de",
|
11757 |
"population": 72945327,
|
11758 |
+
"score": 0.49
|
11759 |
},
|
11760 |
{
|
11761 |
"name": "Turkish",
|
11762 |
"bcp_47": "tr",
|
11763 |
"population": 2003992,
|
11764 |
+
"score": 0.44
|
11765 |
},
|
11766 |
{
|
11767 |
"name": "Italian",
|
11768 |
"bcp_47": "it",
|
11769 |
"population": 5611179,
|
11770 |
+
"score": 0.47
|
11771 |
},
|
11772 |
{
|
11773 |
"name": "Polish",
|
|
|
11891 |
]
|
11892 |
},
|
11893 |
"DK": {
|
11894 |
+
"score": 0.2649269539952979,
|
11895 |
"languages": [
|
11896 |
{
|
11897 |
"name": "English",
|
|
|
11903 |
"name": "German",
|
11904 |
"bcp_47": "de",
|
11905 |
"population": 2758623,
|
11906 |
+
"score": 0.49
|
11907 |
},
|
11908 |
{
|
11909 |
"name": "Swedish",
|
|
|
12001 |
]
|
12002 |
},
|
12003 |
"EE": {
|
12004 |
+
"score": 0.23907703243578238,
|
12005 |
"languages": [
|
12006 |
{
|
12007 |
"name": "English",
|
|
|
12013 |
"name": "Russian",
|
12014 |
"bcp_47": "ru",
|
12015 |
"population": 688027,
|
12016 |
+
"score": 0.45
|
12017 |
},
|
12018 |
{
|
12019 |
"name": "Finnish",
|
|
|
12042 |
]
|
12043 |
},
|
12044 |
"EG": {
|
12045 |
+
"score": 0.4156717299521135,
|
12046 |
"languages": [
|
12047 |
{
|
12048 |
"name": "English",
|
|
|
12060 |
"name": "Egyptian Arabic",
|
12061 |
"bcp_47": "arz",
|
12062 |
"population": 66639360,
|
12063 |
+
"score": 0.38
|
12064 |
},
|
12065 |
{
|
12066 |
"name": "Greek",
|
|
|
12236 |
]
|
12237 |
},
|
12238 |
"FI": {
|
12239 |
+
"score": 0.18533875082776866,
|
12240 |
"languages": [
|
12241 |
{
|
12242 |
"name": "English",
|
|
|
12248 |
"name": "Russian",
|
12249 |
"bcp_47": "ru",
|
12250 |
"population": 45131,
|
12251 |
+
"score": 0.45
|
12252 |
},
|
12253 |
{
|
12254 |
"name": "German",
|
12255 |
"bcp_47": "de",
|
12256 |
"population": 1002901,
|
12257 |
+
"score": 0.49
|
12258 |
},
|
12259 |
{
|
12260 |
"name": "Swedish",
|
|
|
12388 |
]
|
12389 |
},
|
12390 |
"FR": {
|
12391 |
+
"score": 0.4436463938115849,
|
12392 |
"languages": [
|
12393 |
{
|
12394 |
"name": "English",
|
|
|
12412 |
"name": "Portuguese",
|
12413 |
"bcp_47": "pt",
|
12414 |
"population": 882027,
|
12415 |
+
"score": 0.45
|
12416 |
},
|
12417 |
{
|
12418 |
"name": "German",
|
12419 |
"bcp_47": "de",
|
12420 |
"population": 3392410,
|
12421 |
+
"score": 0.49
|
12422 |
},
|
12423 |
{
|
12424 |
"name": "Italian",
|
12425 |
"bcp_47": "it",
|
12426 |
"population": 1153419,
|
12427 |
+
"score": 0.47
|
12428 |
},
|
12429 |
{
|
12430 |
"name": "Dutch",
|
|
|
12495 |
]
|
12496 |
},
|
12497 |
"GB": {
|
12498 |
+
"score": 0.43956766255639257,
|
12499 |
"languages": [
|
12500 |
{
|
12501 |
"name": "English",
|
|
|
12543 |
"name": "Portuguese",
|
12544 |
"bcp_47": "pt",
|
12545 |
"population": 131522,
|
12546 |
+
"score": 0.45
|
12547 |
},
|
12548 |
{
|
12549 |
"name": "Punjabi",
|
12550 |
"bcp_47": "pa",
|
12551 |
"population": 2367400,
|
12552 |
+
"score": 0.43
|
12553 |
},
|
12554 |
{
|
12555 |
"name": "German",
|
12556 |
"bcp_47": "de",
|
12557 |
"population": 5918499,
|
12558 |
+
"score": 0.49
|
12559 |
},
|
12560 |
{
|
12561 |
"name": "Tamil",
|
12562 |
"bcp_47": "ta",
|
12563 |
"population": 2104355,
|
12564 |
+
"score": 0.41
|
12565 |
},
|
12566 |
{
|
12567 |
"name": "Turkish",
|
12568 |
"bcp_47": "tr",
|
12569 |
"population": 131522,
|
12570 |
+
"score": 0.44
|
12571 |
},
|
12572 |
{
|
12573 |
"name": "Italian",
|
12574 |
"bcp_47": "it",
|
12575 |
"population": 131522,
|
12576 |
+
"score": 0.47
|
12577 |
},
|
12578 |
{
|
12579 |
"name": "Gujarati",
|
12580 |
"bcp_47": "gu",
|
12581 |
"population": 1907072,
|
12582 |
+
"score": 0.42
|
12583 |
},
|
12584 |
{
|
12585 |
"name": "Polish",
|
|
|
12765 |
]
|
12766 |
},
|
12767 |
"GR": {
|
12768 |
+
"score": 0.18194383576443016,
|
12769 |
"languages": [
|
12770 |
{
|
12771 |
"name": "English",
|
|
|
12783 |
"name": "German",
|
12784 |
"bcp_47": "de",
|
12785 |
"population": 530355,
|
12786 |
+
"score": 0.49
|
12787 |
},
|
12788 |
{
|
12789 |
"name": "Turkish",
|
12790 |
"bcp_47": "tr",
|
12791 |
"population": 127285,
|
12792 |
+
"score": 0.44
|
12793 |
},
|
12794 |
{
|
12795 |
"name": "Greek",
|
|
|
12869 |
]
|
12870 |
},
|
12871 |
"HK": {
|
12872 |
+
"score": 0.4359751035397035,
|
12873 |
"languages": [
|
12874 |
{
|
12875 |
"name": "English",
|
|
|
12887 |
"name": "Cantonese",
|
12888 |
"bcp_47": "yue",
|
12889 |
"population": 6524919,
|
12890 |
+
"score": 0.39
|
12891 |
}
|
12892 |
]
|
12893 |
},
|
|
|
12920 |
]
|
12921 |
},
|
12922 |
"HR": {
|
12923 |
+
"score": 0.15823024946225459,
|
12924 |
"languages": [
|
12925 |
{
|
12926 |
"name": "English",
|
|
|
12932 |
"name": "Italian",
|
12933 |
"bcp_47": "it",
|
12934 |
"population": 67644,
|
12935 |
+
"score": 0.47
|
12936 |
},
|
12937 |
{
|
12938 |
"name": "Croatian",
|
|
|
12949 |
]
|
12950 |
},
|
12951 |
"HU": {
|
12952 |
+
"score": 0.13756219151316587,
|
12953 |
"languages": [
|
12954 |
{
|
12955 |
"name": "English",
|
|
|
12967 |
"name": "German",
|
12968 |
"bcp_47": "de",
|
12969 |
"population": 1758929,
|
12970 |
+
"score": 0.49
|
12971 |
},
|
12972 |
{
|
12973 |
"name": "Romanian",
|
|
|
13025 |
]
|
13026 |
},
|
13027 |
"IL": {
|
13028 |
+
"score": 0.21817259544999,
|
13029 |
"languages": [
|
13030 |
{
|
13031 |
"name": "English",
|
|
|
13043 |
"name": "Russian",
|
13044 |
"bcp_47": "ru",
|
13045 |
"population": 954303,
|
13046 |
+
"score": 0.45
|
13047 |
},
|
13048 |
{
|
13049 |
"name": "Malayalam",
|
|
|
13125 |
]
|
13126 |
},
|
13127 |
"IN": {
|
13128 |
+
"score": 0.3397907454052606,
|
13129 |
"languages": [
|
13130 |
{
|
13131 |
"name": "English",
|
|
|
13155 |
"name": "Punjabi",
|
13156 |
"bcp_47": "pa",
|
13157 |
"population": 37130520,
|
13158 |
+
"score": 0.43
|
13159 |
},
|
13160 |
{
|
13161 |
"name": "Telugu",
|
13162 |
"bcp_47": "te",
|
13163 |
"population": 95478480,
|
13164 |
+
"score": 0.41
|
13165 |
},
|
13166 |
{
|
13167 |
"name": "Western Panjabi",
|
|
|
13173 |
"name": "Marathi",
|
13174 |
"bcp_47": "mr",
|
13175 |
"population": 92826300,
|
13176 |
+
"score": 0.45
|
13177 |
},
|
13178 |
{
|
13179 |
"name": "Tamil",
|
13180 |
"bcp_47": "ta",
|
13181 |
"population": 78239310,
|
13182 |
+
"score": 0.41
|
13183 |
},
|
13184 |
{
|
13185 |
"name": "Gujarati",
|
13186 |
"bcp_47": "gu",
|
13187 |
"population": 59674050,
|
13188 |
+
"score": 0.42
|
13189 |
},
|
13190 |
{
|
13191 |
"name": "Kannada",
|
|
|
13603 |
]
|
13604 |
},
|
13605 |
"IQ": {
|
13606 |
+
"score": 0.357837983423388,
|
13607 |
"languages": [
|
13608 |
{
|
13609 |
"name": "English",
|
|
|
13621 |
"name": "Persian",
|
13622 |
"bcp_47": "fa",
|
13623 |
"population": 338192,
|
13624 |
+
"score": 0.41
|
13625 |
},
|
13626 |
{
|
13627 |
"name": "Azerbaijani",
|
|
|
13650 |
]
|
13651 |
},
|
13652 |
"IT": {
|
13653 |
+
"score": 0.43224641662655555,
|
13654 |
"languages": [
|
13655 |
{
|
13656 |
"name": "English",
|
|
|
13668 |
"name": "German",
|
13669 |
"bcp_47": "de",
|
13670 |
"population": 998443,
|
13671 |
+
"score": 0.49
|
13672 |
},
|
13673 |
{
|
13674 |
"name": "Italian",
|
13675 |
"bcp_47": "it",
|
13676 |
"population": 59282565,
|
13677 |
+
"score": 0.47
|
13678 |
},
|
13679 |
{
|
13680 |
"name": "Greek",
|
|
|
13820 |
]
|
13821 |
},
|
13822 |
"KE": {
|
13823 |
+
"score": 0.2501476621404106,
|
13824 |
"languages": [
|
13825 |
{
|
13826 |
"name": "English",
|
|
|
13838 |
"name": "Punjabi",
|
13839 |
"bcp_47": "pa",
|
13840 |
"population": 10170,
|
13841 |
+
"score": 0.43
|
13842 |
},
|
13843 |
{
|
13844 |
"name": "Swahili",
|
13845 |
"bcp_47": "sw",
|
13846 |
"population": 35328414,
|
13847 |
+
"score": 0.45
|
13848 |
},
|
13849 |
{
|
13850 |
"name": "Gujarati",
|
13851 |
"bcp_47": "gu",
|
13852 |
"population": 4978,
|
13853 |
+
"score": 0.42
|
13854 |
},
|
13855 |
{
|
13856 |
"name": "Oromo",
|
|
|
13984 |
]
|
13985 |
},
|
13986 |
"KZ": {
|
13987 |
+
"score": 0.2671643693028198,
|
13988 |
"languages": [
|
13989 |
{
|
13990 |
"name": "English",
|
|
|
13996 |
"name": "Russian",
|
13997 |
"bcp_47": "ru",
|
13998 |
"population": 13746168,
|
13999 |
+
"score": 0.45
|
14000 |
},
|
14001 |
{
|
14002 |
"name": "German",
|
14003 |
"bcp_47": "de",
|
14004 |
"population": 1221882,
|
14005 |
+
"score": 0.49
|
14006 |
},
|
14007 |
{
|
14008 |
"name": "Kazakh",
|
|
|
14071 |
]
|
14072 |
},
|
14073 |
"LK": {
|
14074 |
+
"score": 0.11666666666666665,
|
14075 |
"languages": [
|
14076 |
{
|
14077 |
"name": "English",
|
|
|
14083 |
"name": "Tamil",
|
14084 |
"bcp_47": "ta",
|
14085 |
"population": 3433380,
|
14086 |
+
"score": 0.41
|
14087 |
},
|
14088 |
{
|
14089 |
"name": "Sinhala",
|
|
|
14164 |
]
|
14165 |
},
|
14166 |
"LT": {
|
14167 |
+
"score": 0.2785320836068621,
|
14168 |
"languages": [
|
14169 |
{
|
14170 |
"name": "English",
|
|
|
14176 |
"name": "Russian",
|
14177 |
"bcp_47": "ru",
|
14178 |
"population": 2185168,
|
14179 |
+
"score": 0.45
|
14180 |
},
|
14181 |
{
|
14182 |
"name": "German",
|
14183 |
"bcp_47": "de",
|
14184 |
"population": 382404,
|
14185 |
+
"score": 0.49
|
14186 |
},
|
14187 |
{
|
14188 |
"name": "Lithuanian",
|
|
|
14199 |
]
|
14200 |
},
|
14201 |
"LU": {
|
14202 |
+
"score": 0.3612802832567923,
|
14203 |
"languages": [
|
14204 |
{
|
14205 |
"name": "English",
|
|
|
14217 |
"name": "Portuguese",
|
14218 |
"bcp_47": "pt",
|
14219 |
"population": 100541,
|
14220 |
+
"score": 0.45
|
14221 |
},
|
14222 |
{
|
14223 |
"name": "German",
|
14224 |
"bcp_47": "de",
|
14225 |
"population": 395880,
|
14226 |
+
"score": 0.49
|
14227 |
},
|
14228 |
{
|
14229 |
"name": "Luxembourgish",
|
|
|
14234 |
]
|
14235 |
},
|
14236 |
"LV": {
|
14237 |
+
"score": 0.2515919974081345,
|
14238 |
"languages": [
|
14239 |
{
|
14240 |
"name": "English",
|
|
|
14246 |
"name": "Russian",
|
14247 |
"bcp_47": "ru",
|
14248 |
"population": 714867,
|
14249 |
+
"score": 0.45
|
14250 |
},
|
14251 |
{
|
14252 |
"name": "Latvian",
|
|
|
14362 |
]
|
14363 |
},
|
14364 |
"MO": {
|
14365 |
+
"score": 0.4597552187538731,
|
14366 |
"languages": [
|
14367 |
{
|
14368 |
"name": "English",
|
|
|
14380 |
"name": "Portuguese",
|
14381 |
"bcp_47": "pt",
|
14382 |
"population": 30723,
|
14383 |
+
"score": 0.45
|
14384 |
}
|
14385 |
]
|
14386 |
},
|
|
|
14413 |
]
|
14414 |
},
|
14415 |
"MT": {
|
14416 |
+
"score": 0.28525492889983195,
|
14417 |
"languages": [
|
14418 |
{
|
14419 |
"name": "English",
|
|
|
14431 |
"name": "Italian",
|
14432 |
"bcp_47": "it",
|
14433 |
"population": 256070,
|
14434 |
+
"score": 0.47
|
14435 |
},
|
14436 |
{
|
14437 |
"name": "Maltese",
|
|
|
14442 |
]
|
14443 |
},
|
14444 |
"MU": {
|
14445 |
+
"score": 0.19243355389764255,
|
14446 |
"languages": [
|
14447 |
{
|
14448 |
"name": "English",
|
|
|
14466 |
"name": "Tamil",
|
14467 |
"bcp_47": "ta",
|
14468 |
"population": 34484,
|
14469 |
+
"score": 0.41
|
14470 |
},
|
14471 |
{
|
14472 |
"name": "Bhojpuri",
|
|
|
14594 |
]
|
14595 |
},
|
14596 |
"MY": {
|
14597 |
+
"score": 0.1619475361727729,
|
14598 |
"languages": [
|
14599 |
{
|
14600 |
"name": "English",
|
|
|
14612 |
"name": "Javanese",
|
14613 |
"bcp_47": "jv",
|
14614 |
"population": 391825,
|
14615 |
+
"score": 0.41
|
14616 |
},
|
14617 |
{
|
14618 |
"name": "Tamil",
|
14619 |
"bcp_47": "ta",
|
14620 |
"population": 1371388,
|
14621 |
+
"score": 0.41
|
14622 |
},
|
14623 |
{
|
14624 |
"name": "Malayalam",
|
|
|
14665 |
]
|
14666 |
},
|
14667 |
"NA": {
|
14668 |
+
"score": 0.023383111654627774,
|
14669 |
"languages": [
|
14670 |
{
|
14671 |
"name": "English",
|
|
|
14677 |
"name": "German",
|
14678 |
"bcp_47": "de",
|
14679 |
"population": 23671,
|
14680 |
+
"score": 0.49
|
14681 |
},
|
14682 |
{
|
14683 |
"name": "Afrikaans",
|
|
|
14836 |
]
|
14837 |
},
|
14838 |
"NL": {
|
14839 |
+
"score": 0.28688749989149553,
|
14840 |
"languages": [
|
14841 |
{
|
14842 |
"name": "English",
|
|
|
14854 |
"name": "Indonesian",
|
14855 |
"bcp_47": "id",
|
14856 |
"population": 311047,
|
14857 |
+
"score": 0.47
|
14858 |
},
|
14859 |
{
|
14860 |
"name": "German",
|
14861 |
"bcp_47": "de",
|
14862 |
"population": 12269084,
|
14863 |
+
"score": 0.49
|
14864 |
},
|
14865 |
{
|
14866 |
"name": "Turkish",
|
14867 |
"bcp_47": "tr",
|
14868 |
"population": 207365,
|
14869 |
+
"score": 0.44
|
14870 |
},
|
14871 |
{
|
14872 |
"name": "Dutch",
|
|
|
15183 |
]
|
15184 |
},
|
15185 |
"PH": {
|
15186 |
+
"score": 0.32615211365536473,
|
15187 |
"languages": [
|
15188 |
{
|
15189 |
"name": "English",
|
|
|
15207 |
"name": "Filipino",
|
15208 |
"bcp_47": "fil",
|
15209 |
"population": 65508600,
|
15210 |
+
"score": 0.42
|
15211 |
},
|
15212 |
{
|
15213 |
"name": "Cebuano",
|
|
|
15308 |
]
|
15309 |
},
|
15310 |
"PK": {
|
15311 |
+
"score": 0.30567966556461956,
|
15312 |
"languages": [
|
15313 |
{
|
15314 |
"name": "English",
|
|
|
15326 |
"name": "Punjabi",
|
15327 |
"bcp_47": "pa",
|
15328 |
"population": 163450700,
|
15329 |
+
"score": 0.43
|
15330 |
},
|
15331 |
{
|
15332 |
"name": "Western Panjabi",
|
|
|
15338 |
"name": "Persian",
|
15339 |
"bcp_47": "fa",
|
15340 |
"population": 1541107,
|
15341 |
+
"score": 0.41
|
15342 |
},
|
15343 |
{
|
15344 |
"name": "Pashto",
|
|
|
15457 |
]
|
15458 |
},
|
15459 |
"PL": {
|
15460 |
+
"score": 0.19542647519424666,
|
15461 |
"languages": [
|
15462 |
{
|
15463 |
"name": "English",
|
|
|
15469 |
"name": "Russian",
|
15470 |
"bcp_47": "ru",
|
15471 |
"population": 6890814,
|
15472 |
+
"score": 0.45
|
15473 |
},
|
15474 |
{
|
15475 |
"name": "German",
|
15476 |
"bcp_47": "de",
|
15477 |
"population": 7273637,
|
15478 |
+
"score": 0.49
|
15479 |
},
|
15480 |
{
|
15481 |
"name": "Polish",
|
|
|
15573 |
]
|
15574 |
},
|
15575 |
"PT": {
|
15576 |
+
"score": 0.4542324762390237,
|
15577 |
"languages": [
|
15578 |
{
|
15579 |
"name": "English",
|
|
|
15597 |
"name": "Portuguese",
|
15598 |
"bcp_47": "pt",
|
15599 |
"population": 9890592,
|
15600 |
+
"score": 0.45
|
15601 |
},
|
15602 |
{
|
15603 |
"name": "Galician",
|
|
|
15625 |
]
|
15626 |
},
|
15627 |
"RO": {
|
15628 |
+
"score": 0.1743772772485309,
|
15629 |
"languages": [
|
15630 |
{
|
15631 |
"name": "English",
|
|
|
15649 |
"name": "German",
|
15650 |
"bcp_47": "de",
|
15651 |
"population": 44736,
|
15652 |
+
"score": 0.49
|
15653 |
},
|
15654 |
{
|
15655 |
"name": "Turkish",
|
15656 |
"bcp_47": "tr",
|
15657 |
"population": 27694,
|
15658 |
+
"score": 0.44
|
15659 |
},
|
15660 |
{
|
15661 |
"name": "Polish",
|
|
|
15883 |
]
|
15884 |
},
|
15885 |
"SG": {
|
15886 |
+
"score": 0.4294592881506046,
|
15887 |
"languages": [
|
15888 |
{
|
15889 |
"name": "English",
|
|
|
15901 |
"name": "Punjabi",
|
15902 |
"bcp_47": "pa",
|
15903 |
"population": 9314,
|
15904 |
+
"score": 0.43
|
15905 |
},
|
15906 |
{
|
15907 |
"name": "Tamil",
|
15908 |
"bcp_47": "ta",
|
15909 |
"population": 130403,
|
15910 |
+
"score": 0.41
|
15911 |
},
|
15912 |
{
|
15913 |
"name": "Malayalam",
|
|
|
15935 |
]
|
15936 |
},
|
15937 |
"SI": {
|
15938 |
+
"score": 0.1928028123892293,
|
15939 |
"languages": [
|
15940 |
{
|
15941 |
"name": "English",
|
|
|
15947 |
"name": "German",
|
15948 |
"bcp_47": "de",
|
15949 |
"population": 883126,
|
15950 |
+
"score": 0.49
|
15951 |
},
|
15952 |
{
|
15953 |
"name": "Italian",
|
15954 |
"bcp_47": "it",
|
15955 |
"population": 3995,
|
15956 |
+
"score": 0.47
|
15957 |
},
|
15958 |
{
|
15959 |
"name": "Hungarian",
|
|
|
15982 |
]
|
15983 |
},
|
15984 |
"SK": {
|
15985 |
+
"score": 0.11567670853229638,
|
15986 |
"languages": [
|
15987 |
{
|
15988 |
"name": "English",
|
|
|
15994 |
"name": "German",
|
15995 |
"bcp_47": "de",
|
15996 |
"population": 1196932,
|
15997 |
+
"score": 0.49
|
15998 |
},
|
15999 |
{
|
16000 |
"name": "Polish",
|
|
|
16290 |
]
|
16291 |
},
|
16292 |
"TR": {
|
16293 |
+
"score": 0.38853953080443926,
|
16294 |
"languages": [
|
16295 |
{
|
16296 |
"name": "English",
|
|
|
16308 |
"name": "Turkish",
|
16309 |
"bcp_47": "tr",
|
16310 |
"population": 76276275,
|
16311 |
+
"score": 0.44
|
16312 |
},
|
16313 |
{
|
16314 |
"name": "North Levantine Arabic",
|
|
|
16467 |
]
|
16468 |
},
|
16469 |
"TZ": {
|
16470 |
+
"score": 0.3952631230768349,
|
16471 |
"languages": [
|
16472 |
{
|
16473 |
"name": "English",
|
|
|
16479 |
"name": "Swahili",
|
16480 |
"bcp_47": "sw",
|
16481 |
"population": 52697520,
|
16482 |
+
"score": 0.45
|
16483 |
},
|
16484 |
{
|
16485 |
"name": "Sukuma",
|
|
|
16568 |
]
|
16569 |
},
|
16570 |
"UG": {
|
16571 |
+
"score": 0.2797477934487195,
|
16572 |
"languages": [
|
16573 |
{
|
16574 |
"name": "English",
|
|
|
16586 |
"name": "Swahili",
|
16587 |
"bcp_47": "sw",
|
16588 |
"population": 32439750,
|
16589 |
+
"score": 0.45
|
16590 |
},
|
16591 |
{
|
16592 |
"name": "Kinyarwanda",
|
|
|
16662 |
]
|
16663 |
},
|
16664 |
"US": {
|
16665 |
+
"score": 0.46680423711359387,
|
16666 |
"languages": [
|
16667 |
{
|
16668 |
"name": "English",
|
|
|
16692 |
"name": "Russian",
|
16693 |
"bcp_47": "ru",
|
16694 |
"population": 798334,
|
16695 |
+
"score": 0.45
|
16696 |
},
|
16697 |
{
|
16698 |
"name": "German",
|
16699 |
"bcp_47": "de",
|
16700 |
"population": 1563403,
|
16701 |
+
"score": 0.49
|
16702 |
},
|
16703 |
{
|
16704 |
"name": "Vietnamese",
|
16705 |
"bcp_47": "vi",
|
16706 |
"population": 1130973,
|
16707 |
+
"score": 0.45
|
16708 |
},
|
16709 |
{
|
16710 |
"name": "Korean",
|
16711 |
"bcp_47": "ko",
|
16712 |
"population": 997917,
|
16713 |
+
"score": 0.41
|
16714 |
},
|
16715 |
{
|
16716 |
"name": "Italian",
|
16717 |
"bcp_47": "it",
|
16718 |
"population": 1130973,
|
16719 |
+
"score": 0.47
|
16720 |
},
|
16721 |
{
|
16722 |
"name": "Filipino",
|
16723 |
"bcp_47": "fil",
|
16724 |
"population": 1397084,
|
16725 |
+
"score": 0.42
|
16726 |
},
|
16727 |
{
|
16728 |
"name": "Yiddish",
|
|
|
16925 |
]
|
16926 |
},
|
16927 |
"ZA": {
|
16928 |
+
"score": 0.12442237800209865,
|
16929 |
"languages": [
|
16930 |
{
|
16931 |
"name": "English",
|
|
|
16943 |
"name": "Swahili",
|
16944 |
"bcp_47": "sw",
|
16945 |
"population": 1016,
|
16946 |
+
"score": 0.45
|
16947 |
},
|
16948 |
{
|
16949 |
"name": "Zulu",
|
|
|
17125 |
]
|
17126 |
},
|
17127 |
"ID": {
|
17128 |
+
"score": 0.3194548673228042,
|
17129 |
"languages": [
|
17130 |
{
|
17131 |
"name": "Chinese",
|
|
|
17137 |
"name": "Indonesian",
|
17138 |
"bcp_47": "id",
|
17139 |
"population": 170896640,
|
17140 |
+
"score": 0.47
|
17141 |
},
|
17142 |
{
|
17143 |
"name": "Javanese",
|
17144 |
"bcp_47": "jv",
|
17145 |
"population": 90788840,
|
17146 |
+
"score": 0.41
|
17147 |
},
|
17148 |
{
|
17149 |
"name": "Malay",
|
|
|
17304 |
]
|
17305 |
},
|
17306 |
"MN": {
|
17307 |
+
"score": 0.006903243016889744,
|
17308 |
"languages": [
|
17309 |
{
|
17310 |
"name": "Chinese",
|
|
|
17316 |
"name": "Russian",
|
17317 |
"bcp_47": "ru",
|
17318 |
"population": 4118,
|
17319 |
+
"score": 0.45
|
17320 |
},
|
17321 |
{
|
17322 |
"name": "Kazakh",
|
|
|
17408 |
]
|
17409 |
},
|
17410 |
"VN": {
|
17411 |
+
"score": 0.44527479082463184,
|
17412 |
"languages": [
|
17413 |
{
|
17414 |
"name": "Chinese",
|
|
|
17420 |
"name": "Vietnamese",
|
17421 |
"bcp_47": "vi",
|
17422 |
"population": 84900318,
|
17423 |
+
"score": 0.45
|
17424 |
},
|
17425 |
{
|
17426 |
"name": "Hmong Njua",
|
|
|
17603 |
]
|
17604 |
},
|
17605 |
"GQ": {
|
17606 |
+
"score": 0.27923739669086073,
|
17607 |
"languages": [
|
17608 |
{
|
17609 |
"name": "Spanish",
|
|
|
17621 |
"name": "Portuguese",
|
17622 |
"bcp_47": "pt",
|
17623 |
"population": 1,
|
17624 |
+
"score": 0.45
|
17625 |
},
|
17626 |
{
|
17627 |
"name": "Fang",
|
|
|
17700 |
]
|
17701 |
},
|
17702 |
"PY": {
|
17703 |
+
"score": 0.03322879759433273,
|
17704 |
"languages": [
|
17705 |
{
|
17706 |
"name": "Spanish",
|
|
|
17712 |
"name": "German",
|
17713 |
"bcp_47": "de",
|
17714 |
"population": 208559,
|
17715 |
+
"score": 0.49
|
17716 |
},
|
17717 |
{
|
17718 |
"name": "Guarani",
|
|
|
17819 |
]
|
17820 |
},
|
17821 |
"IR": {
|
17822 |
+
"score": 0.23949254115959248,
|
17823 |
"languages": [
|
17824 |
{
|
17825 |
"name": "Arabic",
|
|
|
17831 |
"name": "Persian",
|
17832 |
"bcp_47": "fa",
|
17833 |
"population": 63692475,
|
17834 |
+
"score": 0.41
|
17835 |
},
|
17836 |
{
|
17837 |
"name": "Pashto",
|
|
|
18166 |
]
|
18167 |
},
|
18168 |
"OM": {
|
18169 |
+
"score": 0.3961930102252659,
|
18170 |
"languages": [
|
18171 |
{
|
18172 |
"name": "Arabic",
|
|
|
18178 |
"name": "Persian",
|
18179 |
"bcp_47": "fa",
|
18180 |
"population": 43849,
|
18181 |
+
"score": 0.41
|
18182 |
},
|
18183 |
{
|
18184 |
"name": "Baluchi",
|
|
|
18206 |
]
|
18207 |
},
|
18208 |
"QA": {
|
18209 |
+
"score": 0.41777205848450016,
|
18210 |
"languages": [
|
18211 |
{
|
18212 |
"name": "Arabic",
|
|
|
18218 |
"name": "Persian",
|
18219 |
"bcp_47": "fa",
|
18220 |
"population": 268859,
|
18221 |
+
"score": 0.41
|
18222 |
},
|
18223 |
{
|
18224 |
"name": "Malayalam",
|
|
|
18246 |
]
|
18247 |
},
|
18248 |
"SO": {
|
18249 |
+
"score": 0.1326691120161243,
|
18250 |
"languages": [
|
18251 |
{
|
18252 |
"name": "Arabic",
|
|
|
18258 |
"name": "Swahili",
|
18259 |
"bcp_47": "sw",
|
18260 |
"population": 235142,
|
18261 |
+
"score": 0.45
|
18262 |
},
|
18263 |
{
|
18264 |
"name": "Oromo",
|
|
|
18333 |
]
|
18334 |
},
|
18335 |
"TJ": {
|
18336 |
+
"score": 0.05075244729560809,
|
18337 |
"languages": [
|
18338 |
{
|
18339 |
"name": "Arabic",
|
|
|
18345 |
"name": "Russian",
|
18346 |
"bcp_47": "ru",
|
18347 |
"population": 1064840,
|
18348 |
+
"score": 0.45
|
18349 |
},
|
18350 |
{
|
18351 |
"name": "Persian",
|
18352 |
"bcp_47": "fa",
|
18353 |
"population": 69215,
|
18354 |
+
"score": 0.41
|
18355 |
},
|
18356 |
{
|
18357 |
"name": "Tajik",
|
|
|
18454 |
]
|
18455 |
},
|
18456 |
"CD": {
|
18457 |
+
"score": 0.34013185580025246,
|
18458 |
"languages": [
|
18459 |
{
|
18460 |
"name": "French",
|
|
|
18466 |
"name": "Swahili",
|
18467 |
"bcp_47": "sw",
|
18468 |
"population": 50890000,
|
18469 |
+
"score": 0.45
|
18470 |
},
|
18471 |
{
|
18472 |
"name": "Kinyarwanda",
|
|
|
18718 |
]
|
18719 |
},
|
18720 |
"RE": {
|
18721 |
+
"score": 0.26908571814147125,
|
18722 |
"languages": [
|
18723 |
{
|
18724 |
"name": "French",
|
|
|
18730 |
"name": "Tamil",
|
18731 |
"bcp_47": "ta",
|
18732 |
"population": 118138,
|
18733 |
+
"score": 0.41
|
18734 |
},
|
18735 |
{
|
18736 |
"name": "Réunion Creole French",
|
|
|
18887 |
]
|
18888 |
},
|
18889 |
"YT": {
|
18890 |
+
"score": 0.15850059031877214,
|
18891 |
"languages": [
|
18892 |
{
|
18893 |
"name": "French",
|
|
|
18899 |
"name": "Swahili",
|
18900 |
"bcp_47": "sw",
|
18901 |
"population": 2716,
|
18902 |
+
"score": 0.45
|
18903 |
},
|
18904 |
{
|
18905 |
"name": "Comorian",
|
|
|
18916 |
]
|
18917 |
},
|
18918 |
"AO": {
|
18919 |
+
"score": 0.2478014326653792,
|
18920 |
"languages": [
|
18921 |
{
|
18922 |
"name": "Portuguese",
|
18923 |
"bcp_47": "pt",
|
18924 |
"population": 21789941,
|
18925 |
+
"score": 0.45
|
18926 |
},
|
18927 |
{
|
18928 |
"name": "Umbundu",
|
|
|
18945 |
]
|
18946 |
},
|
18947 |
"CV": {
|
18948 |
+
"score": 0.20479048002332564,
|
18949 |
"languages": [
|
18950 |
{
|
18951 |
"name": "Portuguese",
|
18952 |
"bcp_47": "pt",
|
18953 |
"population": 443274,
|
18954 |
+
"score": 0.45
|
18955 |
},
|
18956 |
{
|
18957 |
"name": "Kabuverdianu",
|
|
|
18962 |
]
|
18963 |
},
|
18964 |
"GW": {
|
18965 |
+
"score": 0.43859551519338624,
|
18966 |
"languages": [
|
18967 |
{
|
18968 |
"name": "Portuguese",
|
18969 |
"bcp_47": "pt",
|
18970 |
"population": 1927100,
|
18971 |
+
"score": 0.45
|
18972 |
},
|
18973 |
{
|
18974 |
"name": "Fula",
|
|
|
18985 |
]
|
18986 |
},
|
18987 |
"MZ": {
|
18988 |
+
"score": 0.1480934184335346,
|
18989 |
"languages": [
|
18990 |
{
|
18991 |
"name": "Portuguese",
|
18992 |
"bcp_47": "pt",
|
18993 |
"population": 8126514,
|
18994 |
+
"score": 0.45
|
18995 |
},
|
18996 |
{
|
18997 |
"name": "Swahili",
|
18998 |
"bcp_47": "sw",
|
18999 |
"population": 9330,
|
19000 |
+
"score": 0.45
|
19001 |
},
|
19002 |
{
|
19003 |
"name": "Nyanja",
|
|
|
19062 |
]
|
19063 |
},
|
19064 |
"ST": {
|
19065 |
+
"score": 0.45,
|
19066 |
"languages": [
|
19067 |
{
|
19068 |
"name": "Portuguese",
|
19069 |
"bcp_47": "pt",
|
19070 |
"population": 179454,
|
19071 |
+
"score": 0.45
|
19072 |
}
|
19073 |
]
|
19074 |
},
|
19075 |
"TL": {
|
19076 |
+
"score": 0.225,
|
19077 |
"languages": [
|
19078 |
{
|
19079 |
"name": "Portuguese",
|
19080 |
"bcp_47": "pt",
|
19081 |
"population": 816395,
|
19082 |
+
"score": 0.45
|
19083 |
},
|
19084 |
{
|
19085 |
"name": "Tetum",
|
|
|
19090 |
]
|
19091 |
},
|
19092 |
"BY": {
|
19093 |
+
"score": 0.04821427057437069,
|
19094 |
"languages": [
|
19095 |
{
|
19096 |
"name": "Russian",
|
19097 |
"bcp_47": "ru",
|
19098 |
"population": 1137350,
|
19099 |
+
"score": 0.45
|
19100 |
},
|
19101 |
{
|
19102 |
"name": "Belarusian",
|
|
|
19107 |
]
|
19108 |
},
|
19109 |
"GE": {
|
19110 |
+
"score": 0.03423789210395573,
|
19111 |
"languages": [
|
19112 |
{
|
19113 |
"name": "Russian",
|
19114 |
"bcp_47": "ru",
|
19115 |
"population": 359730,
|
19116 |
+
"score": 0.45
|
19117 |
},
|
19118 |
{
|
19119 |
"name": "Kurdish",
|
|
|
19154 |
]
|
19155 |
},
|
19156 |
"KG": {
|
19157 |
+
"score": 0.19285714285714287,
|
19158 |
"languages": [
|
19159 |
{
|
19160 |
"name": "Russian",
|
19161 |
"bcp_47": "ru",
|
19162 |
"population": 2147364,
|
19163 |
+
"score": 0.45
|
19164 |
},
|
19165 |
{
|
19166 |
"name": "Kyrgyz",
|
|
|
19171 |
]
|
19172 |
},
|
19173 |
"MD": {
|
19174 |
+
"score": 0.014563109130777574,
|
19175 |
"languages": [
|
19176 |
{
|
19177 |
"name": "Russian",
|
19178 |
"bcp_47": "ru",
|
19179 |
"population": 100935,
|
19180 |
+
"score": 0.45
|
19181 |
},
|
19182 |
{
|
19183 |
"name": "Ukrainian",
|
|
|
19206 |
]
|
19207 |
},
|
19208 |
"RU": {
|
19209 |
+
"score": 0.4065329789745318,
|
19210 |
"languages": [
|
19211 |
{
|
19212 |
"name": "Russian",
|
19213 |
"bcp_47": "ru",
|
19214 |
"population": 133218680,
|
19215 |
+
"score": 0.45
|
19216 |
},
|
19217 |
{
|
19218 |
"name": "Azerbaijani",
|
|
|
19427 |
]
|
19428 |
},
|
19429 |
"SJ": {
|
19430 |
+
"score": 0.20059435364041606,
|
19431 |
"languages": [
|
19432 |
{
|
19433 |
"name": "Russian",
|
19434 |
"bcp_47": "ru",
|
19435 |
"population": 1200,
|
19436 |
+
"score": 0.45
|
19437 |
},
|
19438 |
{
|
19439 |
"name": "Norwegian Bokmål",
|
|
|
19444 |
]
|
19445 |
},
|
19446 |
"TM": {
|
19447 |
+
"score": 0.059080984625687366,
|
19448 |
"languages": [
|
19449 |
{
|
19450 |
"name": "Russian",
|
19451 |
"bcp_47": "ru",
|
19452 |
"population": 663436,
|
19453 |
+
"score": 0.45
|
19454 |
},
|
19455 |
{
|
19456 |
"name": "Uzbek",
|
|
|
19473 |
]
|
19474 |
},
|
19475 |
"UA": {
|
19476 |
+
"score": 0.17534632621240526,
|
19477 |
"languages": [
|
19478 |
{
|
19479 |
"name": "Russian",
|
19480 |
"bcp_47": "ru",
|
19481 |
"population": 20204534,
|
19482 |
+
"score": 0.45
|
19483 |
},
|
19484 |
{
|
19485 |
"name": "Turkish",
|
19486 |
"bcp_47": "tr",
|
19487 |
"population": 184476,
|
19488 |
+
"score": 0.44
|
19489 |
},
|
19490 |
{
|
19491 |
"name": "Polish",
|
|
|
19550 |
]
|
19551 |
},
|
19552 |
"UZ": {
|
19553 |
+
"score": 0.05701615696541229,
|
19554 |
"languages": [
|
19555 |
{
|
19556 |
"name": "Russian",
|
19557 |
"bcp_47": "ru",
|
19558 |
"population": 4279156,
|
19559 |
+
"score": 0.45
|
19560 |
},
|
19561 |
{
|
19562 |
"name": "Turkish",
|
19563 |
"bcp_47": "tr",
|
19564 |
"population": 232297,
|
19565 |
+
"score": 0.44
|
19566 |
},
|
19567 |
{
|
19568 |
"name": "Uzbek",
|
|
|
19579 |
]
|
19580 |
},
|
19581 |
"LI": {
|
19582 |
+
"score": 0.26022294592577516,
|
19583 |
"languages": [
|
19584 |
{
|
19585 |
"name": "German",
|
19586 |
"bcp_47": "de",
|
19587 |
"population": 39137,
|
19588 |
+
"score": 0.49
|
19589 |
},
|
19590 |
{
|
19591 |
"name": "Swiss German",
|
|
|
19602 |
]
|
19603 |
},
|
19604 |
"JP": {
|
19605 |
+
"score": 0.4560515108353953,
|
19606 |
"languages": [
|
19607 |
{
|
19608 |
"name": "Japanese",
|
19609 |
"bcp_47": "ja",
|
19610 |
"population": 119231650,
|
19611 |
+
"score": 0.46
|
19612 |
},
|
19613 |
{
|
19614 |
"name": "Korean",
|
19615 |
"bcp_47": "ko",
|
19616 |
"population": 652636,
|
19617 |
+
"score": 0.41
|
19618 |
},
|
19619 |
{
|
19620 |
"name": "Central Okinawan",
|
|
|
19625 |
]
|
19626 |
},
|
19627 |
"AF": {
|
19628 |
+
"score": 0.19133182400153392,
|
19629 |
"languages": [
|
19630 |
{
|
19631 |
"name": "Persian",
|
19632 |
"bcp_47": "fa",
|
19633 |
"population": 18321900,
|
19634 |
+
"score": 0.41
|
19635 |
},
|
19636 |
{
|
19637 |
"name": "Pashto",
|
|
|
19684 |
]
|
19685 |
},
|
19686 |
"MK": {
|
19687 |
+
"score": 0.016125668065966572,
|
19688 |
"languages": [
|
19689 |
{
|
19690 |
"name": "Turkish",
|
19691 |
"bcp_47": "tr",
|
19692 |
"population": 74409,
|
19693 |
+
"score": 0.44
|
19694 |
},
|
19695 |
{
|
19696 |
"name": "Albanian",
|
|
|
19707 |
]
|
19708 |
},
|
19709 |
"KP": {
|
19710 |
+
"score": 0.41,
|
19711 |
"languages": [
|
19712 |
{
|
19713 |
"name": "Korean",
|
19714 |
"bcp_47": "ko",
|
19715 |
"population": 22566280,
|
19716 |
+
"score": 0.41
|
19717 |
}
|
19718 |
]
|
19719 |
},
|
19720 |
"KR": {
|
19721 |
+
"score": 0.41,
|
19722 |
"languages": [
|
19723 |
{
|
19724 |
"name": "Korean",
|
19725 |
"bcp_47": "ko",
|
19726 |
"population": 51835100,
|
19727 |
+
"score": 0.41
|
19728 |
}
|
19729 |
]
|
19730 |
},
|
19731 |
"SM": {
|
19732 |
+
"score": 0.4654018916371436,
|
19733 |
"languages": [
|
19734 |
{
|
19735 |
"name": "Italian",
|
19736 |
"bcp_47": "it",
|
19737 |
"population": 30466,
|
19738 |
+
"score": 0.47
|
19739 |
},
|
19740 |
{
|
19741 |
"name": "Esperanto",
|
|
|
19746 |
]
|
19747 |
},
|
19748 |
"VA": {
|
19749 |
+
"score": 0.235,
|
19750 |
"languages": [
|
19751 |
{
|
19752 |
"name": "Italian",
|
19753 |
"bcp_47": "it",
|
19754 |
"population": 820,
|
19755 |
+
"score": 0.47
|
19756 |
},
|
19757 |
{
|
19758 |
"name": "Latin",
|
results.json
CHANGED
@@ -3,29 +3,29 @@
|
|
3 |
{
|
4 |
"task": "classification",
|
5 |
"metric": "accuracy",
|
6 |
-
"score": 0.
|
7 |
-
"bcp_47":
|
8 |
"model": 12
|
9 |
},
|
10 |
{
|
11 |
"task": "language_modeling",
|
12 |
"metric": "chrf",
|
13 |
-
"score": 0.
|
14 |
-
"bcp_47":
|
15 |
"model": 12
|
16 |
},
|
17 |
{
|
18 |
"task": "translation",
|
19 |
"metric": "bleu",
|
20 |
-
"score": 0.
|
21 |
-
"bcp_47":
|
22 |
"model": 12
|
23 |
},
|
24 |
{
|
25 |
"task": "translation",
|
26 |
"metric": "chrf",
|
27 |
-
"score": 0.
|
28 |
-
"bcp_47":
|
29 |
"model": 12
|
30 |
}
|
31 |
],
|
@@ -41,7 +41,7 @@
|
|
41 |
"model": "amazon/nova-micro-v1",
|
42 |
"task": "language_modeling",
|
43 |
"metric": "chrf",
|
44 |
-
"score": 0.
|
45 |
"bcp_47": 2
|
46 |
},
|
47 |
{
|
@@ -69,7 +69,7 @@
|
|
69 |
"model": "google/gemini-2.0-flash-001",
|
70 |
"task": "language_modeling",
|
71 |
"metric": "chrf",
|
72 |
-
"score": 0.
|
73 |
"bcp_47": 2
|
74 |
},
|
75 |
{
|
@@ -97,7 +97,7 @@
|
|
97 |
"model": "google/gemini-2.0-flash-lite-001",
|
98 |
"task": "language_modeling",
|
99 |
"metric": "chrf",
|
100 |
-
"score": 0.
|
101 |
"bcp_47": 2
|
102 |
},
|
103 |
{
|
@@ -125,7 +125,7 @@
|
|
125 |
"model": "google/gemma-3-27b-it",
|
126 |
"task": "language_modeling",
|
127 |
"metric": "chrf",
|
128 |
-
"score": 0.
|
129 |
"bcp_47": 2
|
130 |
},
|
131 |
{
|
@@ -153,7 +153,7 @@
|
|
153 |
"model": "meta-llama/llama-3-70b-instruct",
|
154 |
"task": "language_modeling",
|
155 |
"metric": "chrf",
|
156 |
-
"score": 0.
|
157 |
"bcp_47": 2
|
158 |
},
|
159 |
{
|
@@ -181,14 +181,14 @@
|
|
181 |
"model": "meta-llama/llama-3.1-70b-instruct",
|
182 |
"task": "language_modeling",
|
183 |
"metric": "chrf",
|
184 |
-
"score": 0.
|
185 |
"bcp_47": 2
|
186 |
},
|
187 |
{
|
188 |
"model": "meta-llama/llama-3.1-70b-instruct",
|
189 |
"task": "translation",
|
190 |
"metric": "bleu",
|
191 |
-
"score": 0.
|
192 |
"bcp_47": 2
|
193 |
},
|
194 |
{
|
@@ -202,29 +202,29 @@
|
|
202 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
203 |
"task": "classification",
|
204 |
"metric": "accuracy",
|
205 |
-
"score": 0.
|
206 |
-
"bcp_47":
|
207 |
},
|
208 |
{
|
209 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
210 |
"task": "language_modeling",
|
211 |
"metric": "chrf",
|
212 |
-
"score": 0.
|
213 |
-
"bcp_47":
|
214 |
},
|
215 |
{
|
216 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
217 |
"task": "translation",
|
218 |
"metric": "bleu",
|
219 |
-
"score": 0.
|
220 |
-
"bcp_47":
|
221 |
},
|
222 |
{
|
223 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
224 |
"task": "translation",
|
225 |
"metric": "chrf",
|
226 |
-
"score": 0.
|
227 |
-
"bcp_47":
|
228 |
},
|
229 |
{
|
230 |
"model": "microsoft/phi-4-multimodal-instruct",
|
@@ -237,7 +237,7 @@
|
|
237 |
"model": "microsoft/phi-4-multimodal-instruct",
|
238 |
"task": "language_modeling",
|
239 |
"metric": "chrf",
|
240 |
-
"score": 0.
|
241 |
"bcp_47": 2
|
242 |
},
|
243 |
{
|
@@ -265,7 +265,7 @@
|
|
265 |
"model": "mistralai/mistral-nemo",
|
266 |
"task": "language_modeling",
|
267 |
"metric": "chrf",
|
268 |
-
"score": 0.
|
269 |
"bcp_47": 2
|
270 |
},
|
271 |
{
|
@@ -293,7 +293,7 @@
|
|
293 |
"model": "mistralai/mistral-small-24b-instruct-2501",
|
294 |
"task": "language_modeling",
|
295 |
"metric": "chrf",
|
296 |
-
"score": 0.
|
297 |
"bcp_47": 2
|
298 |
},
|
299 |
{
|
@@ -321,7 +321,7 @@
|
|
321 |
"model": "openai/gpt-4o-mini",
|
322 |
"task": "language_modeling",
|
323 |
"metric": "chrf",
|
324 |
-
"score": 0.
|
325 |
"bcp_47": 2
|
326 |
},
|
327 |
{
|
@@ -349,7 +349,7 @@
|
|
349 |
"model": "qwen/qwq-32b",
|
350 |
"task": "language_modeling",
|
351 |
"metric": "chrf",
|
352 |
-
"score": 0.
|
353 |
"bcp_47": 2
|
354 |
},
|
355 |
{
|
@@ -701,7 +701,7 @@
|
|
701 |
"in_benchmark": true,
|
702 |
"task": "language_modeling",
|
703 |
"metric": "chrf",
|
704 |
-
"score": 0.
|
705 |
"model": 1.0
|
706 |
},
|
707 |
{
|
@@ -827,10 +827,58 @@
|
|
827 |
"commonvoice_hours": null,
|
828 |
"commonvoice_locale": null,
|
829 |
"in_benchmark": true,
|
830 |
-
"task":
|
831 |
-
"metric":
|
832 |
-
"score":
|
833 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
834 |
},
|
835 |
{
|
836 |
"bcp_47": "as",
|
@@ -1613,7 +1661,7 @@
|
|
1613 |
"in_benchmark": true,
|
1614 |
"task": "language_modeling",
|
1615 |
"metric": "chrf",
|
1616 |
-
"score": 0.
|
1617 |
"model": 1.0
|
1618 |
},
|
1619 |
{
|
@@ -1992,7 +2040,7 @@
|
|
1992 |
"family": "Indo-European",
|
1993 |
"flores_path": "cat_Latn",
|
1994 |
"fleurs_tag": "ca_es",
|
1995 |
-
"commonvoice_hours":
|
1996 |
"commonvoice_locale": "ca",
|
1997 |
"in_benchmark": true,
|
1998 |
"task": null,
|
@@ -2587,10 +2635,58 @@
|
|
2587 |
"commonvoice_hours": 1360.0,
|
2588 |
"commonvoice_locale": "de",
|
2589 |
"in_benchmark": true,
|
2590 |
-
"task":
|
2591 |
-
"metric":
|
2592 |
-
"score":
|
2593 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2594 |
},
|
2595 |
{
|
2596 |
"bcp_47": "den",
|
@@ -2925,7 +3021,7 @@
|
|
2925 |
"in_benchmark": true,
|
2926 |
"task": "language_modeling",
|
2927 |
"metric": "chrf",
|
2928 |
-
"score": 0.
|
2929 |
"model": 12.0
|
2930 |
},
|
2931 |
{
|
@@ -2941,7 +3037,7 @@
|
|
2941 |
"in_benchmark": true,
|
2942 |
"task": "translation",
|
2943 |
"metric": "bleu",
|
2944 |
-
"score": 0.
|
2945 |
"model": 12.0
|
2946 |
},
|
2947 |
{
|
@@ -3005,7 +3101,7 @@
|
|
3005 |
"in_benchmark": true,
|
3006 |
"task": "language_modeling",
|
3007 |
"metric": "chrf",
|
3008 |
-
"score": 0.
|
3009 |
"model": 1.0
|
3010 |
},
|
3011 |
{
|
@@ -3080,7 +3176,7 @@
|
|
3080 |
"family": null,
|
3081 |
"flores_path": "eus_Latn",
|
3082 |
"fleurs_tag": null,
|
3083 |
-
"commonvoice_hours":
|
3084 |
"commonvoice_locale": "eu",
|
3085 |
"in_benchmark": true,
|
3086 |
"task": null,
|
@@ -3131,10 +3227,58 @@
|
|
3131 |
"commonvoice_hours": 370.0,
|
3132 |
"commonvoice_locale": "fa",
|
3133 |
"in_benchmark": true,
|
3134 |
-
"task":
|
3135 |
-
"metric":
|
3136 |
-
"score":
|
3137 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3138 |
},
|
3139 |
{
|
3140 |
"bcp_47": "fan",
|
@@ -3243,10 +3387,58 @@
|
|
3243 |
"commonvoice_hours": 0.0,
|
3244 |
"commonvoice_locale": "tl",
|
3245 |
"in_benchmark": true,
|
3246 |
-
"task":
|
3247 |
-
"metric":
|
3248 |
-
"score":
|
3249 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3250 |
},
|
3251 |
{
|
3252 |
"bcp_47": "fit",
|
@@ -3341,7 +3533,7 @@
|
|
3341 |
"in_benchmark": true,
|
3342 |
"task": "language_modeling",
|
3343 |
"metric": "chrf",
|
3344 |
-
"score": 0.
|
3345 |
"model": 1.0
|
3346 |
},
|
3347 |
{
|
@@ -3544,7 +3736,7 @@
|
|
3544 |
"family": "Indo-European",
|
3545 |
"flores_path": "gle_Latn",
|
3546 |
"fleurs_tag": "ga_ie",
|
3547 |
-
"commonvoice_hours":
|
3548 |
"commonvoice_locale": "ga-IE",
|
3549 |
"in_benchmark": true,
|
3550 |
"task": null,
|
@@ -3899,36 +4091,84 @@
|
|
3899 |
"commonvoice_hours": 0.0,
|
3900 |
"commonvoice_locale": "gu-IN",
|
3901 |
"in_benchmark": true,
|
3902 |
-
"task":
|
3903 |
-
"metric":
|
3904 |
-
"score":
|
3905 |
-
"model":
|
3906 |
},
|
3907 |
{
|
3908 |
-
"bcp_47": "
|
3909 |
-
"speakers":
|
3910 |
-
"language_name": "
|
3911 |
-
"autonym": "
|
3912 |
-
"family": "
|
3913 |
-
"flores_path":
|
3914 |
-
"fleurs_tag":
|
3915 |
-
"commonvoice_hours":
|
3916 |
-
"commonvoice_locale":
|
3917 |
-
"in_benchmark":
|
3918 |
-
"task":
|
3919 |
-
"metric":
|
3920 |
-
"score":
|
3921 |
-
"model":
|
3922 |
},
|
3923 |
{
|
3924 |
-
"bcp_47": "
|
3925 |
-
"speakers":
|
3926 |
-
"language_name": "
|
3927 |
-
"autonym": "
|
3928 |
-
"family": "
|
3929 |
-
"flores_path":
|
3930 |
-
"fleurs_tag":
|
3931 |
-
"commonvoice_hours": 0.0,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3932 |
"commonvoice_locale": "guc",
|
3933 |
"in_benchmark": false,
|
3934 |
"task": null,
|
@@ -4125,7 +4365,7 @@
|
|
4125 |
"in_benchmark": true,
|
4126 |
"task": "language_modeling",
|
4127 |
"metric": "chrf",
|
4128 |
-
"score": 0.
|
4129 |
"model": 1.0
|
4130 |
},
|
4131 |
{
|
@@ -4507,10 +4747,58 @@
|
|
4507 |
"commonvoice_hours": 33.0,
|
4508 |
"commonvoice_locale": "id",
|
4509 |
"in_benchmark": true,
|
4510 |
-
"task":
|
4511 |
-
"metric":
|
4512 |
-
"score":
|
4513 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4514 |
},
|
4515 |
{
|
4516 |
"bcp_47": "ie",
|
@@ -4667,10 +4955,58 @@
|
|
4667 |
"commonvoice_hours": 362.0,
|
4668 |
"commonvoice_locale": "it",
|
4669 |
"in_benchmark": true,
|
4670 |
-
"task":
|
4671 |
-
"metric":
|
4672 |
-
"score":
|
4673 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4674 |
},
|
4675 |
{
|
4676 |
"bcp_47": "iu",
|
@@ -4715,10 +5051,58 @@
|
|
4715 |
"commonvoice_hours": 222.0,
|
4716 |
"commonvoice_locale": "ja",
|
4717 |
"in_benchmark": true,
|
4718 |
-
"task":
|
4719 |
-
"metric":
|
4720 |
-
"score":
|
4721 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4722 |
},
|
4723 |
{
|
4724 |
"bcp_47": "jam",
|
@@ -4827,39 +5211,87 @@
|
|
4827 |
"commonvoice_hours": 0.0,
|
4828 |
"commonvoice_locale": "jv",
|
4829 |
"in_benchmark": true,
|
4830 |
-
"task":
|
4831 |
-
"metric":
|
4832 |
-
"score":
|
4833 |
-
"model":
|
4834 |
},
|
4835 |
{
|
4836 |
-
"bcp_47": "
|
4837 |
-
"speakers":
|
4838 |
-
"language_name": "
|
4839 |
-
"autonym": "
|
4840 |
-
"family": "
|
4841 |
-
"flores_path": "
|
4842 |
-
"fleurs_tag": "
|
4843 |
-
"commonvoice_hours":
|
4844 |
-
"commonvoice_locale": "
|
4845 |
"in_benchmark": true,
|
4846 |
-
"task":
|
4847 |
-
"metric":
|
4848 |
-
"score":
|
4849 |
-
"model":
|
4850 |
},
|
4851 |
{
|
4852 |
-
"bcp_47": "
|
4853 |
-
"speakers":
|
4854 |
-
"language_name": "
|
4855 |
-
"autonym": "
|
4856 |
-
"family": "
|
4857 |
-
"flores_path":
|
4858 |
-
"fleurs_tag":
|
4859 |
-
"commonvoice_hours": 0.0,
|
4860 |
-
"commonvoice_locale": "
|
4861 |
-
"in_benchmark":
|
4862 |
-
"task":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4863 |
"metric": null,
|
4864 |
"score": null,
|
4865 |
"model": null
|
@@ -4952,7 +5384,7 @@
|
|
4952 |
"family": "Abkhaz-Adyge",
|
4953 |
"flores_path": null,
|
4954 |
"fleurs_tag": null,
|
4955 |
-
"commonvoice_hours":
|
4956 |
"commonvoice_locale": "kbd",
|
4957 |
"in_benchmark": false,
|
4958 |
"task": null,
|
@@ -5451,10 +5883,58 @@
|
|
5451 |
"commonvoice_hours": 1.7,
|
5452 |
"commonvoice_locale": "ko",
|
5453 |
"in_benchmark": true,
|
5454 |
-
"task":
|
5455 |
-
"metric":
|
5456 |
-
"score":
|
5457 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5458 |
},
|
5459 |
{
|
5460 |
"bcp_47": "koi",
|
@@ -5752,7 +6232,7 @@
|
|
5752 |
"family": "Indo-European",
|
5753 |
"flores_path": null,
|
5754 |
"fleurs_tag": null,
|
5755 |
-
"commonvoice_hours":
|
5756 |
"commonvoice_locale": "kw",
|
5757 |
"in_benchmark": false,
|
5758 |
"task": null,
|
@@ -6872,7 +7352,7 @@
|
|
6872 |
"family": "Indo-European",
|
6873 |
"flores_path": "mkd_Cyrl",
|
6874 |
"fleurs_tag": "mk_mk",
|
6875 |
-
"commonvoice_hours":
|
6876 |
"commonvoice_locale": "mk",
|
6877 |
"in_benchmark": true,
|
6878 |
"task": null,
|
@@ -7019,10 +7499,58 @@
|
|
7019 |
"commonvoice_hours": 20.0,
|
7020 |
"commonvoice_locale": "mr",
|
7021 |
"in_benchmark": true,
|
7022 |
-
"task":
|
7023 |
-
"metric":
|
7024 |
-
"score":
|
7025 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7026 |
},
|
7027 |
{
|
7028 |
"bcp_47": "mrd",
|
@@ -7976,7 +8504,7 @@
|
|
7976 |
"family": "Indo-European",
|
7977 |
"flores_path": null,
|
7978 |
"fleurs_tag": null,
|
7979 |
-
"commonvoice_hours": 0.
|
7980 |
"commonvoice_locale": "os",
|
7981 |
"in_benchmark": false,
|
7982 |
"task": null,
|
@@ -8029,7 +8557,7 @@
|
|
8029 |
"in_benchmark": true,
|
8030 |
"task": "language_modeling",
|
8031 |
"metric": "chrf",
|
8032 |
-
"score": 0.
|
8033 |
"model": 1.0
|
8034 |
},
|
8035 |
{
|
@@ -8397,7 +8925,7 @@
|
|
8397 |
"in_benchmark": true,
|
8398 |
"task": "language_modeling",
|
8399 |
"metric": "chrf",
|
8400 |
-
"score": 0.
|
8401 |
"model": 1.0
|
8402 |
},
|
8403 |
{
|
@@ -8824,13 +9352,61 @@
|
|
8824 |
"family": "Indo-European",
|
8825 |
"flores_path": "rus_Cyrl",
|
8826 |
"fleurs_tag": "ru_ru",
|
8827 |
-
"commonvoice_hours":
|
8828 |
"commonvoice_locale": "ru",
|
8829 |
"in_benchmark": true,
|
8830 |
-
"task":
|
8831 |
-
"metric":
|
8832 |
-
"score":
|
8833 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8834 |
},
|
8835 |
{
|
8836 |
"bcp_47": "rue",
|
@@ -9224,7 +9800,7 @@
|
|
9224 |
"family": null,
|
9225 |
"flores_path": null,
|
9226 |
"fleurs_tag": null,
|
9227 |
-
"commonvoice_hours":
|
9228 |
"commonvoice_locale": "sei",
|
9229 |
"in_benchmark": false,
|
9230 |
"task": null,
|
@@ -9803,32 +10379,80 @@
|
|
9803 |
"commonvoice_hours": 411.0,
|
9804 |
"commonvoice_locale": "sw",
|
9805 |
"in_benchmark": true,
|
9806 |
-
"task":
|
9807 |
-
"metric":
|
9808 |
-
"score":
|
9809 |
-
"model":
|
9810 |
},
|
9811 |
{
|
9812 |
-
"bcp_47": "
|
9813 |
-
"speakers":
|
9814 |
-
"language_name": "
|
9815 |
-
"autonym": "
|
9816 |
"family": "Atlantic-Congo",
|
9817 |
-
"flores_path":
|
9818 |
-
"fleurs_tag":
|
9819 |
-
"commonvoice_hours":
|
9820 |
-
"commonvoice_locale":
|
9821 |
-
"in_benchmark":
|
9822 |
-
"task":
|
9823 |
-
"metric":
|
9824 |
-
"score":
|
9825 |
-
"model":
|
9826 |
},
|
9827 |
{
|
9828 |
-
"bcp_47": "
|
9829 |
-
"speakers":
|
9830 |
-
"language_name": "
|
9831 |
-
"autonym": "
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
9832 |
"family": "Indo-European",
|
9833 |
"flores_path": null,
|
9834 |
"fleurs_tag": null,
|
@@ -9931,10 +10555,58 @@
|
|
9931 |
"commonvoice_hours": 234.0,
|
9932 |
"commonvoice_locale": "ta",
|
9933 |
"in_benchmark": true,
|
9934 |
-
"task":
|
9935 |
-
"metric":
|
9936 |
-
"score":
|
9937 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
9938 |
},
|
9939 |
{
|
9940 |
"bcp_47": "taj",
|
@@ -10043,10 +10715,58 @@
|
|
10043 |
"commonvoice_hours": 0.3,
|
10044 |
"commonvoice_locale": "te",
|
10045 |
"in_benchmark": true,
|
10046 |
-
"task":
|
10047 |
-
"metric":
|
10048 |
-
"score":
|
10049 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10050 |
},
|
10051 |
{
|
10052 |
"bcp_47": "tem",
|
@@ -10411,10 +11131,58 @@
|
|
10411 |
"commonvoice_hours": 128.0,
|
10412 |
"commonvoice_locale": "tr",
|
10413 |
"in_benchmark": true,
|
10414 |
-
"task":
|
10415 |
-
"metric":
|
10416 |
-
"score":
|
10417 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10418 |
},
|
10419 |
{
|
10420 |
"bcp_47": "tru",
|
@@ -10829,7 +11597,7 @@
|
|
10829 |
"in_benchmark": true,
|
10830 |
"task": "language_modeling",
|
10831 |
"metric": "chrf",
|
10832 |
-
"score": 0.
|
10833 |
"model": 1.0
|
10834 |
},
|
10835 |
{
|
@@ -10845,7 +11613,7 @@
|
|
10845 |
"in_benchmark": true,
|
10846 |
"task": "translation",
|
10847 |
"metric": "bleu",
|
10848 |
-
"score": 0.
|
10849 |
"model": 1.0
|
10850 |
},
|
10851 |
{
|
@@ -10955,42 +11723,90 @@
|
|
10955 |
"commonvoice_hours": 6.0,
|
10956 |
"commonvoice_locale": "vi",
|
10957 |
"in_benchmark": true,
|
10958 |
-
"task":
|
10959 |
-
"metric":
|
10960 |
-
"score":
|
10961 |
-
"model":
|
10962 |
},
|
10963 |
{
|
10964 |
-
"bcp_47": "
|
10965 |
-
"speakers":
|
10966 |
-
"language_name": "
|
10967 |
-
"autonym": "
|
10968 |
-
"family": "
|
10969 |
-
"flores_path":
|
10970 |
-
"fleurs_tag":
|
10971 |
-
"commonvoice_hours":
|
10972 |
-
"commonvoice_locale":
|
10973 |
-
"in_benchmark":
|
10974 |
-
"task":
|
10975 |
-
"metric":
|
10976 |
-
"score":
|
10977 |
-
"model":
|
10978 |
},
|
10979 |
{
|
10980 |
-
"bcp_47": "
|
10981 |
-
"speakers":
|
10982 |
-
"language_name": "
|
10983 |
-
"autonym": "
|
10984 |
-
"family": "
|
10985 |
-
"flores_path":
|
10986 |
-
"fleurs_tag":
|
10987 |
-
"commonvoice_hours":
|
10988 |
-
"commonvoice_locale":
|
10989 |
-
"in_benchmark":
|
10990 |
-
"task":
|
10991 |
-
"metric":
|
10992 |
-
"score":
|
10993 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10994 |
},
|
10995 |
{
|
10996 |
"bcp_47": "vmf",
|
@@ -11499,10 +12315,58 @@
|
|
11499 |
"commonvoice_hours": 203.0,
|
11500 |
"commonvoice_locale": "yue",
|
11501 |
"in_benchmark": true,
|
11502 |
-
"task":
|
11503 |
-
"metric":
|
11504 |
-
"score":
|
11505 |
-
"model":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
11506 |
},
|
11507 |
{
|
11508 |
"bcp_47": "za",
|
@@ -11613,7 +12477,7 @@
|
|
11613 |
"in_benchmark": true,
|
11614 |
"task": "language_modeling",
|
11615 |
"metric": "chrf",
|
11616 |
-
"score": 0.
|
11617 |
"model": 12.0
|
11618 |
},
|
11619 |
{
|
@@ -11711,7 +12575,7 @@
|
|
11711 |
"bcp_47": "en",
|
11712 |
"task": "language_modeling",
|
11713 |
"metric": "chrf",
|
11714 |
-
"score": 0.
|
11715 |
"sentence_nr": 14.5
|
11716 |
},
|
11717 |
{
|
@@ -11743,7 +12607,7 @@
|
|
11743 |
"bcp_47": "zh",
|
11744 |
"task": "language_modeling",
|
11745 |
"metric": "chrf",
|
11746 |
-
"score": 0.
|
11747 |
"sentence_nr": 14.5
|
11748 |
},
|
11749 |
{
|
@@ -11775,7 +12639,7 @@
|
|
11775 |
"bcp_47": "en",
|
11776 |
"task": "language_modeling",
|
11777 |
"metric": "chrf",
|
11778 |
-
"score": 0.
|
11779 |
"sentence_nr": 14.5
|
11780 |
},
|
11781 |
{
|
@@ -11807,7 +12671,7 @@
|
|
11807 |
"bcp_47": "zh",
|
11808 |
"task": "language_modeling",
|
11809 |
"metric": "chrf",
|
11810 |
-
"score": 0.
|
11811 |
"sentence_nr": 14.5
|
11812 |
},
|
11813 |
{
|
@@ -11839,7 +12703,7 @@
|
|
11839 |
"bcp_47": "en",
|
11840 |
"task": "language_modeling",
|
11841 |
"metric": "chrf",
|
11842 |
-
"score": 0.
|
11843 |
"sentence_nr": 14.5
|
11844 |
},
|
11845 |
{
|
@@ -11871,7 +12735,7 @@
|
|
11871 |
"bcp_47": "zh",
|
11872 |
"task": "language_modeling",
|
11873 |
"metric": "chrf",
|
11874 |
-
"score": 0.
|
11875 |
"sentence_nr": 14.5
|
11876 |
},
|
11877 |
{
|
@@ -11903,7 +12767,7 @@
|
|
11903 |
"bcp_47": "en",
|
11904 |
"task": "language_modeling",
|
11905 |
"metric": "chrf",
|
11906 |
-
"score": 0.
|
11907 |
"sentence_nr": 14.5
|
11908 |
},
|
11909 |
{
|
@@ -11935,7 +12799,7 @@
|
|
11935 |
"bcp_47": "zh",
|
11936 |
"task": "language_modeling",
|
11937 |
"metric": "chrf",
|
11938 |
-
"score": 0.
|
11939 |
"sentence_nr": 14.5
|
11940 |
},
|
11941 |
{
|
@@ -11967,7 +12831,7 @@
|
|
11967 |
"bcp_47": "en",
|
11968 |
"task": "language_modeling",
|
11969 |
"metric": "chrf",
|
11970 |
-
"score": 0.
|
11971 |
"sentence_nr": 14.5
|
11972 |
},
|
11973 |
{
|
@@ -11999,7 +12863,7 @@
|
|
11999 |
"bcp_47": "zh",
|
12000 |
"task": "language_modeling",
|
12001 |
"metric": "chrf",
|
12002 |
-
"score": 0.
|
12003 |
"sentence_nr": 14.5
|
12004 |
},
|
12005 |
{
|
@@ -12031,7 +12895,7 @@
|
|
12031 |
"bcp_47": "en",
|
12032 |
"task": "language_modeling",
|
12033 |
"metric": "chrf",
|
12034 |
-
"score": 0.
|
12035 |
"sentence_nr": 14.5
|
12036 |
},
|
12037 |
{
|
@@ -12039,7 +12903,7 @@
|
|
12039 |
"bcp_47": "en",
|
12040 |
"task": "translation",
|
12041 |
"metric": "bleu",
|
12042 |
-
"score": 0.
|
12043 |
"sentence_nr": 14.5
|
12044 |
},
|
12045 |
{
|
@@ -12063,7 +12927,7 @@
|
|
12063 |
"bcp_47": "zh",
|
12064 |
"task": "language_modeling",
|
12065 |
"metric": "chrf",
|
12066 |
-
"score": 0.
|
12067 |
"sentence_nr": 14.5
|
12068 |
},
|
12069 |
{
|
@@ -12095,7 +12959,7 @@
|
|
12095 |
"bcp_47": "ar",
|
12096 |
"task": "language_modeling",
|
12097 |
"metric": "chrf",
|
12098 |
-
"score": 0.
|
12099 |
"sentence_nr": 14.5
|
12100 |
},
|
12101 |
{
|
@@ -12114,6 +12978,38 @@
|
|
12114 |
"score": 0.4684314458952127,
|
12115 |
"sentence_nr": 14.5
|
12116 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12117 |
{
|
12118 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12119 |
"bcp_47": "bn",
|
@@ -12127,7 +13023,7 @@
|
|
12127 |
"bcp_47": "bn",
|
12128 |
"task": "language_modeling",
|
12129 |
"metric": "chrf",
|
12130 |
-
"score": 0.
|
12131 |
"sentence_nr": 14.5
|
12132 |
},
|
12133 |
{
|
@@ -12146,6 +13042,38 @@
|
|
12146 |
"score": 0.4076175886917154,
|
12147 |
"sentence_nr": 14.5
|
12148 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12149 |
{
|
12150 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12151 |
"bcp_47": "en",
|
@@ -12159,7 +13087,7 @@
|
|
12159 |
"bcp_47": "en",
|
12160 |
"task": "language_modeling",
|
12161 |
"metric": "chrf",
|
12162 |
-
"score": 0.
|
12163 |
"sentence_nr": 14.5
|
12164 |
},
|
12165 |
{
|
@@ -12191,7 +13119,7 @@
|
|
12191 |
"bcp_47": "es",
|
12192 |
"task": "language_modeling",
|
12193 |
"metric": "chrf",
|
12194 |
-
"score": 0.
|
12195 |
"sentence_nr": 14.5
|
12196 |
},
|
12197 |
{
|
@@ -12212,162 +13140,674 @@
|
|
12212 |
},
|
12213 |
{
|
12214 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12215 |
-
"bcp_47": "
|
12216 |
"task": "classification",
|
12217 |
"metric": "accuracy",
|
12218 |
-
"score": 0.
|
12219 |
"sentence_nr": 14.5
|
12220 |
},
|
12221 |
{
|
12222 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12223 |
-
"bcp_47": "
|
12224 |
"task": "language_modeling",
|
12225 |
"metric": "chrf",
|
12226 |
-
"score": 0.
|
12227 |
"sentence_nr": 14.5
|
12228 |
},
|
12229 |
{
|
12230 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12231 |
-
"bcp_47": "
|
12232 |
"task": "translation",
|
12233 |
"metric": "bleu",
|
12234 |
-
"score": 0.
|
12235 |
"sentence_nr": 14.5
|
12236 |
},
|
12237 |
{
|
12238 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12239 |
-
"bcp_47": "
|
12240 |
"task": "translation",
|
12241 |
"metric": "chrf",
|
12242 |
-
"score": 0.
|
12243 |
"sentence_nr": 14.5
|
12244 |
},
|
12245 |
{
|
12246 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12247 |
-
"bcp_47": "
|
12248 |
"task": "classification",
|
12249 |
"metric": "accuracy",
|
12250 |
-
"score": 0.
|
12251 |
"sentence_nr": 14.5
|
12252 |
},
|
12253 |
{
|
12254 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12255 |
-
"bcp_47": "
|
12256 |
"task": "language_modeling",
|
12257 |
"metric": "chrf",
|
12258 |
-
"score": 0.
|
12259 |
"sentence_nr": 14.5
|
12260 |
},
|
12261 |
{
|
12262 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12263 |
-
"bcp_47": "
|
12264 |
"task": "translation",
|
12265 |
"metric": "bleu",
|
12266 |
-
"score": 0.
|
12267 |
"sentence_nr": 14.5
|
12268 |
},
|
12269 |
{
|
12270 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12271 |
-
"bcp_47": "
|
12272 |
"task": "translation",
|
12273 |
"metric": "chrf",
|
12274 |
-
"score": 0.
|
12275 |
"sentence_nr": 14.5
|
12276 |
},
|
12277 |
{
|
12278 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12279 |
-
"bcp_47": "
|
12280 |
"task": "classification",
|
12281 |
"metric": "accuracy",
|
12282 |
-
"score": 0.
|
12283 |
"sentence_nr": 14.5
|
12284 |
},
|
12285 |
{
|
12286 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12287 |
-
"bcp_47": "
|
12288 |
"task": "language_modeling",
|
12289 |
"metric": "chrf",
|
12290 |
-
"score": 0.
|
12291 |
"sentence_nr": 14.5
|
12292 |
},
|
12293 |
{
|
12294 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12295 |
-
"bcp_47": "
|
12296 |
"task": "translation",
|
12297 |
"metric": "bleu",
|
12298 |
-
"score": 0.
|
12299 |
"sentence_nr": 14.5
|
12300 |
},
|
12301 |
{
|
12302 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12303 |
-
"bcp_47": "
|
12304 |
"task": "translation",
|
12305 |
"metric": "chrf",
|
12306 |
-
"score": 0.
|
12307 |
"sentence_nr": 14.5
|
12308 |
},
|
12309 |
{
|
12310 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12311 |
-
"bcp_47": "
|
12312 |
"task": "classification",
|
12313 |
"metric": "accuracy",
|
12314 |
-
"score": 0.
|
12315 |
"sentence_nr": 14.5
|
12316 |
},
|
12317 |
{
|
12318 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12319 |
-
"bcp_47": "
|
12320 |
"task": "language_modeling",
|
12321 |
"metric": "chrf",
|
12322 |
-
"score": 0.
|
12323 |
"sentence_nr": 14.5
|
12324 |
},
|
12325 |
{
|
12326 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12327 |
-
"bcp_47": "
|
12328 |
"task": "translation",
|
12329 |
"metric": "bleu",
|
12330 |
-
"score": 0.
|
12331 |
"sentence_nr": 14.5
|
12332 |
},
|
12333 |
{
|
12334 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12335 |
-
"bcp_47": "
|
12336 |
"task": "translation",
|
12337 |
"metric": "chrf",
|
12338 |
-
"score": 0.
|
12339 |
"sentence_nr": 14.5
|
12340 |
},
|
12341 |
{
|
12342 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12343 |
-
"bcp_47": "
|
12344 |
"task": "classification",
|
12345 |
"metric": "accuracy",
|
12346 |
-
"score": 0.
|
12347 |
"sentence_nr": 14.5
|
12348 |
},
|
12349 |
{
|
12350 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12351 |
-
"bcp_47": "
|
12352 |
"task": "language_modeling",
|
12353 |
"metric": "chrf",
|
12354 |
-
"score": 0.
|
12355 |
"sentence_nr": 14.5
|
12356 |
},
|
12357 |
{
|
12358 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12359 |
-
"bcp_47": "
|
12360 |
"task": "translation",
|
12361 |
"metric": "bleu",
|
12362 |
-
"score": 0.
|
12363 |
"sentence_nr": 14.5
|
12364 |
},
|
12365 |
{
|
12366 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
12367 |
-
"bcp_47": "
|
12368 |
"task": "translation",
|
12369 |
"metric": "chrf",
|
12370 |
-
"score": 0.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
12371 |
"sentence_nr": 14.5
|
12372 |
},
|
12373 |
{
|
@@ -12383,7 +13823,7 @@
|
|
12383 |
"bcp_47": "zh",
|
12384 |
"task": "language_modeling",
|
12385 |
"metric": "chrf",
|
12386 |
-
"score": 0.
|
12387 |
"sentence_nr": 14.5
|
12388 |
},
|
12389 |
{
|
@@ -12415,7 +13855,7 @@
|
|
12415 |
"bcp_47": "en",
|
12416 |
"task": "language_modeling",
|
12417 |
"metric": "chrf",
|
12418 |
-
"score": 0.
|
12419 |
"sentence_nr": 14.5
|
12420 |
},
|
12421 |
{
|
@@ -12447,7 +13887,7 @@
|
|
12447 |
"bcp_47": "zh",
|
12448 |
"task": "language_modeling",
|
12449 |
"metric": "chrf",
|
12450 |
-
"score": 0.
|
12451 |
"sentence_nr": 14.5
|
12452 |
},
|
12453 |
{
|
@@ -12479,7 +13919,7 @@
|
|
12479 |
"bcp_47": "en",
|
12480 |
"task": "language_modeling",
|
12481 |
"metric": "chrf",
|
12482 |
-
"score": 0.
|
12483 |
"sentence_nr": 14.5
|
12484 |
},
|
12485 |
{
|
@@ -12511,7 +13951,7 @@
|
|
12511 |
"bcp_47": "zh",
|
12512 |
"task": "language_modeling",
|
12513 |
"metric": "chrf",
|
12514 |
-
"score": 0.
|
12515 |
"sentence_nr": 14.5
|
12516 |
},
|
12517 |
{
|
@@ -12543,7 +13983,7 @@
|
|
12543 |
"bcp_47": "en",
|
12544 |
"task": "language_modeling",
|
12545 |
"metric": "chrf",
|
12546 |
-
"score": 0.
|
12547 |
"sentence_nr": 14.5
|
12548 |
},
|
12549 |
{
|
@@ -12575,7 +14015,7 @@
|
|
12575 |
"bcp_47": "zh",
|
12576 |
"task": "language_modeling",
|
12577 |
"metric": "chrf",
|
12578 |
-
"score": 0.
|
12579 |
"sentence_nr": 14.5
|
12580 |
},
|
12581 |
{
|
@@ -12607,7 +14047,7 @@
|
|
12607 |
"bcp_47": "en",
|
12608 |
"task": "language_modeling",
|
12609 |
"metric": "chrf",
|
12610 |
-
"score": 0.
|
12611 |
"sentence_nr": 14.5
|
12612 |
},
|
12613 |
{
|
@@ -12639,7 +14079,7 @@
|
|
12639 |
"bcp_47": "zh",
|
12640 |
"task": "language_modeling",
|
12641 |
"metric": "chrf",
|
12642 |
-
"score": 0.
|
12643 |
"sentence_nr": 14.5
|
12644 |
},
|
12645 |
{
|
@@ -12671,7 +14111,7 @@
|
|
12671 |
"bcp_47": "en",
|
12672 |
"task": "language_modeling",
|
12673 |
"metric": "chrf",
|
12674 |
-
"score": 0.
|
12675 |
"sentence_nr": 14.5
|
12676 |
},
|
12677 |
{
|
@@ -12703,7 +14143,7 @@
|
|
12703 |
"bcp_47": "zh",
|
12704 |
"task": "language_modeling",
|
12705 |
"metric": "chrf",
|
12706 |
-
"score": 0.
|
12707 |
"sentence_nr": 14.5
|
12708 |
},
|
12709 |
{
|
|
|
3 |
{
|
4 |
"task": "classification",
|
5 |
"metric": "accuracy",
|
6 |
+
"score": 0.5353333333333333,
|
7 |
+
"bcp_47": 28,
|
8 |
"model": 12
|
9 |
},
|
10 |
{
|
11 |
"task": "language_modeling",
|
12 |
"metric": "chrf",
|
13 |
+
"score": 0.9172787041570468,
|
14 |
+
"bcp_47": 28,
|
15 |
"model": 12
|
16 |
},
|
17 |
{
|
18 |
"task": "translation",
|
19 |
"metric": "bleu",
|
20 |
+
"score": 0.31440758611811165,
|
21 |
+
"bcp_47": 28,
|
22 |
"model": 12
|
23 |
},
|
24 |
{
|
25 |
"task": "translation",
|
26 |
"metric": "chrf",
|
27 |
+
"score": 0.4776446463431595,
|
28 |
+
"bcp_47": 28,
|
29 |
"model": 12
|
30 |
}
|
31 |
],
|
|
|
41 |
"model": "amazon/nova-micro-v1",
|
42 |
"task": "language_modeling",
|
43 |
"metric": "chrf",
|
44 |
+
"score": 0.9358428899682786,
|
45 |
"bcp_47": 2
|
46 |
},
|
47 |
{
|
|
|
69 |
"model": "google/gemini-2.0-flash-001",
|
70 |
"task": "language_modeling",
|
71 |
"metric": "chrf",
|
72 |
+
"score": 0.9585325034195884,
|
73 |
"bcp_47": 2
|
74 |
},
|
75 |
{
|
|
|
97 |
"model": "google/gemini-2.0-flash-lite-001",
|
98 |
"task": "language_modeling",
|
99 |
"metric": "chrf",
|
100 |
+
"score": 0.9574729426945592,
|
101 |
"bcp_47": 2
|
102 |
},
|
103 |
{
|
|
|
125 |
"model": "google/gemma-3-27b-it",
|
126 |
"task": "language_modeling",
|
127 |
"metric": "chrf",
|
128 |
+
"score": 0.9402106879094536,
|
129 |
"bcp_47": 2
|
130 |
},
|
131 |
{
|
|
|
153 |
"model": "meta-llama/llama-3-70b-instruct",
|
154 |
"task": "language_modeling",
|
155 |
"metric": "chrf",
|
156 |
+
"score": 0.9555990324827045,
|
157 |
"bcp_47": 2
|
158 |
},
|
159 |
{
|
|
|
181 |
"model": "meta-llama/llama-3.1-70b-instruct",
|
182 |
"task": "language_modeling",
|
183 |
"metric": "chrf",
|
184 |
+
"score": 0.9458265879125298,
|
185 |
"bcp_47": 2
|
186 |
},
|
187 |
{
|
188 |
"model": "meta-llama/llama-3.1-70b-instruct",
|
189 |
"task": "translation",
|
190 |
"metric": "bleu",
|
191 |
+
"score": 0.4318584195195329,
|
192 |
"bcp_47": 2
|
193 |
},
|
194 |
{
|
|
|
202 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
203 |
"task": "classification",
|
204 |
"metric": "accuracy",
|
205 |
+
"score": 0.5142857142857143,
|
206 |
+
"bcp_47": 28
|
207 |
},
|
208 |
{
|
209 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
210 |
"task": "language_modeling",
|
211 |
"metric": "chrf",
|
212 |
+
"score": 0.9422717613037961,
|
213 |
+
"bcp_47": 28
|
214 |
},
|
215 |
{
|
216 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
217 |
"task": "translation",
|
218 |
"metric": "bleu",
|
219 |
+
"score": 0.28045810258852616,
|
220 |
+
"bcp_47": 28
|
221 |
},
|
222 |
{
|
223 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
224 |
"task": "translation",
|
225 |
"metric": "chrf",
|
226 |
+
"score": 0.45694310450071773,
|
227 |
+
"bcp_47": 28
|
228 |
},
|
229 |
{
|
230 |
"model": "microsoft/phi-4-multimodal-instruct",
|
|
|
237 |
"model": "microsoft/phi-4-multimodal-instruct",
|
238 |
"task": "language_modeling",
|
239 |
"metric": "chrf",
|
240 |
+
"score": 0.8811352896333067,
|
241 |
"bcp_47": 2
|
242 |
},
|
243 |
{
|
|
|
265 |
"model": "mistralai/mistral-nemo",
|
266 |
"task": "language_modeling",
|
267 |
"metric": "chrf",
|
268 |
+
"score": 0.8612477844203897,
|
269 |
"bcp_47": 2
|
270 |
},
|
271 |
{
|
|
|
293 |
"model": "mistralai/mistral-small-24b-instruct-2501",
|
294 |
"task": "language_modeling",
|
295 |
"metric": "chrf",
|
296 |
+
"score": 0.8782400543225595,
|
297 |
"bcp_47": 2
|
298 |
},
|
299 |
{
|
|
|
321 |
"model": "openai/gpt-4o-mini",
|
322 |
"task": "language_modeling",
|
323 |
"metric": "chrf",
|
324 |
+
"score": 0.9560369064537906,
|
325 |
"bcp_47": 2
|
326 |
},
|
327 |
{
|
|
|
349 |
"model": "qwen/qwq-32b",
|
350 |
"task": "language_modeling",
|
351 |
"metric": "chrf",
|
352 |
+
"score": 0.47001826645586636,
|
353 |
"bcp_47": 2
|
354 |
},
|
355 |
{
|
|
|
701 |
"in_benchmark": true,
|
702 |
"task": "language_modeling",
|
703 |
"metric": "chrf",
|
704 |
+
"score": 0.9392314289764625,
|
705 |
"model": 1.0
|
706 |
},
|
707 |
{
|
|
|
827 |
"commonvoice_hours": null,
|
828 |
"commonvoice_locale": null,
|
829 |
"in_benchmark": true,
|
830 |
+
"task": "classification",
|
831 |
+
"metric": "accuracy",
|
832 |
+
"score": 0.4,
|
833 |
+
"model": 1.0
|
834 |
+
},
|
835 |
+
{
|
836 |
+
"bcp_47": "arz",
|
837 |
+
"speakers": 66639360,
|
838 |
+
"language_name": "Egyptian Arabic",
|
839 |
+
"autonym": "Egyptian Arabic",
|
840 |
+
"family": "Afro-Asiatic",
|
841 |
+
"flores_path": "arz_Arab",
|
842 |
+
"fleurs_tag": null,
|
843 |
+
"commonvoice_hours": null,
|
844 |
+
"commonvoice_locale": null,
|
845 |
+
"in_benchmark": true,
|
846 |
+
"task": "language_modeling",
|
847 |
+
"metric": "chrf",
|
848 |
+
"score": 0.930329195667362,
|
849 |
+
"model": 1.0
|
850 |
+
},
|
851 |
+
{
|
852 |
+
"bcp_47": "arz",
|
853 |
+
"speakers": 66639360,
|
854 |
+
"language_name": "Egyptian Arabic",
|
855 |
+
"autonym": "Egyptian Arabic",
|
856 |
+
"family": "Afro-Asiatic",
|
857 |
+
"flores_path": "arz_Arab",
|
858 |
+
"fleurs_tag": null,
|
859 |
+
"commonvoice_hours": null,
|
860 |
+
"commonvoice_locale": null,
|
861 |
+
"in_benchmark": true,
|
862 |
+
"task": "translation",
|
863 |
+
"metric": "bleu",
|
864 |
+
"score": 0.19793415292805128,
|
865 |
+
"model": 1.0
|
866 |
+
},
|
867 |
+
{
|
868 |
+
"bcp_47": "arz",
|
869 |
+
"speakers": 66639360,
|
870 |
+
"language_name": "Egyptian Arabic",
|
871 |
+
"autonym": "Egyptian Arabic",
|
872 |
+
"family": "Afro-Asiatic",
|
873 |
+
"flores_path": "arz_Arab",
|
874 |
+
"fleurs_tag": null,
|
875 |
+
"commonvoice_hours": null,
|
876 |
+
"commonvoice_locale": null,
|
877 |
+
"in_benchmark": true,
|
878 |
+
"task": "translation",
|
879 |
+
"metric": "chrf",
|
880 |
+
"score": 0.3881278724939126,
|
881 |
+
"model": 1.0
|
882 |
},
|
883 |
{
|
884 |
"bcp_47": "as",
|
|
|
1661 |
"in_benchmark": true,
|
1662 |
"task": "language_modeling",
|
1663 |
"metric": "chrf",
|
1664 |
+
"score": 0.9097658392566466,
|
1665 |
"model": 1.0
|
1666 |
},
|
1667 |
{
|
|
|
2040 |
"family": "Indo-European",
|
2041 |
"flores_path": "cat_Latn",
|
2042 |
"fleurs_tag": "ca_es",
|
2043 |
+
"commonvoice_hours": 2845.0,
|
2044 |
"commonvoice_locale": "ca",
|
2045 |
"in_benchmark": true,
|
2046 |
"task": null,
|
|
|
2635 |
"commonvoice_hours": 1360.0,
|
2636 |
"commonvoice_locale": "de",
|
2637 |
"in_benchmark": true,
|
2638 |
+
"task": "classification",
|
2639 |
+
"metric": "accuracy",
|
2640 |
+
"score": 0.6666666666666666,
|
2641 |
+
"model": 1.0
|
2642 |
+
},
|
2643 |
+
{
|
2644 |
+
"bcp_47": "de",
|
2645 |
+
"speakers": 136350226,
|
2646 |
+
"language_name": "German",
|
2647 |
+
"autonym": "Deutsch",
|
2648 |
+
"family": "Indo-European",
|
2649 |
+
"flores_path": "deu_Latn",
|
2650 |
+
"fleurs_tag": "de_de",
|
2651 |
+
"commonvoice_hours": 1360.0,
|
2652 |
+
"commonvoice_locale": "de",
|
2653 |
+
"in_benchmark": true,
|
2654 |
+
"task": "language_modeling",
|
2655 |
+
"metric": "chrf",
|
2656 |
+
"score": 0.9594656177914042,
|
2657 |
+
"model": 1.0
|
2658 |
+
},
|
2659 |
+
{
|
2660 |
+
"bcp_47": "de",
|
2661 |
+
"speakers": 136350226,
|
2662 |
+
"language_name": "German",
|
2663 |
+
"autonym": "Deutsch",
|
2664 |
+
"family": "Indo-European",
|
2665 |
+
"flores_path": "deu_Latn",
|
2666 |
+
"fleurs_tag": "de_de",
|
2667 |
+
"commonvoice_hours": 1360.0,
|
2668 |
+
"commonvoice_locale": "de",
|
2669 |
+
"in_benchmark": true,
|
2670 |
+
"task": "translation",
|
2671 |
+
"metric": "bleu",
|
2672 |
+
"score": 0.3207642359472324,
|
2673 |
+
"model": 1.0
|
2674 |
+
},
|
2675 |
+
{
|
2676 |
+
"bcp_47": "de",
|
2677 |
+
"speakers": 136350226,
|
2678 |
+
"language_name": "German",
|
2679 |
+
"autonym": "Deutsch",
|
2680 |
+
"family": "Indo-European",
|
2681 |
+
"flores_path": "deu_Latn",
|
2682 |
+
"fleurs_tag": "de_de",
|
2683 |
+
"commonvoice_hours": 1360.0,
|
2684 |
+
"commonvoice_locale": "de",
|
2685 |
+
"in_benchmark": true,
|
2686 |
+
"task": "translation",
|
2687 |
+
"metric": "chrf",
|
2688 |
+
"score": 0.49973270743869647,
|
2689 |
+
"model": 1.0
|
2690 |
},
|
2691 |
{
|
2692 |
"bcp_47": "den",
|
|
|
3021 |
"in_benchmark": true,
|
3022 |
"task": "language_modeling",
|
3023 |
"metric": "chrf",
|
3024 |
+
"score": 0.9180269549823046,
|
3025 |
"model": 12.0
|
3026 |
},
|
3027 |
{
|
|
|
3037 |
"in_benchmark": true,
|
3038 |
"task": "translation",
|
3039 |
"metric": "bleu",
|
3040 |
+
"score": 0.3703633711863608,
|
3041 |
"model": 12.0
|
3042 |
},
|
3043 |
{
|
|
|
3101 |
"in_benchmark": true,
|
3102 |
"task": "language_modeling",
|
3103 |
"metric": "chrf",
|
3104 |
+
"score": 0.9569342865902168,
|
3105 |
"model": 1.0
|
3106 |
},
|
3107 |
{
|
|
|
3176 |
"family": null,
|
3177 |
"flores_path": "eus_Latn",
|
3178 |
"fleurs_tag": null,
|
3179 |
+
"commonvoice_hours": 336.0,
|
3180 |
"commonvoice_locale": "eu",
|
3181 |
"in_benchmark": true,
|
3182 |
"task": null,
|
|
|
3227 |
"commonvoice_hours": 370.0,
|
3228 |
"commonvoice_locale": "fa",
|
3229 |
"in_benchmark": true,
|
3230 |
+
"task": "classification",
|
3231 |
+
"metric": "accuracy",
|
3232 |
+
"score": 0.4,
|
3233 |
+
"model": 1.0
|
3234 |
+
},
|
3235 |
+
{
|
3236 |
+
"bcp_47": "fa",
|
3237 |
+
"speakers": 84710459,
|
3238 |
+
"language_name": "Persian",
|
3239 |
+
"autonym": "فارسی",
|
3240 |
+
"family": "Indo-European",
|
3241 |
+
"flores_path": "pes_Arab",
|
3242 |
+
"fleurs_tag": "fa_ir",
|
3243 |
+
"commonvoice_hours": 370.0,
|
3244 |
+
"commonvoice_locale": "fa",
|
3245 |
+
"in_benchmark": true,
|
3246 |
+
"task": "language_modeling",
|
3247 |
+
"metric": "chrf",
|
3248 |
+
"score": 0.9414698824984596,
|
3249 |
+
"model": 1.0
|
3250 |
+
},
|
3251 |
+
{
|
3252 |
+
"bcp_47": "fa",
|
3253 |
+
"speakers": 84710459,
|
3254 |
+
"language_name": "Persian",
|
3255 |
+
"autonym": "فارسی",
|
3256 |
+
"family": "Indo-European",
|
3257 |
+
"flores_path": "pes_Arab",
|
3258 |
+
"fleurs_tag": "fa_ir",
|
3259 |
+
"commonvoice_hours": 370.0,
|
3260 |
+
"commonvoice_locale": "fa",
|
3261 |
+
"in_benchmark": true,
|
3262 |
+
"task": "translation",
|
3263 |
+
"metric": "bleu",
|
3264 |
+
"score": 0.26232478733341374,
|
3265 |
+
"model": 1.0
|
3266 |
+
},
|
3267 |
+
{
|
3268 |
+
"bcp_47": "fa",
|
3269 |
+
"speakers": 84710459,
|
3270 |
+
"language_name": "Persian",
|
3271 |
+
"autonym": "فارسی",
|
3272 |
+
"family": "Indo-European",
|
3273 |
+
"flores_path": "pes_Arab",
|
3274 |
+
"fleurs_tag": "fa_ir",
|
3275 |
+
"commonvoice_hours": 370.0,
|
3276 |
+
"commonvoice_locale": "fa",
|
3277 |
+
"in_benchmark": true,
|
3278 |
+
"task": "translation",
|
3279 |
+
"metric": "chrf",
|
3280 |
+
"score": 0.44641220608314985,
|
3281 |
+
"model": 1.0
|
3282 |
},
|
3283 |
{
|
3284 |
"bcp_47": "fan",
|
|
|
3387 |
"commonvoice_hours": 0.0,
|
3388 |
"commonvoice_locale": "tl",
|
3389 |
"in_benchmark": true,
|
3390 |
+
"task": "classification",
|
3391 |
+
"metric": "accuracy",
|
3392 |
+
"score": 0.43333333333333335,
|
3393 |
+
"model": 1.0
|
3394 |
+
},
|
3395 |
+
{
|
3396 |
+
"bcp_47": "fil",
|
3397 |
+
"speakers": 67471096,
|
3398 |
+
"language_name": "Filipino",
|
3399 |
+
"autonym": "Filipino",
|
3400 |
+
"family": "Austronesian",
|
3401 |
+
"flores_path": "fil_Latn",
|
3402 |
+
"fleurs_tag": "fil_ph",
|
3403 |
+
"commonvoice_hours": 0.0,
|
3404 |
+
"commonvoice_locale": "tl",
|
3405 |
+
"in_benchmark": true,
|
3406 |
+
"task": "language_modeling",
|
3407 |
+
"metric": "chrf",
|
3408 |
+
"score": 0.9402707475255596,
|
3409 |
+
"model": 1.0
|
3410 |
+
},
|
3411 |
+
{
|
3412 |
+
"bcp_47": "fil",
|
3413 |
+
"speakers": 67471096,
|
3414 |
+
"language_name": "Filipino",
|
3415 |
+
"autonym": "Filipino",
|
3416 |
+
"family": "Austronesian",
|
3417 |
+
"flores_path": "fil_Latn",
|
3418 |
+
"fleurs_tag": "fil_ph",
|
3419 |
+
"commonvoice_hours": 0.0,
|
3420 |
+
"commonvoice_locale": "tl",
|
3421 |
+
"in_benchmark": true,
|
3422 |
+
"task": "translation",
|
3423 |
+
"metric": "bleu",
|
3424 |
+
"score": 0.29097818784870333,
|
3425 |
+
"model": 1.0
|
3426 |
+
},
|
3427 |
+
{
|
3428 |
+
"bcp_47": "fil",
|
3429 |
+
"speakers": 67471096,
|
3430 |
+
"language_name": "Filipino",
|
3431 |
+
"autonym": "Filipino",
|
3432 |
+
"family": "Austronesian",
|
3433 |
+
"flores_path": "fil_Latn",
|
3434 |
+
"fleurs_tag": "fil_ph",
|
3435 |
+
"commonvoice_hours": 0.0,
|
3436 |
+
"commonvoice_locale": "tl",
|
3437 |
+
"in_benchmark": true,
|
3438 |
+
"task": "translation",
|
3439 |
+
"metric": "chrf",
|
3440 |
+
"score": 0.44978114149245985,
|
3441 |
+
"model": 1.0
|
3442 |
},
|
3443 |
{
|
3444 |
"bcp_47": "fit",
|
|
|
3533 |
"in_benchmark": true,
|
3534 |
"task": "language_modeling",
|
3535 |
"metric": "chrf",
|
3536 |
+
"score": 0.9815706066541411,
|
3537 |
"model": 1.0
|
3538 |
},
|
3539 |
{
|
|
|
3736 |
"family": "Indo-European",
|
3737 |
"flores_path": "gle_Latn",
|
3738 |
"fleurs_tag": "ga_ie",
|
3739 |
+
"commonvoice_hours": 6.0,
|
3740 |
"commonvoice_locale": "ga-IE",
|
3741 |
"in_benchmark": true,
|
3742 |
"task": null,
|
|
|
4091 |
"commonvoice_hours": 0.0,
|
4092 |
"commonvoice_locale": "gu-IN",
|
4093 |
"in_benchmark": true,
|
4094 |
+
"task": "classification",
|
4095 |
+
"metric": "accuracy",
|
4096 |
+
"score": 0.43333333333333335,
|
4097 |
+
"model": 1.0
|
4098 |
},
|
4099 |
{
|
4100 |
+
"bcp_47": "gu",
|
4101 |
+
"speakers": 61721799,
|
4102 |
+
"language_name": "Gujarati",
|
4103 |
+
"autonym": "ગુજરાતી",
|
4104 |
+
"family": "Indo-European",
|
4105 |
+
"flores_path": "guj_Gujr",
|
4106 |
+
"fleurs_tag": "gu_in",
|
4107 |
+
"commonvoice_hours": 0.0,
|
4108 |
+
"commonvoice_locale": "gu-IN",
|
4109 |
+
"in_benchmark": true,
|
4110 |
+
"task": "language_modeling",
|
4111 |
+
"metric": "chrf",
|
4112 |
+
"score": 0.938086045460355,
|
4113 |
+
"model": 1.0
|
4114 |
},
|
4115 |
{
|
4116 |
+
"bcp_47": "gu",
|
4117 |
+
"speakers": 61721799,
|
4118 |
+
"language_name": "Gujarati",
|
4119 |
+
"autonym": "ગુજરાતી",
|
4120 |
+
"family": "Indo-European",
|
4121 |
+
"flores_path": "guj_Gujr",
|
4122 |
+
"fleurs_tag": "gu_in",
|
4123 |
+
"commonvoice_hours": 0.0,
|
4124 |
+
"commonvoice_locale": "gu-IN",
|
4125 |
+
"in_benchmark": true,
|
4126 |
+
"task": "translation",
|
4127 |
+
"metric": "bleu",
|
4128 |
+
"score": 0.26442484966880464,
|
4129 |
+
"model": 1.0
|
4130 |
+
},
|
4131 |
+
{
|
4132 |
+
"bcp_47": "gu",
|
4133 |
+
"speakers": 61721799,
|
4134 |
+
"language_name": "Gujarati",
|
4135 |
+
"autonym": "ગુજરાતી",
|
4136 |
+
"family": "Indo-European",
|
4137 |
+
"flores_path": "guj_Gujr",
|
4138 |
+
"fleurs_tag": "gu_in",
|
4139 |
+
"commonvoice_hours": 0.0,
|
4140 |
+
"commonvoice_locale": "gu-IN",
|
4141 |
+
"in_benchmark": true,
|
4142 |
+
"task": "translation",
|
4143 |
+
"metric": "chrf",
|
4144 |
+
"score": 0.44452182973195975,
|
4145 |
+
"model": 1.0
|
4146 |
+
},
|
4147 |
+
{
|
4148 |
+
"bcp_47": "gub",
|
4149 |
+
"speakers": 17784,
|
4150 |
+
"language_name": "Guajajára",
|
4151 |
+
"autonym": "Guajajára",
|
4152 |
+
"family": "Tupian",
|
4153 |
+
"flores_path": null,
|
4154 |
+
"fleurs_tag": null,
|
4155 |
+
"commonvoice_hours": null,
|
4156 |
+
"commonvoice_locale": null,
|
4157 |
+
"in_benchmark": false,
|
4158 |
+
"task": null,
|
4159 |
+
"metric": null,
|
4160 |
+
"score": null,
|
4161 |
+
"model": null
|
4162 |
+
},
|
4163 |
+
{
|
4164 |
+
"bcp_47": "guc",
|
4165 |
+
"speakers": 132529,
|
4166 |
+
"language_name": "Wayuu",
|
4167 |
+
"autonym": "Wayuu",
|
4168 |
+
"family": "Arawakan",
|
4169 |
+
"flores_path": null,
|
4170 |
+
"fleurs_tag": null,
|
4171 |
+
"commonvoice_hours": 0.0,
|
4172 |
"commonvoice_locale": "guc",
|
4173 |
"in_benchmark": false,
|
4174 |
"task": null,
|
|
|
4365 |
"in_benchmark": true,
|
4366 |
"task": "language_modeling",
|
4367 |
"metric": "chrf",
|
4368 |
+
"score": 0.9428185393832219,
|
4369 |
"model": 1.0
|
4370 |
},
|
4371 |
{
|
|
|
4747 |
"commonvoice_hours": 33.0,
|
4748 |
"commonvoice_locale": "id",
|
4749 |
"in_benchmark": true,
|
4750 |
+
"task": "classification",
|
4751 |
+
"metric": "accuracy",
|
4752 |
+
"score": 0.6333333333333333,
|
4753 |
+
"model": 1.0
|
4754 |
+
},
|
4755 |
+
{
|
4756 |
+
"bcp_47": "id",
|
4757 |
+
"speakers": 171207687,
|
4758 |
+
"language_name": "Indonesian",
|
4759 |
+
"autonym": "Bahasa Indonesia",
|
4760 |
+
"family": "Austronesian",
|
4761 |
+
"flores_path": "ind_Latn",
|
4762 |
+
"fleurs_tag": "id_id",
|
4763 |
+
"commonvoice_hours": 33.0,
|
4764 |
+
"commonvoice_locale": "id",
|
4765 |
+
"in_benchmark": true,
|
4766 |
+
"task": "language_modeling",
|
4767 |
+
"metric": "chrf",
|
4768 |
+
"score": 0.9598314474300775,
|
4769 |
+
"model": 1.0
|
4770 |
+
},
|
4771 |
+
{
|
4772 |
+
"bcp_47": "id",
|
4773 |
+
"speakers": 171207687,
|
4774 |
+
"language_name": "Indonesian",
|
4775 |
+
"autonym": "Bahasa Indonesia",
|
4776 |
+
"family": "Austronesian",
|
4777 |
+
"flores_path": "ind_Latn",
|
4778 |
+
"fleurs_tag": "id_id",
|
4779 |
+
"commonvoice_hours": 33.0,
|
4780 |
+
"commonvoice_locale": "id",
|
4781 |
+
"in_benchmark": true,
|
4782 |
+
"task": "translation",
|
4783 |
+
"metric": "bleu",
|
4784 |
+
"score": 0.29354203311552335,
|
4785 |
+
"model": 1.0
|
4786 |
+
},
|
4787 |
+
{
|
4788 |
+
"bcp_47": "id",
|
4789 |
+
"speakers": 171207687,
|
4790 |
+
"language_name": "Indonesian",
|
4791 |
+
"autonym": "Bahasa Indonesia",
|
4792 |
+
"family": "Austronesian",
|
4793 |
+
"flores_path": "ind_Latn",
|
4794 |
+
"fleurs_tag": "id_id",
|
4795 |
+
"commonvoice_hours": 33.0,
|
4796 |
+
"commonvoice_locale": "id",
|
4797 |
+
"in_benchmark": true,
|
4798 |
+
"task": "translation",
|
4799 |
+
"metric": "chrf",
|
4800 |
+
"score": 0.4723493656022861,
|
4801 |
+
"model": 1.0
|
4802 |
},
|
4803 |
{
|
4804 |
"bcp_47": "ie",
|
|
|
4955 |
"commonvoice_hours": 362.0,
|
4956 |
"commonvoice_locale": "it",
|
4957 |
"in_benchmark": true,
|
4958 |
+
"task": "classification",
|
4959 |
+
"metric": "accuracy",
|
4960 |
+
"score": 0.6666666666666666,
|
4961 |
+
"model": 1.0
|
4962 |
+
},
|
4963 |
+
{
|
4964 |
+
"bcp_47": "it",
|
4965 |
+
"speakers": 70247060,
|
4966 |
+
"language_name": "Italian",
|
4967 |
+
"autonym": "Italiano",
|
4968 |
+
"family": "Indo-European",
|
4969 |
+
"flores_path": "ita_Latn",
|
4970 |
+
"fleurs_tag": "it_it",
|
4971 |
+
"commonvoice_hours": 362.0,
|
4972 |
+
"commonvoice_locale": "it",
|
4973 |
+
"in_benchmark": true,
|
4974 |
+
"task": "language_modeling",
|
4975 |
+
"metric": "chrf",
|
4976 |
+
"score": 0.9439490413212892,
|
4977 |
+
"model": 1.0
|
4978 |
+
},
|
4979 |
+
{
|
4980 |
+
"bcp_47": "it",
|
4981 |
+
"speakers": 70247060,
|
4982 |
+
"language_name": "Italian",
|
4983 |
+
"autonym": "Italiano",
|
4984 |
+
"family": "Indo-European",
|
4985 |
+
"flores_path": "ita_Latn",
|
4986 |
+
"fleurs_tag": "it_it",
|
4987 |
+
"commonvoice_hours": 362.0,
|
4988 |
+
"commonvoice_locale": "it",
|
4989 |
+
"in_benchmark": true,
|
4990 |
+
"task": "translation",
|
4991 |
+
"metric": "bleu",
|
4992 |
+
"score": 0.28142583904826096,
|
4993 |
+
"model": 1.0
|
4994 |
+
},
|
4995 |
+
{
|
4996 |
+
"bcp_47": "it",
|
4997 |
+
"speakers": 70247060,
|
4998 |
+
"language_name": "Italian",
|
4999 |
+
"autonym": "Italiano",
|
5000 |
+
"family": "Indo-European",
|
5001 |
+
"flores_path": "ita_Latn",
|
5002 |
+
"fleurs_tag": "it_it",
|
5003 |
+
"commonvoice_hours": 362.0,
|
5004 |
+
"commonvoice_locale": "it",
|
5005 |
+
"in_benchmark": true,
|
5006 |
+
"task": "translation",
|
5007 |
+
"metric": "chrf",
|
5008 |
+
"score": 0.4707591889357925,
|
5009 |
+
"model": 1.0
|
5010 |
},
|
5011 |
{
|
5012 |
"bcp_47": "iu",
|
|
|
5051 |
"commonvoice_hours": 222.0,
|
5052 |
"commonvoice_locale": "ja",
|
5053 |
"in_benchmark": true,
|
5054 |
+
"task": "classification",
|
5055 |
+
"metric": "accuracy",
|
5056 |
+
"score": 0.6333333333333333,
|
5057 |
+
"model": 1.0
|
5058 |
+
},
|
5059 |
+
{
|
5060 |
+
"bcp_47": "ja",
|
5061 |
+
"speakers": 119729026,
|
5062 |
+
"language_name": "Japanese",
|
5063 |
+
"autonym": "日本語",
|
5064 |
+
"family": "Japonic",
|
5065 |
+
"flores_path": "jpn_Jpan",
|
5066 |
+
"fleurs_tag": "ja_jp",
|
5067 |
+
"commonvoice_hours": 222.0,
|
5068 |
+
"commonvoice_locale": "ja",
|
5069 |
+
"in_benchmark": true,
|
5070 |
+
"task": "language_modeling",
|
5071 |
+
"metric": "chrf",
|
5072 |
+
"score": 0.9371132855221468,
|
5073 |
+
"model": 1.0
|
5074 |
+
},
|
5075 |
+
{
|
5076 |
+
"bcp_47": "ja",
|
5077 |
+
"speakers": 119729026,
|
5078 |
+
"language_name": "Japanese",
|
5079 |
+
"autonym": "日本語",
|
5080 |
+
"family": "Japonic",
|
5081 |
+
"flores_path": "jpn_Jpan",
|
5082 |
+
"fleurs_tag": "ja_jp",
|
5083 |
+
"commonvoice_hours": 222.0,
|
5084 |
+
"commonvoice_locale": "ja",
|
5085 |
+
"in_benchmark": true,
|
5086 |
+
"task": "translation",
|
5087 |
+
"metric": "bleu",
|
5088 |
+
"score": 0.2723410893967824,
|
5089 |
+
"model": 1.0
|
5090 |
+
},
|
5091 |
+
{
|
5092 |
+
"bcp_47": "ja",
|
5093 |
+
"speakers": 119729026,
|
5094 |
+
"language_name": "Japanese",
|
5095 |
+
"autonym": "日本語",
|
5096 |
+
"family": "Japonic",
|
5097 |
+
"flores_path": "jpn_Jpan",
|
5098 |
+
"fleurs_tag": "ja_jp",
|
5099 |
+
"commonvoice_hours": 222.0,
|
5100 |
+
"commonvoice_locale": "ja",
|
5101 |
+
"in_benchmark": true,
|
5102 |
+
"task": "translation",
|
5103 |
+
"metric": "chrf",
|
5104 |
+
"score": 0.43929453749366865,
|
5105 |
+
"model": 1.0
|
5106 |
},
|
5107 |
{
|
5108 |
"bcp_47": "jam",
|
|
|
5211 |
"commonvoice_hours": 0.0,
|
5212 |
"commonvoice_locale": "jv",
|
5213 |
"in_benchmark": true,
|
5214 |
+
"task": "classification",
|
5215 |
+
"metric": "accuracy",
|
5216 |
+
"score": 0.4666666666666667,
|
5217 |
+
"model": 1.0
|
5218 |
},
|
5219 |
{
|
5220 |
+
"bcp_47": "jv",
|
5221 |
+
"speakers": 91180665,
|
5222 |
+
"language_name": "Javanese",
|
5223 |
+
"autonym": "Jawa",
|
5224 |
+
"family": "Austronesian",
|
5225 |
+
"flores_path": "jav_Latn",
|
5226 |
+
"fleurs_tag": "jv_id",
|
5227 |
+
"commonvoice_hours": 0.0,
|
5228 |
+
"commonvoice_locale": "jv",
|
5229 |
"in_benchmark": true,
|
5230 |
+
"task": "language_modeling",
|
5231 |
+
"metric": "chrf",
|
5232 |
+
"score": 0.9298143194922116,
|
5233 |
+
"model": 1.0
|
5234 |
},
|
5235 |
{
|
5236 |
+
"bcp_47": "jv",
|
5237 |
+
"speakers": 91180665,
|
5238 |
+
"language_name": "Javanese",
|
5239 |
+
"autonym": "Jawa",
|
5240 |
+
"family": "Austronesian",
|
5241 |
+
"flores_path": "jav_Latn",
|
5242 |
+
"fleurs_tag": "jv_id",
|
5243 |
+
"commonvoice_hours": 0.0,
|
5244 |
+
"commonvoice_locale": "jv",
|
5245 |
+
"in_benchmark": true,
|
5246 |
+
"task": "translation",
|
5247 |
+
"metric": "bleu",
|
5248 |
+
"score": 0.23729186537968905,
|
5249 |
+
"model": 1.0
|
5250 |
+
},
|
5251 |
+
{
|
5252 |
+
"bcp_47": "jv",
|
5253 |
+
"speakers": 91180665,
|
5254 |
+
"language_name": "Javanese",
|
5255 |
+
"autonym": "Jawa",
|
5256 |
+
"family": "Austronesian",
|
5257 |
+
"flores_path": "jav_Latn",
|
5258 |
+
"fleurs_tag": "jv_id",
|
5259 |
+
"commonvoice_hours": 0.0,
|
5260 |
+
"commonvoice_locale": "jv",
|
5261 |
+
"in_benchmark": true,
|
5262 |
+
"task": "translation",
|
5263 |
+
"metric": "chrf",
|
5264 |
+
"score": 0.4198940727847352,
|
5265 |
+
"model": 1.0
|
5266 |
+
},
|
5267 |
+
{
|
5268 |
+
"bcp_47": "ka",
|
5269 |
+
"speakers": 3543646,
|
5270 |
+
"language_name": "Georgian",
|
5271 |
+
"autonym": "ქართული",
|
5272 |
+
"family": "Kartvelian",
|
5273 |
+
"flores_path": "kat_Geor",
|
5274 |
+
"fleurs_tag": "ka_ge",
|
5275 |
+
"commonvoice_hours": 158.0,
|
5276 |
+
"commonvoice_locale": "ka",
|
5277 |
+
"in_benchmark": true,
|
5278 |
+
"task": null,
|
5279 |
+
"metric": null,
|
5280 |
+
"score": null,
|
5281 |
+
"model": null
|
5282 |
+
},
|
5283 |
+
{
|
5284 |
+
"bcp_47": "kaa",
|
5285 |
+
"speakers": 489046,
|
5286 |
+
"language_name": "Kara-Kalpak",
|
5287 |
+
"autonym": "Kara-Kalpak",
|
5288 |
+
"family": "Turkic",
|
5289 |
+
"flores_path": null,
|
5290 |
+
"fleurs_tag": null,
|
5291 |
+
"commonvoice_hours": 0.0,
|
5292 |
+
"commonvoice_locale": "kaa",
|
5293 |
+
"in_benchmark": false,
|
5294 |
+
"task": null,
|
5295 |
"metric": null,
|
5296 |
"score": null,
|
5297 |
"model": null
|
|
|
5384 |
"family": "Abkhaz-Adyge",
|
5385 |
"flores_path": null,
|
5386 |
"fleurs_tag": null,
|
5387 |
+
"commonvoice_hours": 19.0,
|
5388 |
"commonvoice_locale": "kbd",
|
5389 |
"in_benchmark": false,
|
5390 |
"task": null,
|
|
|
5883 |
"commonvoice_hours": 1.7,
|
5884 |
"commonvoice_locale": "ko",
|
5885 |
"in_benchmark": true,
|
5886 |
+
"task": "classification",
|
5887 |
+
"metric": "accuracy",
|
5888 |
+
"score": 0.5333333333333333,
|
5889 |
+
"model": 1.0
|
5890 |
+
},
|
5891 |
+
{
|
5892 |
+
"bcp_47": "ko",
|
5893 |
+
"speakers": 78357046,
|
5894 |
+
"language_name": "Korean",
|
5895 |
+
"autonym": "한국어",
|
5896 |
+
"family": "Koreanic",
|
5897 |
+
"flores_path": "kor_Hang",
|
5898 |
+
"fleurs_tag": "ko_kr",
|
5899 |
+
"commonvoice_hours": 1.7,
|
5900 |
+
"commonvoice_locale": "ko",
|
5901 |
+
"in_benchmark": true,
|
5902 |
+
"task": "language_modeling",
|
5903 |
+
"metric": "chrf",
|
5904 |
+
"score": 0.9355445912073929,
|
5905 |
+
"model": 1.0
|
5906 |
+
},
|
5907 |
+
{
|
5908 |
+
"bcp_47": "ko",
|
5909 |
+
"speakers": 78357046,
|
5910 |
+
"language_name": "Korean",
|
5911 |
+
"autonym": "한국어",
|
5912 |
+
"family": "Koreanic",
|
5913 |
+
"flores_path": "kor_Hang",
|
5914 |
+
"fleurs_tag": "ko_kr",
|
5915 |
+
"commonvoice_hours": 1.7,
|
5916 |
+
"commonvoice_locale": "ko",
|
5917 |
+
"in_benchmark": true,
|
5918 |
+
"task": "translation",
|
5919 |
+
"metric": "bleu",
|
5920 |
+
"score": 0.20332074778330964,
|
5921 |
+
"model": 1.0
|
5922 |
+
},
|
5923 |
+
{
|
5924 |
+
"bcp_47": "ko",
|
5925 |
+
"speakers": 78357046,
|
5926 |
+
"language_name": "Korean",
|
5927 |
+
"autonym": "한국어",
|
5928 |
+
"family": "Koreanic",
|
5929 |
+
"flores_path": "kor_Hang",
|
5930 |
+
"fleurs_tag": "ko_kr",
|
5931 |
+
"commonvoice_hours": 1.7,
|
5932 |
+
"commonvoice_locale": "ko",
|
5933 |
+
"in_benchmark": true,
|
5934 |
+
"task": "translation",
|
5935 |
+
"metric": "chrf",
|
5936 |
+
"score": 0.4005255477730261,
|
5937 |
+
"model": 1.0
|
5938 |
},
|
5939 |
{
|
5940 |
"bcp_47": "koi",
|
|
|
6232 |
"family": "Indo-European",
|
6233 |
"flores_path": null,
|
6234 |
"fleurs_tag": null,
|
6235 |
+
"commonvoice_hours": 8.1,
|
6236 |
"commonvoice_locale": "kw",
|
6237 |
"in_benchmark": false,
|
6238 |
"task": null,
|
|
|
7352 |
"family": "Indo-European",
|
7353 |
"flores_path": "mkd_Cyrl",
|
7354 |
"fleurs_tag": "mk_mk",
|
7355 |
+
"commonvoice_hours": 19.0,
|
7356 |
"commonvoice_locale": "mk",
|
7357 |
"in_benchmark": true,
|
7358 |
"task": null,
|
|
|
7499 |
"commonvoice_hours": 20.0,
|
7500 |
"commonvoice_locale": "mr",
|
7501 |
"in_benchmark": true,
|
7502 |
+
"task": "classification",
|
7503 |
+
"metric": "accuracy",
|
7504 |
+
"score": 0.6333333333333333,
|
7505 |
+
"model": 1.0
|
7506 |
+
},
|
7507 |
+
{
|
7508 |
+
"bcp_47": "mr",
|
7509 |
+
"speakers": 92826300,
|
7510 |
+
"language_name": "Marathi",
|
7511 |
+
"autonym": "मराठी",
|
7512 |
+
"family": "Indo-European",
|
7513 |
+
"flores_path": "mar_Deva",
|
7514 |
+
"fleurs_tag": "mr_in",
|
7515 |
+
"commonvoice_hours": 20.0,
|
7516 |
+
"commonvoice_locale": "mr",
|
7517 |
+
"in_benchmark": true,
|
7518 |
+
"task": "language_modeling",
|
7519 |
+
"metric": "chrf",
|
7520 |
+
"score": 0.9440892312053646,
|
7521 |
+
"model": 1.0
|
7522 |
+
},
|
7523 |
+
{
|
7524 |
+
"bcp_47": "mr",
|
7525 |
+
"speakers": 92826300,
|
7526 |
+
"language_name": "Marathi",
|
7527 |
+
"autonym": "मराठी",
|
7528 |
+
"family": "Indo-European",
|
7529 |
+
"flores_path": "mar_Deva",
|
7530 |
+
"fleurs_tag": "mr_in",
|
7531 |
+
"commonvoice_hours": 20.0,
|
7532 |
+
"commonvoice_locale": "mr",
|
7533 |
+
"in_benchmark": true,
|
7534 |
+
"task": "translation",
|
7535 |
+
"metric": "bleu",
|
7536 |
+
"score": 0.24903049799655144,
|
7537 |
+
"model": 1.0
|
7538 |
+
},
|
7539 |
+
{
|
7540 |
+
"bcp_47": "mr",
|
7541 |
+
"speakers": 92826300,
|
7542 |
+
"language_name": "Marathi",
|
7543 |
+
"autonym": "मराठी",
|
7544 |
+
"family": "Indo-European",
|
7545 |
+
"flores_path": "mar_Deva",
|
7546 |
+
"fleurs_tag": "mr_in",
|
7547 |
+
"commonvoice_hours": 20.0,
|
7548 |
+
"commonvoice_locale": "mr",
|
7549 |
+
"in_benchmark": true,
|
7550 |
+
"task": "translation",
|
7551 |
+
"metric": "chrf",
|
7552 |
+
"score": 0.42489125861884175,
|
7553 |
+
"model": 1.0
|
7554 |
},
|
7555 |
{
|
7556 |
"bcp_47": "mrd",
|
|
|
8504 |
"family": "Indo-European",
|
8505 |
"flores_path": null,
|
8506 |
"fleurs_tag": null,
|
8507 |
+
"commonvoice_hours": 0.8,
|
8508 |
"commonvoice_locale": "os",
|
8509 |
"in_benchmark": false,
|
8510 |
"task": null,
|
|
|
8557 |
"in_benchmark": true,
|
8558 |
"task": "language_modeling",
|
8559 |
"metric": "chrf",
|
8560 |
+
"score": 0.9025298113664532,
|
8561 |
"model": 1.0
|
8562 |
},
|
8563 |
{
|
|
|
8925 |
"in_benchmark": true,
|
8926 |
"task": "language_modeling",
|
8927 |
"metric": "chrf",
|
8928 |
+
"score": 0.9641423549595803,
|
8929 |
"model": 1.0
|
8930 |
},
|
8931 |
{
|
|
|
9352 |
"family": "Indo-European",
|
9353 |
"flores_path": "rus_Cyrl",
|
9354 |
"fleurs_tag": "ru_ru",
|
9355 |
+
"commonvoice_hours": 243.0,
|
9356 |
"commonvoice_locale": "ru",
|
9357 |
"in_benchmark": true,
|
9358 |
+
"task": "classification",
|
9359 |
+
"metric": "accuracy",
|
9360 |
+
"score": 0.5666666666666667,
|
9361 |
+
"model": 1.0
|
9362 |
+
},
|
9363 |
+
{
|
9364 |
+
"bcp_47": "ru",
|
9365 |
+
"speakers": 195841151,
|
9366 |
+
"language_name": "Russian",
|
9367 |
+
"autonym": "Русский",
|
9368 |
+
"family": "Indo-European",
|
9369 |
+
"flores_path": "rus_Cyrl",
|
9370 |
+
"fleurs_tag": "ru_ru",
|
9371 |
+
"commonvoice_hours": 243.0,
|
9372 |
+
"commonvoice_locale": "ru",
|
9373 |
+
"in_benchmark": true,
|
9374 |
+
"task": "language_modeling",
|
9375 |
+
"metric": "chrf",
|
9376 |
+
"score": 0.9663696817874857,
|
9377 |
+
"model": 1.0
|
9378 |
+
},
|
9379 |
+
{
|
9380 |
+
"bcp_47": "ru",
|
9381 |
+
"speakers": 195841151,
|
9382 |
+
"language_name": "Russian",
|
9383 |
+
"autonym": "Русский",
|
9384 |
+
"family": "Indo-European",
|
9385 |
+
"flores_path": "rus_Cyrl",
|
9386 |
+
"fleurs_tag": "ru_ru",
|
9387 |
+
"commonvoice_hours": 243.0,
|
9388 |
+
"commonvoice_locale": "ru",
|
9389 |
+
"in_benchmark": true,
|
9390 |
+
"task": "translation",
|
9391 |
+
"metric": "bleu",
|
9392 |
+
"score": 0.26015179309825326,
|
9393 |
+
"model": 1.0
|
9394 |
+
},
|
9395 |
+
{
|
9396 |
+
"bcp_47": "ru",
|
9397 |
+
"speakers": 195841151,
|
9398 |
+
"language_name": "Russian",
|
9399 |
+
"autonym": "Русский",
|
9400 |
+
"family": "Indo-European",
|
9401 |
+
"flores_path": "rus_Cyrl",
|
9402 |
+
"fleurs_tag": "ru_ru",
|
9403 |
+
"commonvoice_hours": 243.0,
|
9404 |
+
"commonvoice_locale": "ru",
|
9405 |
+
"in_benchmark": true,
|
9406 |
+
"task": "translation",
|
9407 |
+
"metric": "chrf",
|
9408 |
+
"score": 0.4525762744858351,
|
9409 |
+
"model": 1.0
|
9410 |
},
|
9411 |
{
|
9412 |
"bcp_47": "rue",
|
|
|
9800 |
"family": null,
|
9801 |
"flores_path": null,
|
9802 |
"fleurs_tag": null,
|
9803 |
+
"commonvoice_hours": 2.5,
|
9804 |
"commonvoice_locale": "sei",
|
9805 |
"in_benchmark": false,
|
9806 |
"task": null,
|
|
|
10379 |
"commonvoice_hours": 411.0,
|
10380 |
"commonvoice_locale": "sw",
|
10381 |
"in_benchmark": true,
|
10382 |
+
"task": "classification",
|
10383 |
+
"metric": "accuracy",
|
10384 |
+
"score": 0.5666666666666667,
|
10385 |
+
"model": 1.0
|
10386 |
},
|
10387 |
{
|
10388 |
+
"bcp_47": "sw",
|
10389 |
+
"speakers": 171610296,
|
10390 |
+
"language_name": "Swahili",
|
10391 |
+
"autonym": "Kiswahili",
|
10392 |
"family": "Atlantic-Congo",
|
10393 |
+
"flores_path": "swh_Latn",
|
10394 |
+
"fleurs_tag": "sw_ke",
|
10395 |
+
"commonvoice_hours": 411.0,
|
10396 |
+
"commonvoice_locale": "sw",
|
10397 |
+
"in_benchmark": true,
|
10398 |
+
"task": "language_modeling",
|
10399 |
+
"metric": "chrf",
|
10400 |
+
"score": 0.9401745263817055,
|
10401 |
+
"model": 1.0
|
10402 |
},
|
10403 |
{
|
10404 |
+
"bcp_47": "sw",
|
10405 |
+
"speakers": 171610296,
|
10406 |
+
"language_name": "Swahili",
|
10407 |
+
"autonym": "Kiswahili",
|
10408 |
+
"family": "Atlantic-Congo",
|
10409 |
+
"flores_path": "swh_Latn",
|
10410 |
+
"fleurs_tag": "sw_ke",
|
10411 |
+
"commonvoice_hours": 411.0,
|
10412 |
+
"commonvoice_locale": "sw",
|
10413 |
+
"in_benchmark": true,
|
10414 |
+
"task": "translation",
|
10415 |
+
"metric": "bleu",
|
10416 |
+
"score": 0.30022614000139736,
|
10417 |
+
"model": 1.0
|
10418 |
+
},
|
10419 |
+
{
|
10420 |
+
"bcp_47": "sw",
|
10421 |
+
"speakers": 171610296,
|
10422 |
+
"language_name": "Swahili",
|
10423 |
+
"autonym": "Kiswahili",
|
10424 |
+
"family": "Atlantic-Congo",
|
10425 |
+
"flores_path": "swh_Latn",
|
10426 |
+
"fleurs_tag": "sw_ke",
|
10427 |
+
"commonvoice_hours": 411.0,
|
10428 |
+
"commonvoice_locale": "sw",
|
10429 |
+
"in_benchmark": true,
|
10430 |
+
"task": "translation",
|
10431 |
+
"metric": "chrf",
|
10432 |
+
"score": 0.46620999112028233,
|
10433 |
+
"model": 1.0
|
10434 |
+
},
|
10435 |
+
{
|
10436 |
+
"bcp_47": "swb",
|
10437 |
+
"speakers": 170720,
|
10438 |
+
"language_name": "Comorian",
|
10439 |
+
"autonym": "Comorian",
|
10440 |
+
"family": "Atlantic-Congo",
|
10441 |
+
"flores_path": null,
|
10442 |
+
"fleurs_tag": null,
|
10443 |
+
"commonvoice_hours": null,
|
10444 |
+
"commonvoice_locale": null,
|
10445 |
+
"in_benchmark": false,
|
10446 |
+
"task": null,
|
10447 |
+
"metric": null,
|
10448 |
+
"score": null,
|
10449 |
+
"model": null
|
10450 |
+
},
|
10451 |
+
{
|
10452 |
+
"bcp_47": "swg",
|
10453 |
+
"speakers": 801597,
|
10454 |
+
"language_name": "Swabian",
|
10455 |
+
"autonym": "Swabian",
|
10456 |
"family": "Indo-European",
|
10457 |
"flores_path": null,
|
10458 |
"fleurs_tag": null,
|
|
|
10555 |
"commonvoice_hours": 234.0,
|
10556 |
"commonvoice_locale": "ta",
|
10557 |
"in_benchmark": true,
|
10558 |
+
"task": "classification",
|
10559 |
+
"metric": "accuracy",
|
10560 |
+
"score": 0.43333333333333335,
|
10561 |
+
"model": 1.0
|
10562 |
+
},
|
10563 |
+
{
|
10564 |
+
"bcp_47": "ta",
|
10565 |
+
"speakers": 85616159,
|
10566 |
+
"language_name": "Tamil",
|
10567 |
+
"autonym": "தமிழ்",
|
10568 |
+
"family": "Dravidian",
|
10569 |
+
"flores_path": "tam_Taml",
|
10570 |
+
"fleurs_tag": "ta_in",
|
10571 |
+
"commonvoice_hours": 234.0,
|
10572 |
+
"commonvoice_locale": "ta",
|
10573 |
+
"in_benchmark": true,
|
10574 |
+
"task": "language_modeling",
|
10575 |
+
"metric": "chrf",
|
10576 |
+
"score": 0.9641464401452432,
|
10577 |
+
"model": 1.0
|
10578 |
+
},
|
10579 |
+
{
|
10580 |
+
"bcp_47": "ta",
|
10581 |
+
"speakers": 85616159,
|
10582 |
+
"language_name": "Tamil",
|
10583 |
+
"autonym": "தமிழ்",
|
10584 |
+
"family": "Dravidian",
|
10585 |
+
"flores_path": "tam_Taml",
|
10586 |
+
"fleurs_tag": "ta_in",
|
10587 |
+
"commonvoice_hours": 234.0,
|
10588 |
+
"commonvoice_locale": "ta",
|
10589 |
+
"in_benchmark": true,
|
10590 |
+
"task": "translation",
|
10591 |
+
"metric": "bleu",
|
10592 |
+
"score": 0.2528104486727614,
|
10593 |
+
"model": 1.0
|
10594 |
+
},
|
10595 |
+
{
|
10596 |
+
"bcp_47": "ta",
|
10597 |
+
"speakers": 85616159,
|
10598 |
+
"language_name": "Tamil",
|
10599 |
+
"autonym": "தமிழ்",
|
10600 |
+
"family": "Dravidian",
|
10601 |
+
"flores_path": "tam_Taml",
|
10602 |
+
"fleurs_tag": "ta_in",
|
10603 |
+
"commonvoice_hours": 234.0,
|
10604 |
+
"commonvoice_locale": "ta",
|
10605 |
+
"in_benchmark": true,
|
10606 |
+
"task": "translation",
|
10607 |
+
"metric": "chrf",
|
10608 |
+
"score": 0.42077045938882934,
|
10609 |
+
"model": 1.0
|
10610 |
},
|
10611 |
{
|
10612 |
"bcp_47": "taj",
|
|
|
10715 |
"commonvoice_hours": 0.3,
|
10716 |
"commonvoice_locale": "te",
|
10717 |
"in_benchmark": true,
|
10718 |
+
"task": "classification",
|
10719 |
+
"metric": "accuracy",
|
10720 |
+
"score": 0.36666666666666664,
|
10721 |
+
"model": 1.0
|
10722 |
+
},
|
10723 |
+
{
|
10724 |
+
"bcp_47": "te",
|
10725 |
+
"speakers": 95478480,
|
10726 |
+
"language_name": "Telugu",
|
10727 |
+
"autonym": "తెలుగు",
|
10728 |
+
"family": "Dravidian",
|
10729 |
+
"flores_path": "tel_Telu",
|
10730 |
+
"fleurs_tag": "te_in",
|
10731 |
+
"commonvoice_hours": 0.3,
|
10732 |
+
"commonvoice_locale": "te",
|
10733 |
+
"in_benchmark": true,
|
10734 |
+
"task": "language_modeling",
|
10735 |
+
"metric": "chrf",
|
10736 |
+
"score": 0.9513838296654142,
|
10737 |
+
"model": 1.0
|
10738 |
+
},
|
10739 |
+
{
|
10740 |
+
"bcp_47": "te",
|
10741 |
+
"speakers": 95478480,
|
10742 |
+
"language_name": "Telugu",
|
10743 |
+
"autonym": "తెలుగు",
|
10744 |
+
"family": "Dravidian",
|
10745 |
+
"flores_path": "tel_Telu",
|
10746 |
+
"fleurs_tag": "te_in",
|
10747 |
+
"commonvoice_hours": 0.3,
|
10748 |
+
"commonvoice_locale": "te",
|
10749 |
+
"in_benchmark": true,
|
10750 |
+
"task": "translation",
|
10751 |
+
"metric": "bleu",
|
10752 |
+
"score": 0.28338449781147135,
|
10753 |
+
"model": 1.0
|
10754 |
+
},
|
10755 |
+
{
|
10756 |
+
"bcp_47": "te",
|
10757 |
+
"speakers": 95478480,
|
10758 |
+
"language_name": "Telugu",
|
10759 |
+
"autonym": "తెలుగు",
|
10760 |
+
"family": "Dravidian",
|
10761 |
+
"flores_path": "tel_Telu",
|
10762 |
+
"fleurs_tag": "te_in",
|
10763 |
+
"commonvoice_hours": 0.3,
|
10764 |
+
"commonvoice_locale": "te",
|
10765 |
+
"in_benchmark": true,
|
10766 |
+
"task": "translation",
|
10767 |
+
"metric": "chrf",
|
10768 |
+
"score": 0.467003606031036,
|
10769 |
+
"model": 1.0
|
10770 |
},
|
10771 |
{
|
10772 |
"bcp_47": "tem",
|
|
|
11131 |
"commonvoice_hours": 128.0,
|
11132 |
"commonvoice_locale": "tr",
|
11133 |
"in_benchmark": true,
|
11134 |
+
"task": "classification",
|
11135 |
+
"metric": "accuracy",
|
11136 |
+
"score": 0.5333333333333333,
|
11137 |
+
"model": 1.0
|
11138 |
+
},
|
11139 |
+
{
|
11140 |
+
"bcp_47": "tr",
|
11141 |
+
"speakers": 80360704,
|
11142 |
+
"language_name": "Turkish",
|
11143 |
+
"autonym": "Türkçe",
|
11144 |
+
"family": "Turkic",
|
11145 |
+
"flores_path": "tur_Latn",
|
11146 |
+
"fleurs_tag": "tr_tr",
|
11147 |
+
"commonvoice_hours": 128.0,
|
11148 |
+
"commonvoice_locale": "tr",
|
11149 |
+
"in_benchmark": true,
|
11150 |
+
"task": "language_modeling",
|
11151 |
+
"metric": "chrf",
|
11152 |
+
"score": 0.9446670623712353,
|
11153 |
+
"model": 1.0
|
11154 |
+
},
|
11155 |
+
{
|
11156 |
+
"bcp_47": "tr",
|
11157 |
+
"speakers": 80360704,
|
11158 |
+
"language_name": "Turkish",
|
11159 |
+
"autonym": "Türkçe",
|
11160 |
+
"family": "Turkic",
|
11161 |
+
"flores_path": "tur_Latn",
|
11162 |
+
"fleurs_tag": "tr_tr",
|
11163 |
+
"commonvoice_hours": 128.0,
|
11164 |
+
"commonvoice_locale": "tr",
|
11165 |
+
"in_benchmark": true,
|
11166 |
+
"task": "translation",
|
11167 |
+
"metric": "bleu",
|
11168 |
+
"score": 0.2844596261435892,
|
11169 |
+
"model": 1.0
|
11170 |
+
},
|
11171 |
+
{
|
11172 |
+
"bcp_47": "tr",
|
11173 |
+
"speakers": 80360704,
|
11174 |
+
"language_name": "Turkish",
|
11175 |
+
"autonym": "Türkçe",
|
11176 |
+
"family": "Turkic",
|
11177 |
+
"flores_path": "tur_Latn",
|
11178 |
+
"fleurs_tag": "tr_tr",
|
11179 |
+
"commonvoice_hours": 128.0,
|
11180 |
+
"commonvoice_locale": "tr",
|
11181 |
+
"in_benchmark": true,
|
11182 |
+
"task": "translation",
|
11183 |
+
"metric": "chrf",
|
11184 |
+
"score": 0.4525478264239361,
|
11185 |
+
"model": 1.0
|
11186 |
},
|
11187 |
{
|
11188 |
"bcp_47": "tru",
|
|
|
11597 |
"in_benchmark": true,
|
11598 |
"task": "language_modeling",
|
11599 |
"metric": "chrf",
|
11600 |
+
"score": 0.9182703887696211,
|
11601 |
"model": 1.0
|
11602 |
},
|
11603 |
{
|
|
|
11613 |
"in_benchmark": true,
|
11614 |
"task": "translation",
|
11615 |
"metric": "bleu",
|
11616 |
+
"score": 0.2434522914619727,
|
11617 |
"model": 1.0
|
11618 |
},
|
11619 |
{
|
|
|
11723 |
"commonvoice_hours": 6.0,
|
11724 |
"commonvoice_locale": "vi",
|
11725 |
"in_benchmark": true,
|
11726 |
+
"task": "classification",
|
11727 |
+
"metric": "accuracy",
|
11728 |
+
"score": 0.6,
|
11729 |
+
"model": 1.0
|
11730 |
},
|
11731 |
{
|
11732 |
+
"bcp_47": "vi",
|
11733 |
+
"speakers": 86222962,
|
11734 |
+
"language_name": "Vietnamese",
|
11735 |
+
"autonym": "Tiếng Việt",
|
11736 |
+
"family": "Austroasiatic",
|
11737 |
+
"flores_path": "vie_Latn",
|
11738 |
+
"fleurs_tag": "vi_vn",
|
11739 |
+
"commonvoice_hours": 6.0,
|
11740 |
+
"commonvoice_locale": "vi",
|
11741 |
+
"in_benchmark": true,
|
11742 |
+
"task": "language_modeling",
|
11743 |
+
"metric": "chrf",
|
11744 |
+
"score": 0.9580044761495575,
|
11745 |
+
"model": 1.0
|
11746 |
},
|
11747 |
{
|
11748 |
+
"bcp_47": "vi",
|
11749 |
+
"speakers": 86222962,
|
11750 |
+
"language_name": "Vietnamese",
|
11751 |
+
"autonym": "Tiếng Việt",
|
11752 |
+
"family": "Austroasiatic",
|
11753 |
+
"flores_path": "vie_Latn",
|
11754 |
+
"fleurs_tag": "vi_vn",
|
11755 |
+
"commonvoice_hours": 6.0,
|
11756 |
+
"commonvoice_locale": "vi",
|
11757 |
+
"in_benchmark": true,
|
11758 |
+
"task": "translation",
|
11759 |
+
"metric": "bleu",
|
11760 |
+
"score": 0.25541664062319624,
|
11761 |
+
"model": 1.0
|
11762 |
+
},
|
11763 |
+
{
|
11764 |
+
"bcp_47": "vi",
|
11765 |
+
"speakers": 86222962,
|
11766 |
+
"language_name": "Vietnamese",
|
11767 |
+
"autonym": "Tiếng Việt",
|
11768 |
+
"family": "Austroasiatic",
|
11769 |
+
"flores_path": "vie_Latn",
|
11770 |
+
"fleurs_tag": "vi_vn",
|
11771 |
+
"commonvoice_hours": 6.0,
|
11772 |
+
"commonvoice_locale": "vi",
|
11773 |
+
"in_benchmark": true,
|
11774 |
+
"task": "translation",
|
11775 |
+
"metric": "chrf",
|
11776 |
+
"score": 0.43688984396841446,
|
11777 |
+
"model": 1.0
|
11778 |
+
},
|
11779 |
+
{
|
11780 |
+
"bcp_47": "vic",
|
11781 |
+
"speakers": 3113,
|
11782 |
+
"language_name": "Virgin Islands Creole English",
|
11783 |
+
"autonym": "Virgin Islands Creole English",
|
11784 |
+
"family": "Indo-European",
|
11785 |
+
"flores_path": null,
|
11786 |
+
"fleurs_tag": null,
|
11787 |
+
"commonvoice_hours": null,
|
11788 |
+
"commonvoice_locale": null,
|
11789 |
+
"in_benchmark": false,
|
11790 |
+
"task": null,
|
11791 |
+
"metric": null,
|
11792 |
+
"score": null,
|
11793 |
+
"model": null
|
11794 |
+
},
|
11795 |
+
{
|
11796 |
+
"bcp_47": "vls",
|
11797 |
+
"speakers": 1172070,
|
11798 |
+
"language_name": "West Flemish",
|
11799 |
+
"autonym": "West Flemish",
|
11800 |
+
"family": "Indo-European",
|
11801 |
+
"flores_path": null,
|
11802 |
+
"fleurs_tag": null,
|
11803 |
+
"commonvoice_hours": null,
|
11804 |
+
"commonvoice_locale": null,
|
11805 |
+
"in_benchmark": false,
|
11806 |
+
"task": null,
|
11807 |
+
"metric": null,
|
11808 |
+
"score": null,
|
11809 |
+
"model": null
|
11810 |
},
|
11811 |
{
|
11812 |
"bcp_47": "vmf",
|
|
|
12315 |
"commonvoice_hours": 203.0,
|
12316 |
"commonvoice_locale": "yue",
|
12317 |
"in_benchmark": true,
|
12318 |
+
"task": "classification",
|
12319 |
+
"metric": "accuracy",
|
12320 |
+
"score": 0.43333333333333335,
|
12321 |
+
"model": 1.0
|
12322 |
+
},
|
12323 |
+
{
|
12324 |
+
"bcp_47": "yue",
|
12325 |
+
"speakers": 79654759,
|
12326 |
+
"language_name": "Cantonese",
|
12327 |
+
"autonym": "粵語",
|
12328 |
+
"family": "Sino-Tibetan",
|
12329 |
+
"flores_path": "yue_Hant",
|
12330 |
+
"fleurs_tag": "yue_hant_hk",
|
12331 |
+
"commonvoice_hours": 203.0,
|
12332 |
+
"commonvoice_locale": "yue",
|
12333 |
+
"in_benchmark": true,
|
12334 |
+
"task": "language_modeling",
|
12335 |
+
"metric": "chrf",
|
12336 |
+
"score": 0.9022415223117748,
|
12337 |
+
"model": 1.0
|
12338 |
+
},
|
12339 |
+
{
|
12340 |
+
"bcp_47": "yue",
|
12341 |
+
"speakers": 79654759,
|
12342 |
+
"language_name": "Cantonese",
|
12343 |
+
"autonym": "粵語",
|
12344 |
+
"family": "Sino-Tibetan",
|
12345 |
+
"flores_path": "yue_Hant",
|
12346 |
+
"fleurs_tag": "yue_hant_hk",
|
12347 |
+
"commonvoice_hours": 203.0,
|
12348 |
+
"commonvoice_locale": "yue",
|
12349 |
+
"in_benchmark": true,
|
12350 |
+
"task": "translation",
|
12351 |
+
"metric": "bleu",
|
12352 |
+
"score": 0.22628178945118504,
|
12353 |
+
"model": 1.0
|
12354 |
+
},
|
12355 |
+
{
|
12356 |
+
"bcp_47": "yue",
|
12357 |
+
"speakers": 79654759,
|
12358 |
+
"language_name": "Cantonese",
|
12359 |
+
"autonym": "粵語",
|
12360 |
+
"family": "Sino-Tibetan",
|
12361 |
+
"flores_path": "yue_Hant",
|
12362 |
+
"fleurs_tag": "yue_hant_hk",
|
12363 |
+
"commonvoice_hours": 203.0,
|
12364 |
+
"commonvoice_locale": "yue",
|
12365 |
+
"in_benchmark": true,
|
12366 |
+
"task": "translation",
|
12367 |
+
"metric": "chrf",
|
12368 |
+
"score": 0.4052050858435178,
|
12369 |
+
"model": 1.0
|
12370 |
},
|
12371 |
{
|
12372 |
"bcp_47": "za",
|
|
|
12477 |
"in_benchmark": true,
|
12478 |
"task": "language_modeling",
|
12479 |
"metric": "chrf",
|
12480 |
+
"score": 0.862116462347859,
|
12481 |
"model": 12.0
|
12482 |
},
|
12483 |
{
|
|
|
12575 |
"bcp_47": "en",
|
12576 |
"task": "language_modeling",
|
12577 |
"metric": "chrf",
|
12578 |
+
"score": 0.9596433057062642,
|
12579 |
"sentence_nr": 14.5
|
12580 |
},
|
12581 |
{
|
|
|
12607 |
"bcp_47": "zh",
|
12608 |
"task": "language_modeling",
|
12609 |
"metric": "chrf",
|
12610 |
+
"score": 0.9120424742302929,
|
12611 |
"sentence_nr": 14.5
|
12612 |
},
|
12613 |
{
|
|
|
12639 |
"bcp_47": "en",
|
12640 |
"task": "language_modeling",
|
12641 |
"metric": "chrf",
|
12642 |
+
"score": 0.9854618933889567,
|
12643 |
"sentence_nr": 14.5
|
12644 |
},
|
12645 |
{
|
|
|
12671 |
"bcp_47": "zh",
|
12672 |
"task": "language_modeling",
|
12673 |
"metric": "chrf",
|
12674 |
+
"score": 0.93160311345022,
|
12675 |
"sentence_nr": 14.5
|
12676 |
},
|
12677 |
{
|
|
|
12703 |
"bcp_47": "en",
|
12704 |
"task": "language_modeling",
|
12705 |
"metric": "chrf",
|
12706 |
+
"score": 0.9840731165453181,
|
12707 |
"sentence_nr": 14.5
|
12708 |
},
|
12709 |
{
|
|
|
12735 |
"bcp_47": "zh",
|
12736 |
"task": "language_modeling",
|
12737 |
"metric": "chrf",
|
12738 |
+
"score": 0.9308727688438002,
|
12739 |
"sentence_nr": 14.5
|
12740 |
},
|
12741 |
{
|
|
|
12767 |
"bcp_47": "en",
|
12768 |
"task": "language_modeling",
|
12769 |
"metric": "chrf",
|
12770 |
+
"score": 0.9705999747171945,
|
12771 |
"sentence_nr": 14.5
|
12772 |
},
|
12773 |
{
|
|
|
12799 |
"bcp_47": "zh",
|
12800 |
"task": "language_modeling",
|
12801 |
"metric": "chrf",
|
12802 |
+
"score": 0.9098214011017126,
|
12803 |
"sentence_nr": 14.5
|
12804 |
},
|
12805 |
{
|
|
|
12831 |
"bcp_47": "en",
|
12832 |
"task": "language_modeling",
|
12833 |
"metric": "chrf",
|
12834 |
+
"score": 0.9802918604410554,
|
12835 |
"sentence_nr": 14.5
|
12836 |
},
|
12837 |
{
|
|
|
12863 |
"bcp_47": "zh",
|
12864 |
"task": "language_modeling",
|
12865 |
"metric": "chrf",
|
12866 |
+
"score": 0.9309062045243536,
|
12867 |
"sentence_nr": 14.5
|
12868 |
},
|
12869 |
{
|
|
|
12895 |
"bcp_47": "en",
|
12896 |
"task": "language_modeling",
|
12897 |
"metric": "chrf",
|
12898 |
+
"score": 0.9683113542489836,
|
12899 |
"sentence_nr": 14.5
|
12900 |
},
|
12901 |
{
|
|
|
12903 |
"bcp_47": "en",
|
12904 |
"task": "translation",
|
12905 |
"metric": "bleu",
|
12906 |
+
"score": 0.444507882217401,
|
12907 |
"sentence_nr": 14.5
|
12908 |
},
|
12909 |
{
|
|
|
12927 |
"bcp_47": "zh",
|
12928 |
"task": "language_modeling",
|
12929 |
"metric": "chrf",
|
12930 |
+
"score": 0.9233418215760759,
|
12931 |
"sentence_nr": 14.5
|
12932 |
},
|
12933 |
{
|
|
|
12959 |
"bcp_47": "ar",
|
12960 |
"task": "language_modeling",
|
12961 |
"metric": "chrf",
|
12962 |
+
"score": 0.9392314289764625,
|
12963 |
"sentence_nr": 14.5
|
12964 |
},
|
12965 |
{
|
|
|
12978 |
"score": 0.4684314458952127,
|
12979 |
"sentence_nr": 14.5
|
12980 |
},
|
12981 |
+
{
|
12982 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
12983 |
+
"bcp_47": "arz",
|
12984 |
+
"task": "classification",
|
12985 |
+
"metric": "accuracy",
|
12986 |
+
"score": 0.4,
|
12987 |
+
"sentence_nr": 14.5
|
12988 |
+
},
|
12989 |
+
{
|
12990 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
12991 |
+
"bcp_47": "arz",
|
12992 |
+
"task": "language_modeling",
|
12993 |
+
"metric": "chrf",
|
12994 |
+
"score": 0.930329195667362,
|
12995 |
+
"sentence_nr": 14.5
|
12996 |
+
},
|
12997 |
+
{
|
12998 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
12999 |
+
"bcp_47": "arz",
|
13000 |
+
"task": "translation",
|
13001 |
+
"metric": "bleu",
|
13002 |
+
"score": 0.19793415292805128,
|
13003 |
+
"sentence_nr": 14.5
|
13004 |
+
},
|
13005 |
+
{
|
13006 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13007 |
+
"bcp_47": "arz",
|
13008 |
+
"task": "translation",
|
13009 |
+
"metric": "chrf",
|
13010 |
+
"score": 0.3881278724939126,
|
13011 |
+
"sentence_nr": 14.5
|
13012 |
+
},
|
13013 |
{
|
13014 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13015 |
"bcp_47": "bn",
|
|
|
13023 |
"bcp_47": "bn",
|
13024 |
"task": "language_modeling",
|
13025 |
"metric": "chrf",
|
13026 |
+
"score": 0.9097658392566466,
|
13027 |
"sentence_nr": 14.5
|
13028 |
},
|
13029 |
{
|
|
|
13042 |
"score": 0.4076175886917154,
|
13043 |
"sentence_nr": 14.5
|
13044 |
},
|
13045 |
+
{
|
13046 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13047 |
+
"bcp_47": "de",
|
13048 |
+
"task": "classification",
|
13049 |
+
"metric": "accuracy",
|
13050 |
+
"score": 0.6666666666666666,
|
13051 |
+
"sentence_nr": 14.5
|
13052 |
+
},
|
13053 |
+
{
|
13054 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13055 |
+
"bcp_47": "de",
|
13056 |
+
"task": "language_modeling",
|
13057 |
+
"metric": "chrf",
|
13058 |
+
"score": 0.9594656177914042,
|
13059 |
+
"sentence_nr": 14.5
|
13060 |
+
},
|
13061 |
+
{
|
13062 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13063 |
+
"bcp_47": "de",
|
13064 |
+
"task": "translation",
|
13065 |
+
"metric": "bleu",
|
13066 |
+
"score": 0.3207642359472324,
|
13067 |
+
"sentence_nr": 14.5
|
13068 |
+
},
|
13069 |
+
{
|
13070 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13071 |
+
"bcp_47": "de",
|
13072 |
+
"task": "translation",
|
13073 |
+
"metric": "chrf",
|
13074 |
+
"score": 0.49973270743869647,
|
13075 |
+
"sentence_nr": 14.5
|
13076 |
+
},
|
13077 |
{
|
13078 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13079 |
"bcp_47": "en",
|
|
|
13087 |
"bcp_47": "en",
|
13088 |
"task": "language_modeling",
|
13089 |
"metric": "chrf",
|
13090 |
+
"score": 0.9810108607325073,
|
13091 |
"sentence_nr": 14.5
|
13092 |
},
|
13093 |
{
|
|
|
13119 |
"bcp_47": "es",
|
13120 |
"task": "language_modeling",
|
13121 |
"metric": "chrf",
|
13122 |
+
"score": 0.9569342865902168,
|
13123 |
"sentence_nr": 14.5
|
13124 |
},
|
13125 |
{
|
|
|
13140 |
},
|
13141 |
{
|
13142 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13143 |
+
"bcp_47": "fa",
|
13144 |
"task": "classification",
|
13145 |
"metric": "accuracy",
|
13146 |
+
"score": 0.4,
|
13147 |
"sentence_nr": 14.5
|
13148 |
},
|
13149 |
{
|
13150 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13151 |
+
"bcp_47": "fa",
|
13152 |
"task": "language_modeling",
|
13153 |
"metric": "chrf",
|
13154 |
+
"score": 0.9414698824984596,
|
13155 |
"sentence_nr": 14.5
|
13156 |
},
|
13157 |
{
|
13158 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13159 |
+
"bcp_47": "fa",
|
13160 |
"task": "translation",
|
13161 |
"metric": "bleu",
|
13162 |
+
"score": 0.26232478733341374,
|
13163 |
"sentence_nr": 14.5
|
13164 |
},
|
13165 |
{
|
13166 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13167 |
+
"bcp_47": "fa",
|
13168 |
"task": "translation",
|
13169 |
"metric": "chrf",
|
13170 |
+
"score": 0.44641220608314985,
|
13171 |
"sentence_nr": 14.5
|
13172 |
},
|
13173 |
{
|
13174 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13175 |
+
"bcp_47": "fil",
|
13176 |
"task": "classification",
|
13177 |
"metric": "accuracy",
|
13178 |
+
"score": 0.43333333333333335,
|
13179 |
"sentence_nr": 14.5
|
13180 |
},
|
13181 |
{
|
13182 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13183 |
+
"bcp_47": "fil",
|
13184 |
"task": "language_modeling",
|
13185 |
"metric": "chrf",
|
13186 |
+
"score": 0.9402707475255596,
|
13187 |
"sentence_nr": 14.5
|
13188 |
},
|
13189 |
{
|
13190 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13191 |
+
"bcp_47": "fil",
|
13192 |
"task": "translation",
|
13193 |
"metric": "bleu",
|
13194 |
+
"score": 0.29097818784870333,
|
13195 |
"sentence_nr": 14.5
|
13196 |
},
|
13197 |
{
|
13198 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13199 |
+
"bcp_47": "fil",
|
13200 |
"task": "translation",
|
13201 |
"metric": "chrf",
|
13202 |
+
"score": 0.44978114149245985,
|
13203 |
"sentence_nr": 14.5
|
13204 |
},
|
13205 |
{
|
13206 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13207 |
+
"bcp_47": "fr",
|
13208 |
"task": "classification",
|
13209 |
"metric": "accuracy",
|
13210 |
+
"score": 0.5333333333333333,
|
13211 |
"sentence_nr": 14.5
|
13212 |
},
|
13213 |
{
|
13214 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13215 |
+
"bcp_47": "fr",
|
13216 |
"task": "language_modeling",
|
13217 |
"metric": "chrf",
|
13218 |
+
"score": 0.9815706066541411,
|
13219 |
"sentence_nr": 14.5
|
13220 |
},
|
13221 |
{
|
13222 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13223 |
+
"bcp_47": "fr",
|
13224 |
"task": "translation",
|
13225 |
"metric": "bleu",
|
13226 |
+
"score": 0.3193235920661593,
|
13227 |
"sentence_nr": 14.5
|
13228 |
},
|
13229 |
{
|
13230 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13231 |
+
"bcp_47": "fr",
|
13232 |
"task": "translation",
|
13233 |
"metric": "chrf",
|
13234 |
+
"score": 0.4875691290722964,
|
13235 |
"sentence_nr": 14.5
|
13236 |
},
|
13237 |
{
|
13238 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13239 |
+
"bcp_47": "gu",
|
13240 |
"task": "classification",
|
13241 |
"metric": "accuracy",
|
13242 |
+
"score": 0.43333333333333335,
|
13243 |
"sentence_nr": 14.5
|
13244 |
},
|
13245 |
{
|
13246 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13247 |
+
"bcp_47": "gu",
|
13248 |
"task": "language_modeling",
|
13249 |
"metric": "chrf",
|
13250 |
+
"score": 0.938086045460355,
|
13251 |
"sentence_nr": 14.5
|
13252 |
},
|
13253 |
{
|
13254 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13255 |
+
"bcp_47": "gu",
|
13256 |
"task": "translation",
|
13257 |
"metric": "bleu",
|
13258 |
+
"score": 0.26442484966880464,
|
13259 |
"sentence_nr": 14.5
|
13260 |
},
|
13261 |
{
|
13262 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13263 |
+
"bcp_47": "gu",
|
13264 |
"task": "translation",
|
13265 |
"metric": "chrf",
|
13266 |
+
"score": 0.44452182973195975,
|
13267 |
"sentence_nr": 14.5
|
13268 |
},
|
13269 |
{
|
13270 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13271 |
+
"bcp_47": "hi",
|
13272 |
"task": "classification",
|
13273 |
"metric": "accuracy",
|
13274 |
+
"score": 0.5333333333333333,
|
13275 |
"sentence_nr": 14.5
|
13276 |
},
|
13277 |
{
|
13278 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13279 |
+
"bcp_47": "hi",
|
13280 |
"task": "language_modeling",
|
13281 |
"metric": "chrf",
|
13282 |
+
"score": 0.9428185393832219,
|
13283 |
"sentence_nr": 14.5
|
13284 |
},
|
13285 |
{
|
13286 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13287 |
+
"bcp_47": "hi",
|
13288 |
"task": "translation",
|
13289 |
"metric": "bleu",
|
13290 |
+
"score": 0.31956422674397006,
|
13291 |
"sentence_nr": 14.5
|
13292 |
},
|
13293 |
{
|
13294 |
"model": "meta-llama/llama-3.3-70b-instruct",
|
13295 |
+
"bcp_47": "hi",
|
13296 |
"task": "translation",
|
13297 |
"metric": "chrf",
|
13298 |
+
"score": 0.4896277852320754,
|
13299 |
+
"sentence_nr": 14.5
|
13300 |
+
},
|
13301 |
+
{
|
13302 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13303 |
+
"bcp_47": "id",
|
13304 |
+
"task": "classification",
|
13305 |
+
"metric": "accuracy",
|
13306 |
+
"score": 0.6333333333333333,
|
13307 |
+
"sentence_nr": 14.5
|
13308 |
+
},
|
13309 |
+
{
|
13310 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13311 |
+
"bcp_47": "id",
|
13312 |
+
"task": "language_modeling",
|
13313 |
+
"metric": "chrf",
|
13314 |
+
"score": 0.9598314474300775,
|
13315 |
+
"sentence_nr": 14.5
|
13316 |
+
},
|
13317 |
+
{
|
13318 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13319 |
+
"bcp_47": "id",
|
13320 |
+
"task": "translation",
|
13321 |
+
"metric": "bleu",
|
13322 |
+
"score": 0.29354203311552335,
|
13323 |
+
"sentence_nr": 14.5
|
13324 |
+
},
|
13325 |
+
{
|
13326 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13327 |
+
"bcp_47": "id",
|
13328 |
+
"task": "translation",
|
13329 |
+
"metric": "chrf",
|
13330 |
+
"score": 0.4723493656022861,
|
13331 |
+
"sentence_nr": 14.5
|
13332 |
+
},
|
13333 |
+
{
|
13334 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13335 |
+
"bcp_47": "it",
|
13336 |
+
"task": "classification",
|
13337 |
+
"metric": "accuracy",
|
13338 |
+
"score": 0.6666666666666666,
|
13339 |
+
"sentence_nr": 14.5
|
13340 |
+
},
|
13341 |
+
{
|
13342 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13343 |
+
"bcp_47": "it",
|
13344 |
+
"task": "language_modeling",
|
13345 |
+
"metric": "chrf",
|
13346 |
+
"score": 0.9439490413212892,
|
13347 |
+
"sentence_nr": 14.5
|
13348 |
+
},
|
13349 |
+
{
|
13350 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13351 |
+
"bcp_47": "it",
|
13352 |
+
"task": "translation",
|
13353 |
+
"metric": "bleu",
|
13354 |
+
"score": 0.28142583904826096,
|
13355 |
+
"sentence_nr": 14.5
|
13356 |
+
},
|
13357 |
+
{
|
13358 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13359 |
+
"bcp_47": "it",
|
13360 |
+
"task": "translation",
|
13361 |
+
"metric": "chrf",
|
13362 |
+
"score": 0.4707591889357925,
|
13363 |
+
"sentence_nr": 14.5
|
13364 |
+
},
|
13365 |
+
{
|
13366 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13367 |
+
"bcp_47": "ja",
|
13368 |
+
"task": "classification",
|
13369 |
+
"metric": "accuracy",
|
13370 |
+
"score": 0.6333333333333333,
|
13371 |
+
"sentence_nr": 14.5
|
13372 |
+
},
|
13373 |
+
{
|
13374 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13375 |
+
"bcp_47": "ja",
|
13376 |
+
"task": "language_modeling",
|
13377 |
+
"metric": "chrf",
|
13378 |
+
"score": 0.9371132855221468,
|
13379 |
+
"sentence_nr": 14.5
|
13380 |
+
},
|
13381 |
+
{
|
13382 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13383 |
+
"bcp_47": "ja",
|
13384 |
+
"task": "translation",
|
13385 |
+
"metric": "bleu",
|
13386 |
+
"score": 0.2723410893967824,
|
13387 |
+
"sentence_nr": 14.5
|
13388 |
+
},
|
13389 |
+
{
|
13390 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13391 |
+
"bcp_47": "ja",
|
13392 |
+
"task": "translation",
|
13393 |
+
"metric": "chrf",
|
13394 |
+
"score": 0.43929453749366865,
|
13395 |
+
"sentence_nr": 14.5
|
13396 |
+
},
|
13397 |
+
{
|
13398 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13399 |
+
"bcp_47": "jv",
|
13400 |
+
"task": "classification",
|
13401 |
+
"metric": "accuracy",
|
13402 |
+
"score": 0.4666666666666667,
|
13403 |
+
"sentence_nr": 14.5
|
13404 |
+
},
|
13405 |
+
{
|
13406 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13407 |
+
"bcp_47": "jv",
|
13408 |
+
"task": "language_modeling",
|
13409 |
+
"metric": "chrf",
|
13410 |
+
"score": 0.9298143194922116,
|
13411 |
+
"sentence_nr": 14.5
|
13412 |
+
},
|
13413 |
+
{
|
13414 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13415 |
+
"bcp_47": "jv",
|
13416 |
+
"task": "translation",
|
13417 |
+
"metric": "bleu",
|
13418 |
+
"score": 0.23729186537968905,
|
13419 |
+
"sentence_nr": 14.5
|
13420 |
+
},
|
13421 |
+
{
|
13422 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13423 |
+
"bcp_47": "jv",
|
13424 |
+
"task": "translation",
|
13425 |
+
"metric": "chrf",
|
13426 |
+
"score": 0.4198940727847352,
|
13427 |
+
"sentence_nr": 14.5
|
13428 |
+
},
|
13429 |
+
{
|
13430 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13431 |
+
"bcp_47": "ko",
|
13432 |
+
"task": "classification",
|
13433 |
+
"metric": "accuracy",
|
13434 |
+
"score": 0.5333333333333333,
|
13435 |
+
"sentence_nr": 14.5
|
13436 |
+
},
|
13437 |
+
{
|
13438 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13439 |
+
"bcp_47": "ko",
|
13440 |
+
"task": "language_modeling",
|
13441 |
+
"metric": "chrf",
|
13442 |
+
"score": 0.9355445912073929,
|
13443 |
+
"sentence_nr": 14.5
|
13444 |
+
},
|
13445 |
+
{
|
13446 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13447 |
+
"bcp_47": "ko",
|
13448 |
+
"task": "translation",
|
13449 |
+
"metric": "bleu",
|
13450 |
+
"score": 0.20332074778330964,
|
13451 |
+
"sentence_nr": 14.5
|
13452 |
+
},
|
13453 |
+
{
|
13454 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13455 |
+
"bcp_47": "ko",
|
13456 |
+
"task": "translation",
|
13457 |
+
"metric": "chrf",
|
13458 |
+
"score": 0.4005255477730261,
|
13459 |
+
"sentence_nr": 14.5
|
13460 |
+
},
|
13461 |
+
{
|
13462 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13463 |
+
"bcp_47": "mr",
|
13464 |
+
"task": "classification",
|
13465 |
+
"metric": "accuracy",
|
13466 |
+
"score": 0.6333333333333333,
|
13467 |
+
"sentence_nr": 14.5
|
13468 |
+
},
|
13469 |
+
{
|
13470 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13471 |
+
"bcp_47": "mr",
|
13472 |
+
"task": "language_modeling",
|
13473 |
+
"metric": "chrf",
|
13474 |
+
"score": 0.9440892312053646,
|
13475 |
+
"sentence_nr": 14.5
|
13476 |
+
},
|
13477 |
+
{
|
13478 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13479 |
+
"bcp_47": "mr",
|
13480 |
+
"task": "translation",
|
13481 |
+
"metric": "bleu",
|
13482 |
+
"score": 0.24903049799655144,
|
13483 |
+
"sentence_nr": 14.5
|
13484 |
+
},
|
13485 |
+
{
|
13486 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13487 |
+
"bcp_47": "mr",
|
13488 |
+
"task": "translation",
|
13489 |
+
"metric": "chrf",
|
13490 |
+
"score": 0.42489125861884175,
|
13491 |
+
"sentence_nr": 14.5
|
13492 |
+
},
|
13493 |
+
{
|
13494 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13495 |
+
"bcp_47": "pa",
|
13496 |
+
"task": "classification",
|
13497 |
+
"metric": "accuracy",
|
13498 |
+
"score": 0.4,
|
13499 |
+
"sentence_nr": 14.5
|
13500 |
+
},
|
13501 |
+
{
|
13502 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13503 |
+
"bcp_47": "pa",
|
13504 |
+
"task": "language_modeling",
|
13505 |
+
"metric": "chrf",
|
13506 |
+
"score": 0.9025298113664532,
|
13507 |
+
"sentence_nr": 14.5
|
13508 |
+
},
|
13509 |
+
{
|
13510 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13511 |
+
"bcp_47": "pa",
|
13512 |
+
"task": "translation",
|
13513 |
+
"metric": "bleu",
|
13514 |
+
"score": 0.3368333727390049,
|
13515 |
+
"sentence_nr": 14.5
|
13516 |
+
},
|
13517 |
+
{
|
13518 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13519 |
+
"bcp_47": "pa",
|
13520 |
+
"task": "translation",
|
13521 |
+
"metric": "chrf",
|
13522 |
+
"score": 0.4873541452250132,
|
13523 |
+
"sentence_nr": 14.5
|
13524 |
+
},
|
13525 |
+
{
|
13526 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13527 |
+
"bcp_47": "pt",
|
13528 |
+
"task": "classification",
|
13529 |
+
"metric": "accuracy",
|
13530 |
+
"score": 0.5,
|
13531 |
+
"sentence_nr": 14.5
|
13532 |
+
},
|
13533 |
+
{
|
13534 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13535 |
+
"bcp_47": "pt",
|
13536 |
+
"task": "language_modeling",
|
13537 |
+
"metric": "chrf",
|
13538 |
+
"score": 0.9641423549595803,
|
13539 |
+
"sentence_nr": 14.5
|
13540 |
+
},
|
13541 |
+
{
|
13542 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13543 |
+
"bcp_47": "pt",
|
13544 |
+
"task": "translation",
|
13545 |
+
"metric": "bleu",
|
13546 |
+
"score": 0.3110105331834714,
|
13547 |
+
"sentence_nr": 14.5
|
13548 |
+
},
|
13549 |
+
{
|
13550 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13551 |
+
"bcp_47": "pt",
|
13552 |
+
"task": "translation",
|
13553 |
+
"metric": "chrf",
|
13554 |
+
"score": 0.49172080600981716,
|
13555 |
+
"sentence_nr": 14.5
|
13556 |
+
},
|
13557 |
+
{
|
13558 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13559 |
+
"bcp_47": "ru",
|
13560 |
+
"task": "classification",
|
13561 |
+
"metric": "accuracy",
|
13562 |
+
"score": 0.5666666666666667,
|
13563 |
+
"sentence_nr": 14.5
|
13564 |
+
},
|
13565 |
+
{
|
13566 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13567 |
+
"bcp_47": "ru",
|
13568 |
+
"task": "language_modeling",
|
13569 |
+
"metric": "chrf",
|
13570 |
+
"score": 0.9663696817874857,
|
13571 |
+
"sentence_nr": 14.5
|
13572 |
+
},
|
13573 |
+
{
|
13574 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13575 |
+
"bcp_47": "ru",
|
13576 |
+
"task": "translation",
|
13577 |
+
"metric": "bleu",
|
13578 |
+
"score": 0.26015179309825326,
|
13579 |
+
"sentence_nr": 14.5
|
13580 |
+
},
|
13581 |
+
{
|
13582 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13583 |
+
"bcp_47": "ru",
|
13584 |
+
"task": "translation",
|
13585 |
+
"metric": "chrf",
|
13586 |
+
"score": 0.4525762744858351,
|
13587 |
+
"sentence_nr": 14.5
|
13588 |
+
},
|
13589 |
+
{
|
13590 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13591 |
+
"bcp_47": "sw",
|
13592 |
+
"task": "classification",
|
13593 |
+
"metric": "accuracy",
|
13594 |
+
"score": 0.5666666666666667,
|
13595 |
+
"sentence_nr": 14.5
|
13596 |
+
},
|
13597 |
+
{
|
13598 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13599 |
+
"bcp_47": "sw",
|
13600 |
+
"task": "language_modeling",
|
13601 |
+
"metric": "chrf",
|
13602 |
+
"score": 0.9401745263817055,
|
13603 |
+
"sentence_nr": 14.5
|
13604 |
+
},
|
13605 |
+
{
|
13606 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13607 |
+
"bcp_47": "sw",
|
13608 |
+
"task": "translation",
|
13609 |
+
"metric": "bleu",
|
13610 |
+
"score": 0.30022614000139736,
|
13611 |
+
"sentence_nr": 14.5
|
13612 |
+
},
|
13613 |
+
{
|
13614 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13615 |
+
"bcp_47": "sw",
|
13616 |
+
"task": "translation",
|
13617 |
+
"metric": "chrf",
|
13618 |
+
"score": 0.46620999112028233,
|
13619 |
+
"sentence_nr": 14.5
|
13620 |
+
},
|
13621 |
+
{
|
13622 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13623 |
+
"bcp_47": "ta",
|
13624 |
+
"task": "classification",
|
13625 |
+
"metric": "accuracy",
|
13626 |
+
"score": 0.43333333333333335,
|
13627 |
+
"sentence_nr": 14.5
|
13628 |
+
},
|
13629 |
+
{
|
13630 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13631 |
+
"bcp_47": "ta",
|
13632 |
+
"task": "language_modeling",
|
13633 |
+
"metric": "chrf",
|
13634 |
+
"score": 0.9641464401452432,
|
13635 |
+
"sentence_nr": 14.5
|
13636 |
+
},
|
13637 |
+
{
|
13638 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13639 |
+
"bcp_47": "ta",
|
13640 |
+
"task": "translation",
|
13641 |
+
"metric": "bleu",
|
13642 |
+
"score": 0.2528104486727614,
|
13643 |
+
"sentence_nr": 14.5
|
13644 |
+
},
|
13645 |
+
{
|
13646 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13647 |
+
"bcp_47": "ta",
|
13648 |
+
"task": "translation",
|
13649 |
+
"metric": "chrf",
|
13650 |
+
"score": 0.42077045938882934,
|
13651 |
+
"sentence_nr": 14.5
|
13652 |
+
},
|
13653 |
+
{
|
13654 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13655 |
+
"bcp_47": "te",
|
13656 |
+
"task": "classification",
|
13657 |
+
"metric": "accuracy",
|
13658 |
+
"score": 0.36666666666666664,
|
13659 |
+
"sentence_nr": 14.5
|
13660 |
+
},
|
13661 |
+
{
|
13662 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13663 |
+
"bcp_47": "te",
|
13664 |
+
"task": "language_modeling",
|
13665 |
+
"metric": "chrf",
|
13666 |
+
"score": 0.9513838296654142,
|
13667 |
+
"sentence_nr": 14.5
|
13668 |
+
},
|
13669 |
+
{
|
13670 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13671 |
+
"bcp_47": "te",
|
13672 |
+
"task": "translation",
|
13673 |
+
"metric": "bleu",
|
13674 |
+
"score": 0.28338449781147135,
|
13675 |
+
"sentence_nr": 14.5
|
13676 |
+
},
|
13677 |
+
{
|
13678 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13679 |
+
"bcp_47": "te",
|
13680 |
+
"task": "translation",
|
13681 |
+
"metric": "chrf",
|
13682 |
+
"score": 0.467003606031036,
|
13683 |
+
"sentence_nr": 14.5
|
13684 |
+
},
|
13685 |
+
{
|
13686 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13687 |
+
"bcp_47": "tr",
|
13688 |
+
"task": "classification",
|
13689 |
+
"metric": "accuracy",
|
13690 |
+
"score": 0.5333333333333333,
|
13691 |
+
"sentence_nr": 14.5
|
13692 |
+
},
|
13693 |
+
{
|
13694 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13695 |
+
"bcp_47": "tr",
|
13696 |
+
"task": "language_modeling",
|
13697 |
+
"metric": "chrf",
|
13698 |
+
"score": 0.9446670623712353,
|
13699 |
+
"sentence_nr": 14.5
|
13700 |
+
},
|
13701 |
+
{
|
13702 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13703 |
+
"bcp_47": "tr",
|
13704 |
+
"task": "translation",
|
13705 |
+
"metric": "bleu",
|
13706 |
+
"score": 0.2844596261435892,
|
13707 |
+
"sentence_nr": 14.5
|
13708 |
+
},
|
13709 |
+
{
|
13710 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13711 |
+
"bcp_47": "tr",
|
13712 |
+
"task": "translation",
|
13713 |
+
"metric": "chrf",
|
13714 |
+
"score": 0.4525478264239361,
|
13715 |
+
"sentence_nr": 14.5
|
13716 |
+
},
|
13717 |
+
{
|
13718 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13719 |
+
"bcp_47": "ur",
|
13720 |
+
"task": "classification",
|
13721 |
+
"metric": "accuracy",
|
13722 |
+
"score": 0.5,
|
13723 |
+
"sentence_nr": 14.5
|
13724 |
+
},
|
13725 |
+
{
|
13726 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13727 |
+
"bcp_47": "ur",
|
13728 |
+
"task": "language_modeling",
|
13729 |
+
"metric": "chrf",
|
13730 |
+
"score": 0.9182703887696211,
|
13731 |
+
"sentence_nr": 14.5
|
13732 |
+
},
|
13733 |
+
{
|
13734 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13735 |
+
"bcp_47": "ur",
|
13736 |
+
"task": "translation",
|
13737 |
+
"metric": "bleu",
|
13738 |
+
"score": 0.2434522914619727,
|
13739 |
+
"sentence_nr": 14.5
|
13740 |
+
},
|
13741 |
+
{
|
13742 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13743 |
+
"bcp_47": "ur",
|
13744 |
+
"task": "translation",
|
13745 |
+
"metric": "chrf",
|
13746 |
+
"score": 0.42196914378741973,
|
13747 |
+
"sentence_nr": 14.5
|
13748 |
+
},
|
13749 |
+
{
|
13750 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13751 |
+
"bcp_47": "vi",
|
13752 |
+
"task": "classification",
|
13753 |
+
"metric": "accuracy",
|
13754 |
+
"score": 0.6,
|
13755 |
+
"sentence_nr": 14.5
|
13756 |
+
},
|
13757 |
+
{
|
13758 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13759 |
+
"bcp_47": "vi",
|
13760 |
+
"task": "language_modeling",
|
13761 |
+
"metric": "chrf",
|
13762 |
+
"score": 0.9580044761495575,
|
13763 |
+
"sentence_nr": 14.5
|
13764 |
+
},
|
13765 |
+
{
|
13766 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13767 |
+
"bcp_47": "vi",
|
13768 |
+
"task": "translation",
|
13769 |
+
"metric": "bleu",
|
13770 |
+
"score": 0.25541664062319624,
|
13771 |
+
"sentence_nr": 14.5
|
13772 |
+
},
|
13773 |
+
{
|
13774 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13775 |
+
"bcp_47": "vi",
|
13776 |
+
"task": "translation",
|
13777 |
+
"metric": "chrf",
|
13778 |
+
"score": 0.43688984396841446,
|
13779 |
+
"sentence_nr": 14.5
|
13780 |
+
},
|
13781 |
+
{
|
13782 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13783 |
+
"bcp_47": "yue",
|
13784 |
+
"task": "classification",
|
13785 |
+
"metric": "accuracy",
|
13786 |
+
"score": 0.43333333333333335,
|
13787 |
+
"sentence_nr": 14.5
|
13788 |
+
},
|
13789 |
+
{
|
13790 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13791 |
+
"bcp_47": "yue",
|
13792 |
+
"task": "language_modeling",
|
13793 |
+
"metric": "chrf",
|
13794 |
+
"score": 0.9022415223117748,
|
13795 |
+
"sentence_nr": 14.5
|
13796 |
+
},
|
13797 |
+
{
|
13798 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13799 |
+
"bcp_47": "yue",
|
13800 |
+
"task": "translation",
|
13801 |
+
"metric": "bleu",
|
13802 |
+
"score": 0.22628178945118504,
|
13803 |
+
"sentence_nr": 14.5
|
13804 |
+
},
|
13805 |
+
{
|
13806 |
+
"model": "meta-llama/llama-3.3-70b-instruct",
|
13807 |
+
"bcp_47": "yue",
|
13808 |
+
"task": "translation",
|
13809 |
+
"metric": "chrf",
|
13810 |
+
"score": 0.4052050858435178,
|
13811 |
"sentence_nr": 14.5
|
13812 |
},
|
13813 |
{
|
|
|
13823 |
"bcp_47": "zh",
|
13824 |
"task": "language_modeling",
|
13825 |
"metric": "chrf",
|
13826 |
+
"score": 0.9003842558834025,
|
13827 |
"sentence_nr": 14.5
|
13828 |
},
|
13829 |
{
|
|
|
13855 |
"bcp_47": "en",
|
13856 |
"task": "language_modeling",
|
13857 |
"metric": "chrf",
|
13858 |
+
"score": 0.9312514772455793,
|
13859 |
"sentence_nr": 14.5
|
13860 |
},
|
13861 |
{
|
|
|
13887 |
"bcp_47": "zh",
|
13888 |
"task": "language_modeling",
|
13889 |
"metric": "chrf",
|
13890 |
+
"score": 0.831019102021034,
|
13891 |
"sentence_nr": 14.5
|
13892 |
},
|
13893 |
{
|
|
|
13919 |
"bcp_47": "en",
|
13920 |
"task": "language_modeling",
|
13921 |
"metric": "chrf",
|
13922 |
+
"score": 0.9126664788853867,
|
13923 |
"sentence_nr": 14.5
|
13924 |
},
|
13925 |
{
|
|
|
13951 |
"bcp_47": "zh",
|
13952 |
"task": "language_modeling",
|
13953 |
"metric": "chrf",
|
13954 |
+
"score": 0.8098290899553928,
|
13955 |
"sentence_nr": 14.5
|
13956 |
},
|
13957 |
{
|
|
|
13983 |
"bcp_47": "en",
|
13984 |
"task": "language_modeling",
|
13985 |
"metric": "chrf",
|
13986 |
+
"score": 0.8397325387031247,
|
13987 |
"sentence_nr": 14.5
|
13988 |
},
|
13989 |
{
|
|
|
14015 |
"bcp_47": "zh",
|
14016 |
"task": "language_modeling",
|
14017 |
"metric": "chrf",
|
14018 |
+
"score": 0.9167475699419941,
|
14019 |
"sentence_nr": 14.5
|
14020 |
},
|
14021 |
{
|
|
|
14047 |
"bcp_47": "en",
|
14048 |
"task": "language_modeling",
|
14049 |
"metric": "chrf",
|
14050 |
+
"score": 0.9807297060840695,
|
14051 |
"sentence_nr": 14.5
|
14052 |
},
|
14053 |
{
|
|
|
14079 |
"bcp_47": "zh",
|
14080 |
"task": "language_modeling",
|
14081 |
"metric": "chrf",
|
14082 |
+
"score": 0.9313441068235117,
|
14083 |
"sentence_nr": 14.5
|
14084 |
},
|
14085 |
{
|
|
|
14111 |
"bcp_47": "en",
|
14112 |
"task": "language_modeling",
|
14113 |
"metric": "chrf",
|
14114 |
+
"score": 0.5225508930892153,
|
14115 |
"sentence_nr": 14.5
|
14116 |
},
|
14117 |
{
|
|
|
14143 |
"bcp_47": "zh",
|
14144 |
"task": "language_modeling",
|
14145 |
"metric": "chrf",
|
14146 |
+
"score": 0.4174856398225174,
|
14147 |
"sentence_nr": 14.5
|
14148 |
},
|
14149 |
{
|