David Pomerenke committed on
Commit
eaf2d97
·
1 Parent(s): 7cdde63

spBLEU tokenizer, run on more languages

Browse files
bibliography.bib CHANGED
@@ -209,6 +209,22 @@
209
  keywords = {dataset,n=200}
210
  }
211
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
212
  @inproceedings{robinsonChatGPTMTCompetitive2023,
213
  title = {{{ChatGPT MT}}: {{Competitive}} for {{High-}} (but {{Not Low-}}) {{Resource Languages}}},
214
  shorttitle = {{{ChatGPT MT}}},
 
209
  keywords = {dataset,n=200}
210
  }
211
 
212
+ @misc{petrovLanguageModelTokenizers2023,
213
+ title = {Language {{Model Tokenizers Introduce Unfairness Between Languages}}},
214
+ author = {Petrov, Aleksandar and Malfa, Emanuele La and Torr, Philip H. S. and Bibi, Adel},
215
+ year = {2023},
216
+ month = oct,
217
+ number = {arXiv:2305.15425},
218
+ eprint = {2305.15425},
219
+ primaryclass = {cs},
220
+ publisher = {arXiv},
221
+ doi = {10.48550/arXiv.2305.15425},
222
+ urldate = {2025-03-24},
223
+ abstract = {Recent language models have shown impressive multilingual performance, even when not explicitly trained for it. Despite this, there are concerns about the quality of their outputs across different languages. In this paper, we show how disparity in the treatment of different languages arises at the tokenization stage, well before a model is even invoked. The same text translated into different languages can have drastically different tokenization lengths, with differences up to 15 times in some cases. These disparities persist even for tokenizers that are intentionally trained for multilingual support. Character-level and byte-level models also exhibit over 4 times the difference in the encoding length for some language pairs. This induces unfair treatment for some language communities in regard to the cost of accessing commercial language services, the processing time and latency, as well as the amount of content that can be provided as context to the models. Therefore, we make the case that we should train future language models using multilingually fair subword tokenizers.},
224
+ archiveprefix = {arXiv},
225
+ file = {/Users/david/Zotero/storage/NX3DT98Z/Petrov et al. - 2023 - Language Model Tokenizers Introduce Unfairness Between Languages.pdf;/Users/david/Zotero/storage/FKJQP22D/2305.html}
226
+ }
227
+
228
  @inproceedings{robinsonChatGPTMTCompetitive2023,
229
  title = {{{ChatGPT MT}}: {{Competitive}} for {{High-}} (but {{Not Low-}}) {{Resource Languages}}},
230
  shorttitle = {{{ChatGPT MT}}},
data/INFO CHANGED
@@ -2,4 +2,4 @@ fleurs: https://huggingface.co/datasets/google/fleurs via eval.py
2
  floresp-v2.0-rc.3: https://github.com/openlanguagedata/flores
3
  glottolog_languoid.csv: https://glottolog.org/meta/downloads
4
  ScriptCodes.csv: https://www.unicode.org/iso15924/iso15924-codes.html
5
- spbleu: https://github.com/facebookresearch/flores/tree/main
 
2
  floresp-v2.0-rc.3: https://github.com/openlanguagedata/flores
3
  glottolog_languoid.csv: https://glottolog.org/meta/downloads
4
  ScriptCodes.csv: https://www.unicode.org/iso15924/iso15924-codes.html
5
+ spbleu: https://github.com/facebookresearch/flores/tree/main/flores200#spm-and-dictionary
evals/main.py CHANGED
@@ -13,7 +13,7 @@ from tqdm.asyncio import tqdm_asyncio
13
  # ===== config =====
14
 
15
  n_sentences = 30
16
- langs_eval = languages.iloc[:10]
17
  langs_eval_detailed = languages.iloc[:2]
18
  transcription_langs_eval = languages.iloc[:10]
19
  transcription_langs_eval_detailed = languages.iloc[:5]
 
13
  # ===== config =====
14
 
15
  n_sentences = 30
16
+ langs_eval = languages.iloc[:30]
17
  langs_eval_detailed = languages.iloc[:2]
18
  transcription_langs_eval = languages.iloc[:10]
19
  transcription_langs_eval_detailed = languages.iloc[:5]
evals/tasks.py CHANGED
@@ -3,16 +3,16 @@ import random
3
  import evaluate
4
  import pandas as pd
5
  from joblib.memory import Memory
6
- from transformers import NllbTokenizer
7
  from languages import languages, script_name
8
  from datasets_.flores import flores_sentences
9
  from models import complete, transcribe
 
 
10
  cache = Memory(location=".cache", verbose=0).cache
11
  bleu = evaluate.load("bleu")
12
  chrf = evaluate.load("chrf")
13
  wer = evaluate.load("wer")
14
- tokenizer = NllbTokenizer.from_pretrained("facebook/nllb-200-distilled-600M")
15
-
16
 
17
  # sample languages to translate to
18
  target_languages = languages[languages["in_benchmark"]].sample(
 
3
  import evaluate
4
  import pandas as pd
5
  from joblib.memory import Memory
 
6
  from languages import languages, script_name
7
  from datasets_.flores import flores_sentences
8
  from models import complete, transcribe
9
+ import sentencepiece as spm
10
+
11
  cache = Memory(location=".cache", verbose=0).cache
12
  bleu = evaluate.load("bleu")
13
  chrf = evaluate.load("chrf")
14
  wer = evaluate.load("wer")
15
+ tokenizer = spm.SentencePieceProcessor(model_file="data/spbleu/flores200_sacrebleu_tokenizer_spm.model")
 
16
 
17
  # sample languages to translate to
18
  target_languages = languages[languages["in_benchmark"]].sample(
frontend/public/{LICENSE → INFO} RENAMED
File without changes
frontend/public/results.json CHANGED
@@ -26,7 +26,7 @@
26
  "license": null,
27
  "average": 0.66,
28
  "classification_accuracy": 0.73,
29
- "language_modeling_chrf": 0.97,
30
  "translation_bleu": 0.4,
31
  "translation_chrf": 0.54
32
  },
@@ -39,9 +39,9 @@
39
  "size": 27432406640.0,
40
  "type": "Open",
41
  "license": "Gemma",
42
- "average": 0.65,
43
  "classification_accuracy": 0.72,
44
- "language_modeling_chrf": 0.96,
45
  "translation_bleu": 0.37,
46
  "translation_chrf": 0.54
47
  },
@@ -54,41 +54,41 @@
54
  "size": 70553706496.0,
55
  "type": "Open",
56
  "license": "Llama3.1",
57
- "average": 0.62,
58
  "classification_accuracy": 0.57,
59
- "language_modeling_chrf": 0.92,
60
  "translation_bleu": 0.43,
61
  "translation_chrf": 0.57
62
  },
63
  {
64
  "rank": 5,
65
- "provider": "Amazon",
66
- "model": "Nova Micro V1",
67
  "hf_id": null,
68
  "creation_date": null,
69
  "size": null,
70
  "type": "Commercial",
71
  "license": null,
72
  "average": 0.61,
73
- "classification_accuracy": 0.52,
74
- "language_modeling_chrf": 0.94,
75
- "translation_bleu": 0.4,
76
- "translation_chrf": 0.56
77
  },
78
  {
79
  "rank": 6,
80
- "provider": "Meta Llama",
81
- "model": "Llama 3 70b Instruct",
82
  "hf_id": null,
83
  "creation_date": null,
84
  "size": null,
85
  "type": "Commercial",
86
  "license": null,
87
- "average": 0.61,
88
- "classification_accuracy": 0.8,
89
- "language_modeling_chrf": 0.95,
90
- "translation_bleu": 0.25,
91
- "translation_chrf": 0.43
92
  },
93
  {
94
  "rank": 7,
@@ -101,7 +101,7 @@
101
  "license": null,
102
  "average": 0.6,
103
  "classification_accuracy": 0.52,
104
- "language_modeling_chrf": 0.95,
105
  "translation_bleu": 0.39,
106
  "translation_chrf": 0.55
107
  },
@@ -116,7 +116,7 @@
116
  "license": "Apache 2.0",
117
  "average": 0.58,
118
  "classification_accuracy": 0.55,
119
- "language_modeling_chrf": 0.86,
120
  "translation_bleu": 0.38,
121
  "translation_chrf": 0.52
122
  },
@@ -129,11 +129,11 @@
129
  "size": 70553706496.0,
130
  "type": "Open",
131
  "license": "Llama3.3",
132
- "average": 0.56,
133
- "classification_accuracy": 0.5,
134
  "language_modeling_chrf": 0.94,
135
- "translation_bleu": 0.31,
136
- "translation_chrf": 0.48
137
  },
138
  {
139
  "rank": 10,
@@ -144,9 +144,9 @@
144
  "size": null,
145
  "type": "Commercial",
146
  "license": null,
147
- "average": 0.55,
148
  "classification_accuracy": 0.5,
149
- "language_modeling_chrf": 0.88,
150
  "translation_bleu": 0.32,
151
  "translation_chrf": 0.49
152
  },
@@ -161,7 +161,7 @@
161
  "license": "Mit",
162
  "average": 0.52,
163
  "classification_accuracy": 0.42,
164
- "language_modeling_chrf": 0.87,
165
  "translation_bleu": 0.32,
166
  "translation_chrf": 0.46
167
  },
@@ -176,7 +176,7 @@
176
  "license": "Apache 2.0",
177
  "average": 0.25,
178
  "classification_accuracy": 0.0,
179
- "language_modeling_chrf": 0.48,
180
  "translation_bleu": 0.21,
181
  "translation_chrf": 0.3
182
  }
@@ -220,7 +220,7 @@
220
  "in_benchmark": true,
221
  "NaN": 0.0,
222
  "classification_accuracy": 0.53,
223
- "language_modeling_chrf": 0.95,
224
  "translation_bleu": 0.32,
225
  "translation_chrf": 0.49
226
  },
@@ -248,7 +248,7 @@
248
  "in_benchmark": true,
249
  "NaN": 0.0,
250
  "classification_accuracy": 0.43,
251
- "language_modeling_chrf": 0.93,
252
  "translation_bleu": 0.28,
253
  "translation_chrf": 0.47
254
  },
@@ -262,7 +262,7 @@
262
  "in_benchmark": true,
263
  "NaN": 0.0,
264
  "classification_accuracy": 0.5,
265
- "language_modeling_chrf": 0.93,
266
  "translation_bleu": 0.24,
267
  "translation_chrf": 0.42
268
  },
@@ -290,7 +290,7 @@
290
  "in_benchmark": true,
291
  "NaN": 0.0,
292
  "classification_accuracy": 0.4,
293
- "language_modeling_chrf": 0.9,
294
  "translation_bleu": 0.2,
295
  "translation_chrf": 0.41
296
  },
@@ -300,11 +300,11 @@
300
  "autonym": "Português",
301
  "speakers": 237496885,
302
  "family": "Indo-European",
303
- "average": 0.46,
304
  "in_benchmark": true,
305
  "NaN": 0.0,
306
  "classification_accuracy": 0.5,
307
- "language_modeling_chrf": 0.97,
308
  "translation_bleu": 0.31,
309
  "translation_chrf": 0.49
310
  },
@@ -314,11 +314,11 @@
314
  "autonym": "ਪੰਜਾਬੀ",
315
  "speakers": 203571210,
316
  "family": "Indo-European",
317
- "average": 0.42,
318
  "in_benchmark": true,
319
  "NaN": 0.0,
320
  "classification_accuracy": 0.4,
321
- "language_modeling_chrf": 0.87,
322
  "translation_bleu": 0.34,
323
  "translation_chrf": 0.49
324
  },
@@ -328,13 +328,13 @@
328
  "autonym": "Русский",
329
  "speakers": 195841151,
330
  "family": "Indo-European",
331
- "average": 0.0,
332
  "in_benchmark": true,
333
  "NaN": 0.0,
334
- "classification_accuracy": 0.0,
335
- "language_modeling_chrf": 0.0,
336
- "translation_bleu": 0.0,
337
- "translation_chrf": 0.0
338
  },
339
  {
340
  "bcp_47": "sw",
@@ -342,13 +342,13 @@
342
  "autonym": "Kiswahili",
343
  "speakers": 171610296,
344
  "family": "Atlantic-Congo",
345
- "average": 0.0,
346
  "in_benchmark": true,
347
  "NaN": 0.0,
348
- "classification_accuracy": 0.0,
349
- "language_modeling_chrf": 0.0,
350
- "translation_bleu": 0.0,
351
- "translation_chrf": 0.0
352
  },
353
  {
354
  "bcp_47": "id",
@@ -356,13 +356,13 @@
356
  "autonym": "Bahasa Indonesia",
357
  "speakers": 171207687,
358
  "family": "Austronesian",
359
- "average": 0.0,
360
  "in_benchmark": true,
361
  "NaN": 0.0,
362
- "classification_accuracy": 0.0,
363
- "language_modeling_chrf": 0.0,
364
- "translation_bleu": 0.0,
365
- "translation_chrf": 0.0
366
  },
367
  {
368
  "bcp_47": "de",
@@ -370,13 +370,13 @@
370
  "autonym": "Deutsch",
371
  "speakers": 136350226,
372
  "family": "Indo-European",
373
- "average": 0.0,
374
  "in_benchmark": true,
375
  "NaN": 0.0,
376
- "classification_accuracy": 0.0,
377
- "language_modeling_chrf": 0.0,
378
- "translation_bleu": 0.0,
379
- "translation_chrf": 0.0
380
  },
381
  {
382
  "bcp_47": "ja",
@@ -384,13 +384,13 @@
384
  "autonym": "日本語",
385
  "speakers": 119729026,
386
  "family": "Japonic",
387
- "average": 0.0,
388
  "in_benchmark": true,
389
  "NaN": 0.0,
390
- "classification_accuracy": 0.0,
391
- "language_modeling_chrf": 0.0,
392
- "translation_bleu": 0.0,
393
- "translation_chrf": 0.0
394
  },
395
  {
396
  "bcp_47": "te",
@@ -398,13 +398,13 @@
398
  "autonym": "తెలుగు",
399
  "speakers": 95478480,
400
  "family": "Dravidian",
401
- "average": 0.0,
402
  "in_benchmark": true,
403
  "NaN": 0.0,
404
- "classification_accuracy": 0.0,
405
- "language_modeling_chrf": 0.0,
406
- "translation_bleu": 0.0,
407
- "translation_chrf": 0.0
408
  },
409
  {
410
  "bcp_47": "lah",
@@ -426,13 +426,13 @@
426
  "autonym": "मराठी",
427
  "speakers": 92826300,
428
  "family": "Indo-European",
429
- "average": 0.0,
430
  "in_benchmark": true,
431
  "NaN": 0.0,
432
- "classification_accuracy": 0.0,
433
- "language_modeling_chrf": 0.0,
434
- "translation_bleu": 0.0,
435
- "translation_chrf": 0.0
436
  },
437
  {
438
  "bcp_47": "jv",
@@ -440,13 +440,13 @@
440
  "autonym": "Jawa",
441
  "speakers": 91180665,
442
  "family": "Austronesian",
443
- "average": 0.0,
444
  "in_benchmark": true,
445
  "NaN": 0.0,
446
- "classification_accuracy": 0.0,
447
- "language_modeling_chrf": 0.0,
448
- "translation_bleu": 0.0,
449
- "translation_chrf": 0.0
450
  },
451
  {
452
  "bcp_47": "vi",
@@ -454,13 +454,13 @@
454
  "autonym": "Tiếng Việt",
455
  "speakers": 86222962,
456
  "family": "Austroasiatic",
457
- "average": 0.0,
458
  "in_benchmark": true,
459
  "NaN": 0.0,
460
- "classification_accuracy": 0.0,
461
- "language_modeling_chrf": 0.0,
462
- "translation_bleu": 0.0,
463
- "translation_chrf": 0.0
464
  },
465
  {
466
  "bcp_47": "ta",
@@ -468,13 +468,13 @@
468
  "autonym": "தமிழ்",
469
  "speakers": 85616159,
470
  "family": "Dravidian",
471
- "average": 0.0,
472
  "in_benchmark": true,
473
  "NaN": 0.0,
474
- "classification_accuracy": 0.0,
475
- "language_modeling_chrf": 0.0,
476
- "translation_bleu": 0.0,
477
- "translation_chrf": 0.0
478
  },
479
  {
480
  "bcp_47": "fa",
@@ -482,13 +482,13 @@
482
  "autonym": "فارسی",
483
  "speakers": 84710459,
484
  "family": "Indo-European",
485
- "average": 0.0,
486
  "in_benchmark": true,
487
  "NaN": 0.0,
488
- "classification_accuracy": 0.0,
489
- "language_modeling_chrf": 0.0,
490
- "translation_bleu": 0.0,
491
- "translation_chrf": 0.0
492
  },
493
  {
494
  "bcp_47": "wuu",
@@ -510,13 +510,13 @@
510
  "autonym": "Türkçe",
511
  "speakers": 80360704,
512
  "family": "Turkic",
513
- "average": 0.0,
514
  "in_benchmark": true,
515
  "NaN": 0.0,
516
- "classification_accuracy": 0.0,
517
- "language_modeling_chrf": 0.0,
518
- "translation_bleu": 0.0,
519
- "translation_chrf": 0.0
520
  },
521
  {
522
  "bcp_47": "yue",
@@ -524,13 +524,13 @@
524
  "autonym": "粵語",
525
  "speakers": 79654759,
526
  "family": "Sino-Tibetan",
527
- "average": 0.0,
528
  "in_benchmark": true,
529
  "NaN": 0.0,
530
- "classification_accuracy": 0.0,
531
- "language_modeling_chrf": 0.0,
532
- "translation_bleu": 0.0,
533
- "translation_chrf": 0.0
534
  },
535
  {
536
  "bcp_47": "ko",
@@ -538,13 +538,13 @@
538
  "autonym": "한국어",
539
  "speakers": 78357046,
540
  "family": "Koreanic",
541
- "average": 0.0,
542
  "in_benchmark": true,
543
  "NaN": 0.0,
544
- "classification_accuracy": 0.0,
545
- "language_modeling_chrf": 0.0,
546
- "translation_bleu": 0.0,
547
- "translation_chrf": 0.0
548
  },
549
  {
550
  "bcp_47": "it",
@@ -552,13 +552,13 @@
552
  "autonym": "Italiano",
553
  "speakers": 70247060,
554
  "family": "Indo-European",
555
- "average": 0.0,
556
  "in_benchmark": true,
557
  "NaN": 0.0,
558
- "classification_accuracy": 0.0,
559
- "language_modeling_chrf": 0.0,
560
- "translation_bleu": 0.0,
561
- "translation_chrf": 0.0
562
  },
563
  {
564
  "bcp_47": "fil",
@@ -566,13 +566,13 @@
566
  "autonym": "Filipino",
567
  "speakers": 67471096,
568
  "family": "Austronesian",
569
- "average": 0.0,
570
  "in_benchmark": true,
571
  "NaN": 0.0,
572
- "classification_accuracy": 0.0,
573
- "language_modeling_chrf": 0.0,
574
- "translation_bleu": 0.0,
575
- "translation_chrf": 0.0
576
  },
577
  {
578
  "bcp_47": "arz",
@@ -580,13 +580,13 @@
580
  "autonym": "Egyptian Arabic",
581
  "speakers": 66639360,
582
  "family": "Afro-Asiatic",
583
- "average": 0.0,
584
  "in_benchmark": true,
585
  "NaN": 0.0,
586
- "classification_accuracy": 0.0,
587
- "language_modeling_chrf": 0.0,
588
- "translation_bleu": 0.0,
589
- "translation_chrf": 0.0
590
  },
591
  {
592
  "bcp_47": "gu",
@@ -594,13 +594,13 @@
594
  "autonym": "ગુજરાતી",
595
  "speakers": 61721799,
596
  "family": "Indo-European",
597
- "average": 0.0,
598
  "in_benchmark": true,
599
  "NaN": 0.0,
600
- "classification_accuracy": 0.0,
601
- "language_modeling_chrf": 0.0,
602
- "translation_bleu": 0.0,
603
- "translation_chrf": 0.0
604
  },
605
  {
606
  "bcp_47": "th",
@@ -10164,7 +10164,7 @@
10164
  ]
10165
  },
10166
  "AE": {
10167
- "score": 0.39591834659201586,
10168
  "languages": [
10169
  {
10170
  "name": "English",
@@ -10182,7 +10182,7 @@
10182
  "name": "Persian",
10183
  "bcp_47": "fa",
10184
  "population": 189850,
10185
- "score": 0.0
10186
  },
10187
  {
10188
  "name": "Pashto",
@@ -10205,7 +10205,7 @@
10205
  ]
10206
  },
10207
  "AG": {
10208
- "score": 0.4698173362013836,
10209
  "languages": [
10210
  {
10211
  "name": "English",
@@ -10217,7 +10217,7 @@
10217
  "name": "Portuguese",
10218
  "bcp_47": "pt",
10219
  "population": 1571,
10220
- "score": 0.46
10221
  }
10222
  ]
10223
  },
@@ -10290,7 +10290,7 @@
10290
  ]
10291
  },
10292
  "AT": {
10293
- "score": 0.13725900574384256,
10294
  "languages": [
10295
  {
10296
  "name": "English",
@@ -10308,13 +10308,13 @@
10308
  "name": "German",
10309
  "bcp_47": "de",
10310
  "population": 8593666,
10311
- "score": 0.0
10312
  },
10313
  {
10314
  "name": "Italian",
10315
  "bcp_47": "it",
10316
  "population": 797350,
10317
- "score": 0.0
10318
  },
10319
  {
10320
  "name": "Bavarian",
@@ -10343,7 +10343,7 @@
10343
  ]
10344
  },
10345
  "AU": {
10346
- "score": 0.46077520536342514,
10347
  "languages": [
10348
  {
10349
  "name": "English",
@@ -10361,7 +10361,7 @@
10361
  "name": "Italian",
10362
  "bcp_47": "it",
10363
  "population": 483864,
10364
- "score": 0.0
10365
  },
10366
  {
10367
  "name": "Hmong Njua",
@@ -10506,7 +10506,7 @@
10506
  ]
10507
  },
10508
  "BE": {
10509
- "score": 0.23819809898359195,
10510
  "languages": [
10511
  {
10512
  "name": "English",
@@ -10524,7 +10524,7 @@
10524
  "name": "German",
10525
  "bcp_47": "de",
10526
  "population": 2578554,
10527
- "score": 0.0
10528
  },
10529
  {
10530
  "name": "Dutch",
@@ -10547,7 +10547,7 @@
10547
  ]
10548
  },
10549
  "BG": {
10550
- "score": 0.07035928143712575,
10551
  "languages": [
10552
  {
10553
  "name": "English",
@@ -10559,19 +10559,19 @@
10559
  "name": "Russian",
10560
  "bcp_47": "ru",
10561
  "population": 1602387,
10562
- "score": 0.0
10563
  },
10564
  {
10565
  "name": "German",
10566
  "bcp_47": "de",
10567
  "population": 557352,
10568
- "score": 0.0
10569
  },
10570
  {
10571
  "name": "Turkish",
10572
  "bcp_47": "tr",
10573
  "population": 766359,
10574
- "score": 0.0
10575
  },
10576
  {
10577
  "name": "Bulgarian",
@@ -10582,7 +10582,7 @@
10582
  ]
10583
  },
10584
  "BI": {
10585
- "score": 0.22246807623977216,
10586
  "languages": [
10587
  {
10588
  "name": "English",
@@ -10600,7 +10600,7 @@
10600
  "name": "Swahili",
10601
  "bcp_47": "sw",
10602
  "population": 6408,
10603
- "score": 0.0
10604
  },
10605
  {
10606
  "name": "Rundi",
@@ -10645,7 +10645,7 @@
10645
  ]
10646
  },
10647
  "BR": {
10648
- "score": 0.45330626204700775,
10649
  "languages": [
10650
  {
10651
  "name": "English",
@@ -10663,31 +10663,31 @@
10663
  "name": "Portuguese",
10664
  "bcp_47": "pt",
10665
  "population": 192661560,
10666
- "score": 0.46
10667
  },
10668
  {
10669
  "name": "German",
10670
  "bcp_47": "de",
10671
  "population": 1778414,
10672
- "score": 0.0
10673
  },
10674
  {
10675
  "name": "Japanese",
10676
  "bcp_47": "ja",
10677
  "population": 444604,
10678
- "score": 0.0
10679
  },
10680
  {
10681
  "name": "Korean",
10682
  "bcp_47": "ko",
10683
  "population": 44460,
10684
- "score": 0.0
10685
  },
10686
  {
10687
  "name": "Italian",
10688
  "bcp_47": "it",
10689
  "population": 592805,
10690
- "score": 0.0
10691
  },
10692
  {
10693
  "name": "Venetian",
@@ -10819,7 +10819,7 @@
10819
  ]
10820
  },
10821
  "CA": {
10822
- "score": 0.4280483033489603,
10823
  "languages": [
10824
  {
10825
  "name": "English",
@@ -10873,85 +10873,85 @@
10873
  "name": "Portuguese",
10874
  "bcp_47": "pt",
10875
  "population": 229934,
10876
- "score": 0.46
10877
  },
10878
  {
10879
  "name": "Punjabi",
10880
  "bcp_47": "pa",
10881
  "population": 603106,
10882
- "score": 0.42
10883
  },
10884
  {
10885
  "name": "Russian",
10886
  "bcp_47": "ru",
10887
  "population": 211087,
10888
- "score": 0.0
10889
  },
10890
  {
10891
  "name": "German",
10892
  "bcp_47": "de",
10893
  "population": 294014,
10894
- "score": 0.0
10895
  },
10896
  {
10897
  "name": "Japanese",
10898
  "bcp_47": "ja",
10899
  "population": 52772,
10900
- "score": 0.0
10901
  },
10902
  {
10903
  "name": "Vietnamese",
10904
  "bcp_47": "vi",
10905
  "population": 184701,
10906
- "score": 0.0
10907
  },
10908
  {
10909
  "name": "Tamil",
10910
  "bcp_47": "ta",
10911
  "population": 184701,
10912
- "score": 0.0
10913
  },
10914
  {
10915
  "name": "Persian",
10916
  "bcp_47": "fa",
10917
  "population": 245012,
10918
- "score": 0.0
10919
  },
10920
  {
10921
  "name": "Turkish",
10922
  "bcp_47": "tr",
10923
  "population": 37694,
10924
- "score": 0.0
10925
  },
10926
  {
10927
  "name": "Cantonese",
10928
  "bcp_47": "yue",
10929
  "population": 640800,
10930
- "score": 0.0
10931
  },
10932
  {
10933
  "name": "Korean",
10934
  "bcp_47": "ko",
10935
  "population": 169623,
10936
- "score": 0.0
10937
  },
10938
  {
10939
  "name": "Italian",
10940
  "bcp_47": "it",
10941
  "population": 343016,
10942
- "score": 0.0
10943
  },
10944
  {
10945
  "name": "Filipino",
10946
  "bcp_47": "fil",
10947
  "population": 565412,
10948
- "score": 0.0
10949
  },
10950
  {
10951
  "name": "Gujarati",
10952
  "bcp_47": "gu",
10953
  "population": 135699,
10954
- "score": 0.0
10955
  },
10956
  {
10957
  "name": "Polish",
@@ -11189,7 +11189,7 @@
11189
  ]
11190
  },
11191
  "CH": {
11192
- "score": 0.17143224232353874,
11193
  "languages": [
11194
  {
11195
  "name": "English",
@@ -11207,19 +11207,19 @@
11207
  "name": "Portuguese",
11208
  "bcp_47": "pt",
11209
  "population": 285736,
11210
- "score": 0.46
11211
  },
11212
  {
11213
  "name": "German",
11214
  "bcp_47": "de",
11215
  "population": 6134913,
11216
- "score": 0.0
11217
  },
11218
  {
11219
  "name": "Italian",
11220
  "bcp_47": "it",
11221
  "population": 361372,
11222
- "score": 0.0
11223
  },
11224
  {
11225
  "name": "Swiss German",
@@ -11455,7 +11455,7 @@
11455
  ]
11456
  },
11457
  "CN": {
11458
- "score": 0.36863417321148484,
11459
  "languages": [
11460
  {
11461
  "name": "English",
@@ -11473,13 +11473,13 @@
11473
  "name": "Russian",
11474
  "bcp_47": "ru",
11475
  "population": 13940,
11476
- "score": 0.0
11477
  },
11478
  {
11479
  "name": "Vietnamese",
11480
  "bcp_47": "vi",
11481
  "population": 6970,
11482
- "score": 0.0
11483
  },
11484
  {
11485
  "name": "Wu Chinese",
@@ -11491,13 +11491,13 @@
11491
  "name": "Cantonese",
11492
  "bcp_47": "yue",
11493
  "population": 72489040,
11494
- "score": 0.0
11495
  },
11496
  {
11497
  "name": "Korean",
11498
  "bcp_47": "ko",
11499
  "population": 2091030,
11500
- "score": 0.0
11501
  },
11502
  {
11503
  "name": "Xiang Chinese",
@@ -11649,7 +11649,7 @@
11649
  ]
11650
  },
11651
  "CY": {
11652
- "score": 0.18945142670615586,
11653
  "languages": [
11654
  {
11655
  "name": "English",
@@ -11673,7 +11673,7 @@
11673
  "name": "Turkish",
11674
  "bcp_47": "tr",
11675
  "population": 291336,
11676
- "score": 0.0
11677
  },
11678
  {
11679
  "name": "Greek",
@@ -11690,7 +11690,7 @@
11690
  ]
11691
  },
11692
  "CZ": {
11693
- "score": 0.08109144475315826,
11694
  "languages": [
11695
  {
11696
  "name": "English",
@@ -11702,7 +11702,7 @@
11702
  "name": "German",
11703
  "bcp_47": "de",
11704
  "population": 1605375,
11705
- "score": 0.0
11706
  },
11707
  {
11708
  "name": "Polish",
@@ -11725,7 +11725,7 @@
11725
  ]
11726
  },
11727
  "DE": {
11728
- "score": 0.16673407486802613,
11729
  "languages": [
11730
  {
11731
  "name": "English",
@@ -11749,25 +11749,25 @@
11749
  "name": "Russian",
11750
  "bcp_47": "ru",
11751
  "population": 4809582,
11752
- "score": 0.0
11753
  },
11754
  {
11755
  "name": "German",
11756
  "bcp_47": "de",
11757
  "population": 72945327,
11758
- "score": 0.0
11759
  },
11760
  {
11761
  "name": "Turkish",
11762
  "bcp_47": "tr",
11763
  "population": 2003992,
11764
- "score": 0.0
11765
  },
11766
  {
11767
  "name": "Italian",
11768
  "bcp_47": "it",
11769
  "population": 5611179,
11770
- "score": 0.0
11771
  },
11772
  {
11773
  "name": "Polish",
@@ -11891,7 +11891,7 @@
11891
  ]
11892
  },
11893
  "DK": {
11894
- "score": 0.1687682799969866,
11895
  "languages": [
11896
  {
11897
  "name": "English",
@@ -11903,7 +11903,7 @@
11903
  "name": "German",
11904
  "bcp_47": "de",
11905
  "population": 2758623,
11906
- "score": 0.0
11907
  },
11908
  {
11909
  "name": "Swedish",
@@ -12001,7 +12001,7 @@
12001
  ]
12002
  },
12003
  "EE": {
12004
- "score": 0.1153657311566433,
12005
  "languages": [
12006
  {
12007
  "name": "English",
@@ -12013,7 +12013,7 @@
12013
  "name": "Russian",
12014
  "bcp_47": "ru",
12015
  "population": 688027,
12016
- "score": 0.0
12017
  },
12018
  {
12019
  "name": "Finnish",
@@ -12042,7 +12042,7 @@
12042
  ]
12043
  },
12044
  "EG": {
12045
- "score": 0.28970118200899325,
12046
  "languages": [
12047
  {
12048
  "name": "English",
@@ -12060,7 +12060,7 @@
12060
  "name": "Egyptian Arabic",
12061
  "bcp_47": "arz",
12062
  "population": 66639360,
12063
- "score": 0.0
12064
  },
12065
  {
12066
  "name": "Greek",
@@ -12236,7 +12236,7 @@
12236
  ]
12237
  },
12238
  "FI": {
12239
- "score": 0.14489049029987158,
12240
  "languages": [
12241
  {
12242
  "name": "English",
@@ -12248,13 +12248,13 @@
12248
  "name": "Russian",
12249
  "bcp_47": "ru",
12250
  "population": 45131,
12251
- "score": 0.0
12252
  },
12253
  {
12254
  "name": "German",
12255
  "bcp_47": "de",
12256
  "population": 1002901,
12257
- "score": 0.0
12258
  },
12259
  {
12260
  "name": "Swedish",
@@ -12388,7 +12388,7 @@
12388
  ]
12389
  },
12390
  "FR": {
12391
- "score": 0.4241282220594123,
12392
  "languages": [
12393
  {
12394
  "name": "English",
@@ -12412,19 +12412,19 @@
12412
  "name": "Portuguese",
12413
  "bcp_47": "pt",
12414
  "population": 882027,
12415
- "score": 0.46
12416
  },
12417
  {
12418
  "name": "German",
12419
  "bcp_47": "de",
12420
  "population": 3392410,
12421
- "score": 0.0
12422
  },
12423
  {
12424
  "name": "Italian",
12425
  "bcp_47": "it",
12426
  "population": 1153419,
12427
- "score": 0.0
12428
  },
12429
  {
12430
  "name": "Dutch",
@@ -12495,7 +12495,7 @@
12495
  ]
12496
  },
12497
  "GB": {
12498
- "score": 0.3951929468077104,
12499
  "languages": [
12500
  {
12501
  "name": "English",
@@ -12543,43 +12543,43 @@
12543
  "name": "Portuguese",
12544
  "bcp_47": "pt",
12545
  "population": 131522,
12546
- "score": 0.46
12547
  },
12548
  {
12549
  "name": "Punjabi",
12550
  "bcp_47": "pa",
12551
  "population": 2367400,
12552
- "score": 0.42
12553
  },
12554
  {
12555
  "name": "German",
12556
  "bcp_47": "de",
12557
  "population": 5918499,
12558
- "score": 0.0
12559
  },
12560
  {
12561
  "name": "Tamil",
12562
  "bcp_47": "ta",
12563
  "population": 2104355,
12564
- "score": 0.0
12565
  },
12566
  {
12567
  "name": "Turkish",
12568
  "bcp_47": "tr",
12569
  "population": 131522,
12570
- "score": 0.0
12571
  },
12572
  {
12573
  "name": "Italian",
12574
  "bcp_47": "it",
12575
  "population": 131522,
12576
- "score": 0.0
12577
  },
12578
  {
12579
  "name": "Gujarati",
12580
  "bcp_47": "gu",
12581
  "population": 1907072,
12582
- "score": 0.0
12583
  },
12584
  {
12585
  "name": "Polish",
@@ -12765,7 +12765,7 @@
12765
  ]
12766
  },
12767
  "GR": {
12768
- "score": 0.16451496911429414,
12769
  "languages": [
12770
  {
12771
  "name": "English",
@@ -12783,13 +12783,13 @@
12783
  "name": "German",
12784
  "bcp_47": "de",
12785
  "population": 530355,
12786
- "score": 0.0
12787
  },
12788
  {
12789
  "name": "Turkish",
12790
  "bcp_47": "tr",
12791
  "population": 127285,
12792
- "score": 0.0
12793
  },
12794
  {
12795
  "name": "Greek",
@@ -12869,7 +12869,7 @@
12869
  ]
12870
  },
12871
  "HK": {
12872
- "score": 0.29033194917916566,
12873
  "languages": [
12874
  {
12875
  "name": "English",
@@ -12887,7 +12887,7 @@
12887
  "name": "Cantonese",
12888
  "bcp_47": "yue",
12889
  "population": 6524919,
12890
- "score": 0.0
12891
  }
12892
  ]
12893
  },
@@ -12920,7 +12920,7 @@
12920
  ]
12921
  },
12922
  "HR": {
12923
- "score": 0.15322692258543336,
12924
  "languages": [
12925
  {
12926
  "name": "English",
@@ -12932,7 +12932,7 @@
12932
  "name": "Italian",
12933
  "bcp_47": "it",
12934
  "population": 67644,
12935
- "score": 0.0
12936
  },
12937
  {
12938
  "name": "Croatian",
@@ -12949,7 +12949,7 @@
12949
  ]
12950
  },
12951
  "HU": {
12952
- "score": 0.07565921456157332,
12953
  "languages": [
12954
  {
12955
  "name": "English",
@@ -12967,7 +12967,7 @@
12967
  "name": "German",
12968
  "bcp_47": "de",
12969
  "population": 1758929,
12970
- "score": 0.0
12971
  },
12972
  {
12973
  "name": "Romanian",
@@ -13025,7 +13025,7 @@
13025
  ]
13026
  },
13027
  "IL": {
13028
- "score": 0.19791078395296563,
13029
  "languages": [
13030
  {
13031
  "name": "English",
@@ -13043,7 +13043,7 @@
13043
  "name": "Russian",
13044
  "bcp_47": "ru",
13045
  "population": 954303,
13046
- "score": 0.0
13047
  },
13048
  {
13049
  "name": "Malayalam",
@@ -13125,7 +13125,7 @@
13125
  ]
13126
  },
13127
  "IN": {
13128
- "score": 0.26031158182809067,
13129
  "languages": [
13130
  {
13131
  "name": "English",
@@ -13155,13 +13155,13 @@
13155
  "name": "Punjabi",
13156
  "bcp_47": "pa",
13157
  "population": 37130520,
13158
- "score": 0.42
13159
  },
13160
  {
13161
  "name": "Telugu",
13162
  "bcp_47": "te",
13163
  "population": 95478480,
13164
- "score": 0.0
13165
  },
13166
  {
13167
  "name": "Western Panjabi",
@@ -13173,19 +13173,19 @@
13173
  "name": "Marathi",
13174
  "bcp_47": "mr",
13175
  "population": 92826300,
13176
- "score": 0.0
13177
  },
13178
  {
13179
  "name": "Tamil",
13180
  "bcp_47": "ta",
13181
  "population": 78239310,
13182
- "score": 0.0
13183
  },
13184
  {
13185
  "name": "Gujarati",
13186
  "bcp_47": "gu",
13187
  "population": 59674050,
13188
- "score": 0.0
13189
  },
13190
  {
13191
  "name": "Kannada",
@@ -13603,7 +13603,7 @@
13603
  ]
13604
  },
13605
  "IQ": {
13606
- "score": 0.35502445223850776,
13607
  "languages": [
13608
  {
13609
  "name": "English",
@@ -13621,7 +13621,7 @@
13621
  "name": "Persian",
13622
  "bcp_47": "fa",
13623
  "population": 338192,
13624
- "score": 0.0
13625
  },
13626
  {
13627
  "name": "Azerbaijani",
@@ -13650,7 +13650,7 @@
13650
  ]
13651
  },
13652
  "IT": {
13653
- "score": 0.12688064203402252,
13654
  "languages": [
13655
  {
13656
  "name": "English",
@@ -13668,13 +13668,13 @@
13668
  "name": "German",
13669
  "bcp_47": "de",
13670
  "population": 998443,
13671
- "score": 0.0
13672
  },
13673
  {
13674
  "name": "Italian",
13675
  "bcp_47": "it",
13676
  "population": 59282565,
13677
- "score": 0.0
13678
  },
13679
  {
13680
  "name": "Greek",
@@ -13820,7 +13820,7 @@
13820
  ]
13821
  },
13822
  "KE": {
13823
- "score": 0.057955683710036364,
13824
  "languages": [
13825
  {
13826
  "name": "English",
@@ -13838,19 +13838,19 @@
13838
  "name": "Punjabi",
13839
  "bcp_47": "pa",
13840
  "population": 10170,
13841
- "score": 0.42
13842
  },
13843
  {
13844
  "name": "Swahili",
13845
  "bcp_47": "sw",
13846
  "population": 35328414,
13847
- "score": 0.0
13848
  },
13849
  {
13850
  "name": "Gujarati",
13851
  "bcp_47": "gu",
13852
  "population": 4978,
13853
- "score": 0.0
13854
  },
13855
  {
13856
  "name": "Oromo",
@@ -13984,7 +13984,7 @@
13984
  ]
13985
  },
13986
  "KZ": {
13987
- "score": 0.0442283557549302,
13988
  "languages": [
13989
  {
13990
  "name": "English",
@@ -13996,13 +13996,13 @@
13996
  "name": "Russian",
13997
  "bcp_47": "ru",
13998
  "population": 13746168,
13999
- "score": 0.0
14000
  },
14001
  {
14002
  "name": "German",
14003
  "bcp_47": "de",
14004
  "population": 1221882,
14005
- "score": 0.0
14006
  },
14007
  {
14008
  "name": "Kazakh",
@@ -14071,7 +14071,7 @@
14071
  ]
14072
  },
14073
  "LK": {
14074
- "score": 0.05053763440860214,
14075
  "languages": [
14076
  {
14077
  "name": "English",
@@ -14083,7 +14083,7 @@
14083
  "name": "Tamil",
14084
  "bcp_47": "ta",
14085
  "population": 3433380,
14086
- "score": 0.0
14087
  },
14088
  {
14089
  "name": "Sinhala",
@@ -14164,7 +14164,7 @@
14164
  ]
14165
  },
14166
  "LT": {
14167
- "score": 0.08192661853903119,
14168
  "languages": [
14169
  {
14170
  "name": "English",
@@ -14176,13 +14176,13 @@
14176
  "name": "Russian",
14177
  "bcp_47": "ru",
14178
  "population": 2185168,
14179
- "score": 0.0
14180
  },
14181
  {
14182
  "name": "German",
14183
  "bcp_47": "de",
14184
  "population": 382404,
14185
- "score": 0.0
14186
  },
14187
  {
14188
  "name": "Lithuanian",
@@ -14199,7 +14199,7 @@
14199
  ]
14200
  },
14201
  "LU": {
14202
- "score": 0.255017252012643,
14203
  "languages": [
14204
  {
14205
  "name": "English",
@@ -14217,13 +14217,13 @@
14217
  "name": "Portuguese",
14218
  "bcp_47": "pt",
14219
  "population": 100541,
14220
- "score": 0.46
14221
  },
14222
  {
14223
  "name": "German",
14224
  "bcp_47": "de",
14225
  "population": 395880,
14226
- "score": 0.0
14227
  },
14228
  {
14229
  "name": "Luxembourgish",
@@ -14234,7 +14234,7 @@
14234
  ]
14235
  },
14236
  "LV": {
14237
- "score": 0.14048091124242368,
14238
  "languages": [
14239
  {
14240
  "name": "English",
@@ -14246,7 +14246,7 @@
14246
  "name": "Russian",
14247
  "bcp_47": "ru",
14248
  "population": 714867,
14249
- "score": 0.0
14250
  },
14251
  {
14252
  "name": "Latvian",
@@ -14362,7 +14362,7 @@
14362
  ]
14363
  },
14364
  "MO": {
14365
- "score": 0.46020852883372587,
14366
  "languages": [
14367
  {
14368
  "name": "English",
@@ -14380,7 +14380,7 @@
14380
  "name": "Portuguese",
14381
  "bcp_47": "pt",
14382
  "population": 30723,
14383
- "score": 0.46
14384
  }
14385
  ]
14386
  },
@@ -14413,7 +14413,7 @@
14413
  ]
14414
  },
14415
  "MT": {
14416
- "score": 0.18203906242629914,
14417
  "languages": [
14418
  {
14419
  "name": "English",
@@ -14431,7 +14431,7 @@
14431
  "name": "Italian",
14432
  "bcp_47": "it",
14433
  "population": 256070,
14434
- "score": 0.0
14435
  },
14436
  {
14437
  "name": "Maltese",
@@ -14442,7 +14442,7 @@
14442
  ]
14443
  },
14444
  "MU": {
14445
- "score": 0.18730089040118697,
14446
  "languages": [
14447
  {
14448
  "name": "English",
@@ -14466,7 +14466,7 @@
14466
  "name": "Tamil",
14467
  "bcp_47": "ta",
14468
  "population": 34484,
14469
- "score": 0.0
14470
  },
14471
  {
14472
  "name": "Bhojpuri",
@@ -14594,7 +14594,7 @@
14594
  ]
14595
  },
14596
  "MY": {
14597
- "score": 0.1439334800637596,
14598
  "languages": [
14599
  {
14600
  "name": "English",
@@ -14612,13 +14612,13 @@
14612
  "name": "Javanese",
14613
  "bcp_47": "jv",
14614
  "population": 391825,
14615
- "score": 0.0
14616
  },
14617
  {
14618
  "name": "Tamil",
14619
  "bcp_47": "ta",
14620
  "population": 1371388,
14621
- "score": 0.0
14622
  },
14623
  {
14624
  "name": "Malayalam",
@@ -14665,7 +14665,7 @@
14665
  ]
14666
  },
14667
  "NA": {
14668
- "score": 0.020619217407487452,
14669
  "languages": [
14670
  {
14671
  "name": "English",
@@ -14677,7 +14677,7 @@
14677
  "name": "German",
14678
  "bcp_47": "de",
14679
  "population": 23671,
14680
- "score": 0.0
14681
  },
14682
  {
14683
  "name": "Afrikaans",
@@ -14836,7 +14836,7 @@
14836
  ]
14837
  },
14838
  "NL": {
14839
- "score": 0.17387499999999997,
14840
  "languages": [
14841
  {
14842
  "name": "English",
@@ -14854,19 +14854,19 @@
14854
  "name": "Indonesian",
14855
  "bcp_47": "id",
14856
  "population": 311047,
14857
- "score": 0.0
14858
  },
14859
  {
14860
  "name": "German",
14861
  "bcp_47": "de",
14862
  "population": 12269084,
14863
- "score": 0.0
14864
  },
14865
  {
14866
  "name": "Turkish",
14867
  "bcp_47": "tr",
14868
  "population": 207365,
14869
- "score": 0.0
14870
  },
14871
  {
14872
  "name": "Dutch",
@@ -15183,7 +15183,7 @@
15183
  ]
15184
  },
15185
  "PH": {
15186
- "score": 0.2080044997553085,
15187
  "languages": [
15188
  {
15189
  "name": "English",
@@ -15207,7 +15207,7 @@
15207
  "name": "Filipino",
15208
  "bcp_47": "fil",
15209
  "population": 65508600,
15210
- "score": 0.0
15211
  },
15212
  {
15213
  "name": "Cebuano",
@@ -15308,7 +15308,7 @@
15308
  ]
15309
  },
15310
  "PK": {
15311
- "score": 0.30251563862393366,
15312
  "languages": [
15313
  {
15314
  "name": "English",
@@ -15326,7 +15326,7 @@
15326
  "name": "Punjabi",
15327
  "bcp_47": "pa",
15328
  "population": 163450700,
15329
- "score": 0.42
15330
  },
15331
  {
15332
  "name": "Western Panjabi",
@@ -15338,7 +15338,7 @@
15338
  "name": "Persian",
15339
  "bcp_47": "fa",
15340
  "population": 1541107,
15341
- "score": 0.0
15342
  },
15343
  {
15344
  "name": "Pashto",
@@ -15457,7 +15457,7 @@
15457
  ]
15458
  },
15459
  "PL": {
15460
- "score": 0.09207365219510223,
15461
  "languages": [
15462
  {
15463
  "name": "English",
@@ -15469,13 +15469,13 @@
15469
  "name": "Russian",
15470
  "bcp_47": "ru",
15471
  "population": 6890814,
15472
- "score": 0.0
15473
  },
15474
  {
15475
  "name": "German",
15476
  "bcp_47": "de",
15477
  "population": 7273637,
15478
- "score": 0.0
15479
  },
15480
  {
15481
  "name": "Polish",
@@ -15573,7 +15573,7 @@
15573
  ]
15574
  },
15575
  "PT": {
15576
- "score": 0.4607128325652157,
15577
  "languages": [
15578
  {
15579
  "name": "English",
@@ -15597,7 +15597,7 @@
15597
  "name": "Portuguese",
15598
  "bcp_47": "pt",
15599
  "population": 9890592,
15600
- "score": 0.46
15601
  },
15602
  {
15603
  "name": "Galician",
@@ -15625,7 +15625,7 @@
15625
  ]
15626
  },
15627
  "RO": {
15628
- "score": 0.17334519793826225,
15629
  "languages": [
15630
  {
15631
  "name": "English",
@@ -15649,13 +15649,13 @@
15649
  "name": "German",
15650
  "bcp_47": "de",
15651
  "population": 44736,
15652
- "score": 0.0
15653
  },
15654
  {
15655
  "name": "Turkish",
15656
  "bcp_47": "tr",
15657
  "population": 27694,
15658
- "score": 0.0
15659
  },
15660
  {
15661
  "name": "Polish",
@@ -15883,7 +15883,7 @@
15883
  ]
15884
  },
15885
  "SG": {
15886
- "score": 0.42483238543445395,
15887
  "languages": [
15888
  {
15889
  "name": "English",
@@ -15901,13 +15901,13 @@
15901
  "name": "Punjabi",
15902
  "bcp_47": "pa",
15903
  "population": 9314,
15904
- "score": 0.42
15905
  },
15906
  {
15907
  "name": "Tamil",
15908
  "bcp_47": "ta",
15909
  "population": 130403,
15910
- "score": 0.0
15911
  },
15912
  {
15913
  "name": "Malayalam",
@@ -15935,7 +15935,7 @@
15935
  ]
15936
  },
15937
  "SI": {
15938
- "score": 0.11046483765124727,
15939
  "languages": [
15940
  {
15941
  "name": "English",
@@ -15947,13 +15947,13 @@
15947
  "name": "German",
15948
  "bcp_47": "de",
15949
  "population": 883126,
15950
- "score": 0.0
15951
  },
15952
  {
15953
  "name": "Italian",
15954
  "bcp_47": "it",
15955
  "population": 3995,
15956
- "score": 0.0
15957
  },
15958
  {
15959
  "name": "Hungarian",
@@ -15982,7 +15982,7 @@
15982
  ]
15983
  },
15984
  "SK": {
15985
- "score": 0.06145953818542007,
15986
  "languages": [
15987
  {
15988
  "name": "English",
@@ -15994,7 +15994,7 @@
15994
  "name": "German",
15995
  "bcp_47": "de",
15996
  "population": 1196932,
15997
- "score": 0.0
15998
  },
15999
  {
16000
  "name": "Polish",
@@ -16290,7 +16290,7 @@
16290
  ]
16291
  },
16292
  "TR": {
16293
- "score": 0.06502802610982708,
16294
  "languages": [
16295
  {
16296
  "name": "English",
@@ -16308,7 +16308,7 @@
16308
  "name": "Turkish",
16309
  "bcp_47": "tr",
16310
  "population": 76276275,
16311
- "score": 0.0
16312
  },
16313
  {
16314
  "name": "North Levantine Arabic",
@@ -16467,7 +16467,7 @@
16467
  ]
16468
  },
16469
  "TZ": {
16470
- "score": 0.17576282848459832,
16471
  "languages": [
16472
  {
16473
  "name": "English",
@@ -16479,7 +16479,7 @@
16479
  "name": "Swahili",
16480
  "bcp_47": "sw",
16481
  "population": 52697520,
16482
- "score": 0.0
16483
  },
16484
  {
16485
  "name": "Sukuma",
@@ -16568,7 +16568,7 @@
16568
  ]
16569
  },
16570
  "UG": {
16571
- "score": 0.014428243049412084,
16572
  "languages": [
16573
  {
16574
  "name": "English",
@@ -16586,7 +16586,7 @@
16586
  "name": "Swahili",
16587
  "bcp_47": "sw",
16588
  "population": 32439750,
16589
- "score": 0.0
16590
  },
16591
  {
16592
  "name": "Kinyarwanda",
@@ -16662,7 +16662,7 @@
16662
  ]
16663
  },
16664
  "US": {
16665
- "score": 0.45809839699094473,
16666
  "languages": [
16667
  {
16668
  "name": "English",
@@ -16692,37 +16692,37 @@
16692
  "name": "Russian",
16693
  "bcp_47": "ru",
16694
  "population": 798334,
16695
- "score": 0.0
16696
  },
16697
  {
16698
  "name": "German",
16699
  "bcp_47": "de",
16700
  "population": 1563403,
16701
- "score": 0.0
16702
  },
16703
  {
16704
  "name": "Vietnamese",
16705
  "bcp_47": "vi",
16706
  "population": 1130973,
16707
- "score": 0.0
16708
  },
16709
  {
16710
  "name": "Korean",
16711
  "bcp_47": "ko",
16712
  "population": 997917,
16713
- "score": 0.0
16714
  },
16715
  {
16716
  "name": "Italian",
16717
  "bcp_47": "it",
16718
  "population": 1130973,
16719
- "score": 0.0
16720
  },
16721
  {
16722
  "name": "Filipino",
16723
  "bcp_47": "fil",
16724
  "population": 1397084,
16725
- "score": 0.0
16726
  },
16727
  {
16728
  "name": "Yiddish",
@@ -16925,7 +16925,7 @@
16925
  ]
16926
  },
16927
  "ZA": {
16928
- "score": 0.12441587427910845,
16929
  "languages": [
16930
  {
16931
  "name": "English",
@@ -16943,7 +16943,7 @@
16943
  "name": "Swahili",
16944
  "bcp_47": "sw",
16945
  "population": 1016,
16946
- "score": 0.0
16947
  },
16948
  {
16949
  "name": "Zulu",
@@ -17125,7 +17125,7 @@
17125
  ]
17126
  },
17127
  "ID": {
17128
- "score": 0.0030419341755196384,
17129
  "languages": [
17130
  {
17131
  "name": "Chinese",
@@ -17137,13 +17137,13 @@
17137
  "name": "Indonesian",
17138
  "bcp_47": "id",
17139
  "population": 170896640,
17140
- "score": 0.0
17141
  },
17142
  {
17143
  "name": "Javanese",
17144
  "bcp_47": "jv",
17145
  "population": 90788840,
17146
- "score": 0.0
17147
  },
17148
  {
17149
  "name": "Malay",
@@ -17304,7 +17304,7 @@
17304
  ]
17305
  },
17306
  "MN": {
17307
- "score": 0.00632843339485398,
17308
  "languages": [
17309
  {
17310
  "name": "Chinese",
@@ -17316,7 +17316,7 @@
17316
  "name": "Russian",
17317
  "bcp_47": "ru",
17318
  "population": 4118,
17319
- "score": 0.0
17320
  },
17321
  {
17322
  "name": "Kazakh",
@@ -17408,7 +17408,7 @@
17408
  ]
17409
  },
17410
  "VN": {
17411
- "score": 0.005746798518511479,
17412
  "languages": [
17413
  {
17414
  "name": "Chinese",
@@ -17420,7 +17420,7 @@
17420
  "name": "Vietnamese",
17421
  "bcp_47": "vi",
17422
  "population": 84900318,
17423
- "score": 0.0
17424
  },
17425
  {
17426
  "name": "Hmong Njua",
@@ -17603,7 +17603,7 @@
17603
  ]
17604
  },
17605
  "GQ": {
17606
- "score": 0.2792374044214109,
17607
  "languages": [
17608
  {
17609
  "name": "Spanish",
@@ -17621,7 +17621,7 @@
17621
  "name": "Portuguese",
17622
  "bcp_47": "pt",
17623
  "population": 1,
17624
- "score": 0.46
17625
  },
17626
  {
17627
  "name": "Fang",
@@ -17700,7 +17700,7 @@
17700
  ]
17701
  },
17702
  "PY": {
17703
- "score": 0.016724733105137318,
17704
  "languages": [
17705
  {
17706
  "name": "Spanish",
@@ -17712,7 +17712,7 @@
17712
  "name": "German",
17713
  "bcp_47": "de",
17714
  "population": 208559,
17715
- "score": 0.0
17716
  },
17717
  {
17718
  "name": "Guarani",
@@ -17819,7 +17819,7 @@
17819
  ]
17820
  },
17821
  "IR": {
17822
- "score": 0.00636827269940037,
17823
  "languages": [
17824
  {
17825
  "name": "Arabic",
@@ -17831,7 +17831,7 @@
17831
  "name": "Persian",
17832
  "bcp_47": "fa",
17833
  "population": 63692475,
17834
- "score": 0.0
17835
  },
17836
  {
17837
  "name": "Pashto",
@@ -18166,7 +18166,7 @@
18166
  ]
18167
  },
18168
  "OM": {
18169
- "score": 0.3917550122860191,
18170
  "languages": [
18171
  {
18172
  "name": "Arabic",
@@ -18178,7 +18178,7 @@
18178
  "name": "Persian",
18179
  "bcp_47": "fa",
18180
  "population": 43849,
18181
- "score": 0.0
18182
  },
18183
  {
18184
  "name": "Baluchi",
@@ -18206,7 +18206,7 @@
18206
  ]
18207
  },
18208
  "QA": {
18209
- "score": 0.37279344564910033,
18210
  "languages": [
18211
  {
18212
  "name": "Arabic",
@@ -18218,7 +18218,7 @@
18218
  "name": "Persian",
18219
  "bcp_47": "fa",
18220
  "population": 268859,
18221
- "score": 0.0
18222
  },
18223
  {
18224
  "name": "Malayalam",
@@ -18246,7 +18246,7 @@
18246
  ]
18247
  },
18248
  "SO": {
18249
- "score": 0.12480335438670982,
18250
  "languages": [
18251
  {
18252
  "name": "Arabic",
@@ -18258,7 +18258,7 @@
18258
  "name": "Swahili",
18259
  "bcp_47": "sw",
18260
  "population": 235142,
18261
- "score": 0.0
18262
  },
18263
  {
18264
  "name": "Oromo",
@@ -18333,7 +18333,7 @@
18333
  ]
18334
  },
18335
  "TJ": {
18336
- "score": 4.095636386779862e-05,
18337
  "languages": [
18338
  {
18339
  "name": "Arabic",
@@ -18345,13 +18345,13 @@
18345
  "name": "Russian",
18346
  "bcp_47": "ru",
18347
  "population": 1064840,
18348
- "score": 0.0
18349
  },
18350
  {
18351
  "name": "Persian",
18352
  "bcp_47": "fa",
18353
  "population": 69215,
18354
- "score": 0.0
18355
  },
18356
  {
18357
  "name": "Tajik",
@@ -18454,7 +18454,7 @@
18454
  ]
18455
  },
18456
  "CD": {
18457
- "score": 0.024519567961845984,
18458
  "languages": [
18459
  {
18460
  "name": "French",
@@ -18466,7 +18466,7 @@
18466
  "name": "Swahili",
18467
  "bcp_47": "sw",
18468
  "population": 50890000,
18469
- "score": 0.0
18470
  },
18471
  {
18472
  "name": "Kinyarwanda",
@@ -18718,7 +18718,7 @@
18718
  ]
18719
  },
18720
  "RE": {
18721
- "score": 0.23394276750687273,
18722
  "languages": [
18723
  {
18724
  "name": "French",
@@ -18730,7 +18730,7 @@
18730
  "name": "Tamil",
18731
  "bcp_47": "ta",
18732
  "population": 118138,
18733
- "score": 0.0
18734
  },
18735
  {
18736
  "name": "Réunion Creole French",
@@ -18887,7 +18887,7 @@
18887
  ]
18888
  },
18889
  "YT": {
18890
- "score": 0.15478158205430934,
18891
  "languages": [
18892
  {
18893
  "name": "French",
@@ -18899,7 +18899,7 @@
18899
  "name": "Swahili",
18900
  "bcp_47": "sw",
18901
  "population": 2716,
18902
- "score": 0.0
18903
  },
18904
  {
18905
  "name": "Comorian",
@@ -18916,13 +18916,13 @@
18916
  ]
18917
  },
18918
  "AO": {
18919
- "score": 0.2533081311690543,
18920
  "languages": [
18921
  {
18922
  "name": "Portuguese",
18923
  "bcp_47": "pt",
18924
  "population": 21789941,
18925
- "score": 0.46
18926
  },
18927
  {
18928
  "name": "Umbundu",
@@ -18945,13 +18945,13 @@
18945
  ]
18946
  },
18947
  "CV": {
18948
- "score": 0.20934137957939955,
18949
  "languages": [
18950
  {
18951
  "name": "Portuguese",
18952
  "bcp_47": "pt",
18953
  "population": 443274,
18954
- "score": 0.46
18955
  },
18956
  {
18957
  "name": "Kabuverdianu",
@@ -18962,13 +18962,13 @@
18962
  ]
18963
  },
18964
  "GW": {
18965
- "score": 0.4483420821976837,
18966
  "languages": [
18967
  {
18968
  "name": "Portuguese",
18969
  "bcp_47": "pt",
18970
  "population": 1927100,
18971
- "score": 0.46
18972
  },
18973
  {
18974
  "name": "Fula",
@@ -18985,19 +18985,19 @@
18985
  ]
18986
  },
18987
  "MZ": {
18988
- "score": 0.1512107791359021,
18989
  "languages": [
18990
  {
18991
  "name": "Portuguese",
18992
  "bcp_47": "pt",
18993
  "population": 8126514,
18994
- "score": 0.46
18995
  },
18996
  {
18997
  "name": "Swahili",
18998
  "bcp_47": "sw",
18999
  "population": 9330,
19000
- "score": 0.0
19001
  },
19002
  {
19003
  "name": "Nyanja",
@@ -19062,24 +19062,24 @@
19062
  ]
19063
  },
19064
  "ST": {
19065
- "score": 0.45999999999999996,
19066
  "languages": [
19067
  {
19068
  "name": "Portuguese",
19069
  "bcp_47": "pt",
19070
  "population": 179454,
19071
- "score": 0.46
19072
  }
19073
  ]
19074
  },
19075
  "TL": {
19076
- "score": 0.23,
19077
  "languages": [
19078
  {
19079
  "name": "Portuguese",
19080
  "bcp_47": "pt",
19081
  "population": 816395,
19082
- "score": 0.46
19083
  },
19084
  {
19085
  "name": "Tetum",
@@ -19090,13 +19090,13 @@
19090
  ]
19091
  },
19092
  "BY": {
19093
- "score": 0.0,
19094
  "languages": [
19095
  {
19096
  "name": "Russian",
19097
  "bcp_47": "ru",
19098
  "population": 1137350,
19099
- "score": 0.0
19100
  },
19101
  {
19102
  "name": "Belarusian",
@@ -19107,13 +19107,13 @@
19107
  ]
19108
  },
19109
  "GE": {
19110
- "score": 0.0,
19111
  "languages": [
19112
  {
19113
  "name": "Russian",
19114
  "bcp_47": "ru",
19115
  "population": 359730,
19116
- "score": 0.0
19117
  },
19118
  {
19119
  "name": "Kurdish",
@@ -19154,13 +19154,13 @@
19154
  ]
19155
  },
19156
  "KG": {
19157
- "score": 0.0,
19158
  "languages": [
19159
  {
19160
  "name": "Russian",
19161
  "bcp_47": "ru",
19162
  "population": 2147364,
19163
- "score": 0.0
19164
  },
19165
  {
19166
  "name": "Kyrgyz",
@@ -19171,13 +19171,13 @@
19171
  ]
19172
  },
19173
  "MD": {
19174
- "score": 0.0,
19175
  "languages": [
19176
  {
19177
  "name": "Russian",
19178
  "bcp_47": "ru",
19179
  "population": 100935,
19180
- "score": 0.0
19181
  },
19182
  {
19183
  "name": "Ukrainian",
@@ -19206,13 +19206,13 @@
19206
  ]
19207
  },
19208
  "RU": {
19209
- "score": 0.0,
19210
  "languages": [
19211
  {
19212
  "name": "Russian",
19213
  "bcp_47": "ru",
19214
  "population": 133218680,
19215
- "score": 0.0
19216
  },
19217
  {
19218
  "name": "Azerbaijani",
@@ -19427,13 +19427,13 @@
19427
  ]
19428
  },
19429
  "SJ": {
19430
- "score": 0.0,
19431
  "languages": [
19432
  {
19433
  "name": "Russian",
19434
  "bcp_47": "ru",
19435
  "population": 1200,
19436
- "score": 0.0
19437
  },
19438
  {
19439
  "name": "Norwegian Bokmål",
@@ -19444,13 +19444,13 @@
19444
  ]
19445
  },
19446
  "TM": {
19447
- "score": 0.0,
19448
  "languages": [
19449
  {
19450
  "name": "Russian",
19451
  "bcp_47": "ru",
19452
  "population": 663436,
19453
- "score": 0.0
19454
  },
19455
  {
19456
  "name": "Uzbek",
@@ -19473,19 +19473,19 @@
19473
  ]
19474
  },
19475
  "UA": {
19476
- "score": 0.0,
19477
  "languages": [
19478
  {
19479
  "name": "Russian",
19480
  "bcp_47": "ru",
19481
  "population": 20204534,
19482
- "score": 0.0
19483
  },
19484
  {
19485
  "name": "Turkish",
19486
  "bcp_47": "tr",
19487
  "population": 184476,
19488
- "score": 0.0
19489
  },
19490
  {
19491
  "name": "Polish",
@@ -19550,19 +19550,19 @@
19550
  ]
19551
  },
19552
  "UZ": {
19553
- "score": 0.0,
19554
  "languages": [
19555
  {
19556
  "name": "Russian",
19557
  "bcp_47": "ru",
19558
  "population": 4279156,
19559
- "score": 0.0
19560
  },
19561
  {
19562
  "name": "Turkish",
19563
  "bcp_47": "tr",
19564
  "population": 232297,
19565
- "score": 0.0
19566
  },
19567
  {
19568
  "name": "Uzbek",
@@ -19579,13 +19579,13 @@
19579
  ]
19580
  },
19581
  "LI": {
19582
- "score": 0.0,
19583
  "languages": [
19584
  {
19585
  "name": "German",
19586
  "bcp_47": "de",
19587
  "population": 39137,
19588
- "score": 0.0
19589
  },
19590
  {
19591
  "name": "Swiss German",
@@ -19602,19 +19602,19 @@
19602
  ]
19603
  },
19604
  "JP": {
19605
- "score": 0.0,
19606
  "languages": [
19607
  {
19608
  "name": "Japanese",
19609
  "bcp_47": "ja",
19610
  "population": 119231650,
19611
- "score": 0.0
19612
  },
19613
  {
19614
  "name": "Korean",
19615
  "bcp_47": "ko",
19616
  "population": 652636,
19617
- "score": 0.0
19618
  },
19619
  {
19620
  "name": "Central Okinawan",
@@ -19625,13 +19625,13 @@
19625
  ]
19626
  },
19627
  "AF": {
19628
- "score": 0.0,
19629
  "languages": [
19630
  {
19631
  "name": "Persian",
19632
  "bcp_47": "fa",
19633
  "population": 18321900,
19634
- "score": 0.0
19635
  },
19636
  {
19637
  "name": "Pashto",
@@ -19684,13 +19684,13 @@
19684
  ]
19685
  },
19686
  "MK": {
19687
- "score": 0.0,
19688
  "languages": [
19689
  {
19690
  "name": "Turkish",
19691
  "bcp_47": "tr",
19692
  "population": 74409,
19693
- "score": 0.0
19694
  },
19695
  {
19696
  "name": "Albanian",
@@ -19707,35 +19707,35 @@
19707
  ]
19708
  },
19709
  "KP": {
19710
- "score": 0.0,
19711
  "languages": [
19712
  {
19713
  "name": "Korean",
19714
  "bcp_47": "ko",
19715
  "population": 22566280,
19716
- "score": 0.0
19717
  }
19718
  ]
19719
  },
19720
  "KR": {
19721
- "score": 0.0,
19722
  "languages": [
19723
  {
19724
  "name": "Korean",
19725
  "bcp_47": "ko",
19726
  "population": 51835100,
19727
- "score": 0.0
19728
  }
19729
  ]
19730
  },
19731
  "SM": {
19732
- "score": 0.0,
19733
  "languages": [
19734
  {
19735
  "name": "Italian",
19736
  "bcp_47": "it",
19737
  "population": 30466,
19738
- "score": 0.0
19739
  },
19740
  {
19741
  "name": "Esperanto",
@@ -19746,13 +19746,13 @@
19746
  ]
19747
  },
19748
  "VA": {
19749
- "score": 0.0,
19750
  "languages": [
19751
  {
19752
  "name": "Italian",
19753
  "bcp_47": "it",
19754
  "population": 820,
19755
- "score": 0.0
19756
  },
19757
  {
19758
  "name": "Latin",
 
26
  "license": null,
27
  "average": 0.66,
28
  "classification_accuracy": 0.73,
29
+ "language_modeling_chrf": 0.96,
30
  "translation_bleu": 0.4,
31
  "translation_chrf": 0.54
32
  },
 
39
  "size": 27432406640.0,
40
  "type": "Open",
41
  "license": "Gemma",
42
+ "average": 0.64,
43
  "classification_accuracy": 0.72,
44
+ "language_modeling_chrf": 0.94,
45
  "translation_bleu": 0.37,
46
  "translation_chrf": 0.54
47
  },
 
54
  "size": 70553706496.0,
55
  "type": "Open",
56
  "license": "Llama3.1",
57
+ "average": 0.63,
58
  "classification_accuracy": 0.57,
59
+ "language_modeling_chrf": 0.95,
60
  "translation_bleu": 0.43,
61
  "translation_chrf": 0.57
62
  },
63
  {
64
  "rank": 5,
65
+ "provider": "Meta Llama",
66
+ "model": "Llama 3 70b Instruct",
67
  "hf_id": null,
68
  "creation_date": null,
69
  "size": null,
70
  "type": "Commercial",
71
  "license": null,
72
  "average": 0.61,
73
+ "classification_accuracy": 0.8,
74
+ "language_modeling_chrf": 0.96,
75
+ "translation_bleu": 0.25,
76
+ "translation_chrf": 0.43
77
  },
78
  {
79
  "rank": 6,
80
+ "provider": "Amazon",
81
+ "model": "Nova Micro V1",
82
  "hf_id": null,
83
  "creation_date": null,
84
  "size": null,
85
  "type": "Commercial",
86
  "license": null,
87
+ "average": 0.6,
88
+ "classification_accuracy": 0.52,
89
+ "language_modeling_chrf": 0.94,
90
+ "translation_bleu": 0.4,
91
+ "translation_chrf": 0.56
92
  },
93
  {
94
  "rank": 7,
 
101
  "license": null,
102
  "average": 0.6,
103
  "classification_accuracy": 0.52,
104
+ "language_modeling_chrf": 0.96,
105
  "translation_bleu": 0.39,
106
  "translation_chrf": 0.55
107
  },
 
116
  "license": "Apache 2.0",
117
  "average": 0.58,
118
  "classification_accuracy": 0.55,
119
+ "language_modeling_chrf": 0.88,
120
  "translation_bleu": 0.38,
121
  "translation_chrf": 0.52
122
  },
 
129
  "size": 70553706496.0,
130
  "type": "Open",
131
  "license": "Llama3.3",
132
+ "average": 0.55,
133
+ "classification_accuracy": 0.51,
134
  "language_modeling_chrf": 0.94,
135
+ "translation_bleu": 0.28,
136
+ "translation_chrf": 0.46
137
  },
138
  {
139
  "rank": 10,
 
144
  "size": null,
145
  "type": "Commercial",
146
  "license": null,
147
+ "average": 0.54,
148
  "classification_accuracy": 0.5,
149
+ "language_modeling_chrf": 0.86,
150
  "translation_bleu": 0.32,
151
  "translation_chrf": 0.49
152
  },
 
161
  "license": "Mit",
162
  "average": 0.52,
163
  "classification_accuracy": 0.42,
164
+ "language_modeling_chrf": 0.88,
165
  "translation_bleu": 0.32,
166
  "translation_chrf": 0.46
167
  },
 
176
  "license": "Apache 2.0",
177
  "average": 0.25,
178
  "classification_accuracy": 0.0,
179
+ "language_modeling_chrf": 0.47,
180
  "translation_bleu": 0.21,
181
  "translation_chrf": 0.3
182
  }
 
220
  "in_benchmark": true,
221
  "NaN": 0.0,
222
  "classification_accuracy": 0.53,
223
+ "language_modeling_chrf": 0.94,
224
  "translation_bleu": 0.32,
225
  "translation_chrf": 0.49
226
  },
 
248
  "in_benchmark": true,
249
  "NaN": 0.0,
250
  "classification_accuracy": 0.43,
251
+ "language_modeling_chrf": 0.94,
252
  "translation_bleu": 0.28,
253
  "translation_chrf": 0.47
254
  },
 
262
  "in_benchmark": true,
263
  "NaN": 0.0,
264
  "classification_accuracy": 0.5,
265
+ "language_modeling_chrf": 0.92,
266
  "translation_bleu": 0.24,
267
  "translation_chrf": 0.42
268
  },
 
290
  "in_benchmark": true,
291
  "NaN": 0.0,
292
  "classification_accuracy": 0.4,
293
+ "language_modeling_chrf": 0.91,
294
  "translation_bleu": 0.2,
295
  "translation_chrf": 0.41
296
  },
 
300
  "autonym": "Português",
301
  "speakers": 237496885,
302
  "family": "Indo-European",
303
+ "average": 0.45,
304
  "in_benchmark": true,
305
  "NaN": 0.0,
306
  "classification_accuracy": 0.5,
307
+ "language_modeling_chrf": 0.96,
308
  "translation_bleu": 0.31,
309
  "translation_chrf": 0.49
310
  },
 
314
  "autonym": "ਪੰਜਾਬੀ",
315
  "speakers": 203571210,
316
  "family": "Indo-European",
317
+ "average": 0.43,
318
  "in_benchmark": true,
319
  "NaN": 0.0,
320
  "classification_accuracy": 0.4,
321
+ "language_modeling_chrf": 0.9,
322
  "translation_bleu": 0.34,
323
  "translation_chrf": 0.49
324
  },
 
328
  "autonym": "Русский",
329
  "speakers": 195841151,
330
  "family": "Indo-European",
331
+ "average": 0.45,
332
  "in_benchmark": true,
333
  "NaN": 0.0,
334
+ "classification_accuracy": 0.57,
335
+ "language_modeling_chrf": 0.97,
336
+ "translation_bleu": 0.26,
337
+ "translation_chrf": 0.45
338
  },
339
  {
340
  "bcp_47": "sw",
 
342
  "autonym": "Kiswahili",
343
  "speakers": 171610296,
344
  "family": "Atlantic-Congo",
345
+ "average": 0.45,
346
  "in_benchmark": true,
347
  "NaN": 0.0,
348
+ "classification_accuracy": 0.57,
349
+ "language_modeling_chrf": 0.94,
350
+ "translation_bleu": 0.3,
351
+ "translation_chrf": 0.47
352
  },
353
  {
354
  "bcp_47": "id",
 
356
  "autonym": "Bahasa Indonesia",
357
  "speakers": 171207687,
358
  "family": "Austronesian",
359
+ "average": 0.47,
360
  "in_benchmark": true,
361
  "NaN": 0.0,
362
+ "classification_accuracy": 0.63,
363
+ "language_modeling_chrf": 0.96,
364
+ "translation_bleu": 0.29,
365
+ "translation_chrf": 0.47
366
  },
367
  {
368
  "bcp_47": "de",
 
370
  "autonym": "Deutsch",
371
  "speakers": 136350226,
372
  "family": "Indo-European",
373
+ "average": 0.49,
374
  "in_benchmark": true,
375
  "NaN": 0.0,
376
+ "classification_accuracy": 0.67,
377
+ "language_modeling_chrf": 0.96,
378
+ "translation_bleu": 0.32,
379
+ "translation_chrf": 0.5
380
  },
381
  {
382
  "bcp_47": "ja",
 
384
  "autonym": "日本語",
385
  "speakers": 119729026,
386
  "family": "Japonic",
387
+ "average": 0.46,
388
  "in_benchmark": true,
389
  "NaN": 0.0,
390
+ "classification_accuracy": 0.63,
391
+ "language_modeling_chrf": 0.94,
392
+ "translation_bleu": 0.27,
393
+ "translation_chrf": 0.44
394
  },
395
  {
396
  "bcp_47": "te",
 
398
  "autonym": "తెలుగు",
399
  "speakers": 95478480,
400
  "family": "Dravidian",
401
+ "average": 0.41,
402
  "in_benchmark": true,
403
  "NaN": 0.0,
404
+ "classification_accuracy": 0.37,
405
+ "language_modeling_chrf": 0.95,
406
+ "translation_bleu": 0.28,
407
+ "translation_chrf": 0.47
408
  },
409
  {
410
  "bcp_47": "lah",
 
426
  "autonym": "मराठी",
427
  "speakers": 92826300,
428
  "family": "Indo-European",
429
+ "average": 0.45,
430
  "in_benchmark": true,
431
  "NaN": 0.0,
432
+ "classification_accuracy": 0.63,
433
+ "language_modeling_chrf": 0.94,
434
+ "translation_bleu": 0.25,
435
+ "translation_chrf": 0.42
436
  },
437
  {
438
  "bcp_47": "jv",
 
440
  "autonym": "Jawa",
441
  "speakers": 91180665,
442
  "family": "Austronesian",
443
+ "average": 0.41,
444
  "in_benchmark": true,
445
  "NaN": 0.0,
446
+ "classification_accuracy": 0.47,
447
+ "language_modeling_chrf": 0.93,
448
+ "translation_bleu": 0.24,
449
+ "translation_chrf": 0.42
450
  },
451
  {
452
  "bcp_47": "vi",
 
454
  "autonym": "Tiếng Việt",
455
  "speakers": 86222962,
456
  "family": "Austroasiatic",
457
+ "average": 0.45,
458
  "in_benchmark": true,
459
  "NaN": 0.0,
460
+ "classification_accuracy": 0.6,
461
+ "language_modeling_chrf": 0.96,
462
+ "translation_bleu": 0.26,
463
+ "translation_chrf": 0.44
464
  },
465
  {
466
  "bcp_47": "ta",
 
468
  "autonym": "தமிழ்",
469
  "speakers": 85616159,
470
  "family": "Dravidian",
471
+ "average": 0.41,
472
  "in_benchmark": true,
473
  "NaN": 0.0,
474
+ "classification_accuracy": 0.43,
475
+ "language_modeling_chrf": 0.96,
476
+ "translation_bleu": 0.25,
477
+ "translation_chrf": 0.42
478
  },
479
  {
480
  "bcp_47": "fa",
 
482
  "autonym": "فارسی",
483
  "speakers": 84710459,
484
  "family": "Indo-European",
485
+ "average": 0.41,
486
  "in_benchmark": true,
487
  "NaN": 0.0,
488
+ "classification_accuracy": 0.4,
489
+ "language_modeling_chrf": 0.94,
490
+ "translation_bleu": 0.26,
491
+ "translation_chrf": 0.45
492
  },
493
  {
494
  "bcp_47": "wuu",
 
510
  "autonym": "Türkçe",
511
  "speakers": 80360704,
512
  "family": "Turkic",
513
+ "average": 0.44,
514
  "in_benchmark": true,
515
  "NaN": 0.0,
516
+ "classification_accuracy": 0.53,
517
+ "language_modeling_chrf": 0.94,
518
+ "translation_bleu": 0.28,
519
+ "translation_chrf": 0.45
520
  },
521
  {
522
  "bcp_47": "yue",
 
524
  "autonym": "粵語",
525
  "speakers": 79654759,
526
  "family": "Sino-Tibetan",
527
+ "average": 0.39,
528
  "in_benchmark": true,
529
  "NaN": 0.0,
530
+ "classification_accuracy": 0.43,
531
+ "language_modeling_chrf": 0.9,
532
+ "translation_bleu": 0.23,
533
+ "translation_chrf": 0.41
534
  },
535
  {
536
  "bcp_47": "ko",
 
538
  "autonym": "한국어",
539
  "speakers": 78357046,
540
  "family": "Koreanic",
541
+ "average": 0.41,
542
  "in_benchmark": true,
543
  "NaN": 0.0,
544
+ "classification_accuracy": 0.53,
545
+ "language_modeling_chrf": 0.94,
546
+ "translation_bleu": 0.2,
547
+ "translation_chrf": 0.4
548
  },
549
  {
550
  "bcp_47": "it",
 
552
  "autonym": "Italiano",
553
  "speakers": 70247060,
554
  "family": "Indo-European",
555
+ "average": 0.47,
556
  "in_benchmark": true,
557
  "NaN": 0.0,
558
+ "classification_accuracy": 0.67,
559
+ "language_modeling_chrf": 0.94,
560
+ "translation_bleu": 0.28,
561
+ "translation_chrf": 0.47
562
  },
563
  {
564
  "bcp_47": "fil",
 
566
  "autonym": "Filipino",
567
  "speakers": 67471096,
568
  "family": "Austronesian",
569
+ "average": 0.42,
570
  "in_benchmark": true,
571
  "NaN": 0.0,
572
+ "classification_accuracy": 0.43,
573
+ "language_modeling_chrf": 0.94,
574
+ "translation_bleu": 0.29,
575
+ "translation_chrf": 0.45
576
  },
577
  {
578
  "bcp_47": "arz",
 
580
  "autonym": "Egyptian Arabic",
581
  "speakers": 66639360,
582
  "family": "Afro-Asiatic",
583
+ "average": 0.38,
584
  "in_benchmark": true,
585
  "NaN": 0.0,
586
+ "classification_accuracy": 0.4,
587
+ "language_modeling_chrf": 0.93,
588
+ "translation_bleu": 0.2,
589
+ "translation_chrf": 0.39
590
  },
591
  {
592
  "bcp_47": "gu",
 
594
  "autonym": "ગુજરાતી",
595
  "speakers": 61721799,
596
  "family": "Indo-European",
597
+ "average": 0.42,
598
  "in_benchmark": true,
599
  "NaN": 0.0,
600
+ "classification_accuracy": 0.43,
601
+ "language_modeling_chrf": 0.94,
602
+ "translation_bleu": 0.26,
603
+ "translation_chrf": 0.44
604
  },
605
  {
606
  "bcp_47": "th",
 
10164
  ]
10165
  },
10166
  "AE": {
10167
+ "score": 0.40140041521976655,
10168
  "languages": [
10169
  {
10170
  "name": "English",
 
10182
  "name": "Persian",
10183
  "bcp_47": "fa",
10184
  "population": 189850,
10185
+ "score": 0.41
10186
  },
10187
  {
10188
  "name": "Pashto",
 
10205
  ]
10206
  },
10207
  "AG": {
10208
+ "score": 0.4696346724027672,
10209
  "languages": [
10210
  {
10211
  "name": "English",
 
10217
  "name": "Portuguese",
10218
  "bcp_47": "pt",
10219
  "population": 1571,
10220
+ "score": 0.45
10221
  }
10222
  ]
10223
  },
 
10290
  ]
10291
  },
10292
  "AT": {
10293
+ "score": 0.31771431191158667,
10294
  "languages": [
10295
  {
10296
  "name": "English",
 
10308
  "name": "German",
10309
  "bcp_47": "de",
10310
  "population": 8593666,
10311
+ "score": 0.49
10312
  },
10313
  {
10314
  "name": "Italian",
10315
  "bcp_47": "it",
10316
  "population": 797350,
10317
+ "score": 0.47
10318
  },
10319
  {
10320
  "name": "Bavarian",
 
10343
  ]
10344
  },
10345
  "AU": {
10346
+ "score": 0.46970357171432847,
10347
  "languages": [
10348
  {
10349
  "name": "English",
 
10361
  "name": "Italian",
10362
  "bcp_47": "it",
10363
  "population": 483864,
10364
+ "score": 0.47
10365
  },
10366
  {
10367
  "name": "Hmong Njua",
 
10506
  ]
10507
  },
10508
  "BE": {
10509
+ "score": 0.29499472599184506,
10510
  "languages": [
10511
  {
10512
  "name": "English",
 
10524
  "name": "German",
10525
  "bcp_47": "de",
10526
  "population": 2578554,
10527
+ "score": 0.49
10528
  },
10529
  {
10530
  "name": "Dutch",
 
10547
  ]
10548
  },
10549
  "BG": {
10550
+ "score": 0.18479041916167663,
10551
  "languages": [
10552
  {
10553
  "name": "English",
 
10559
  "name": "Russian",
10560
  "bcp_47": "ru",
10561
  "population": 1602387,
10562
+ "score": 0.45
10563
  },
10564
  {
10565
  "name": "German",
10566
  "bcp_47": "de",
10567
  "population": 557352,
10568
+ "score": 0.49
10569
  },
10570
  {
10571
  "name": "Turkish",
10572
  "bcp_47": "tr",
10573
  "population": 766359,
10574
+ "score": 0.44
10575
  },
10576
  {
10577
  "name": "Bulgarian",
 
10582
  ]
10583
  },
10584
  "BI": {
10585
+ "score": 0.2226670965568091,
10586
  "languages": [
10587
  {
10588
  "name": "English",
 
10600
  "name": "Swahili",
10601
  "bcp_47": "sw",
10602
  "population": 6408,
10603
+ "score": 0.45
10604
  },
10605
  {
10606
  "name": "Rundi",
 
10645
  ]
10646
  },
10647
  "BR": {
10648
+ "score": 0.45070787745315494,
10649
  "languages": [
10650
  {
10651
  "name": "English",
 
10663
  "name": "Portuguese",
10664
  "bcp_47": "pt",
10665
  "population": 192661560,
10666
+ "score": 0.45
10667
  },
10668
  {
10669
  "name": "German",
10670
  "bcp_47": "de",
10671
  "population": 1778414,
10672
+ "score": 0.49
10673
  },
10674
  {
10675
  "name": "Japanese",
10676
  "bcp_47": "ja",
10677
  "population": 444604,
10678
+ "score": 0.46
10679
  },
10680
  {
10681
  "name": "Korean",
10682
  "bcp_47": "ko",
10683
  "population": 44460,
10684
+ "score": 0.41
10685
  },
10686
  {
10687
  "name": "Italian",
10688
  "bcp_47": "it",
10689
  "population": 592805,
10690
+ "score": 0.47
10691
  },
10692
  {
10693
  "name": "Venetian",
 
10819
  ]
10820
  },
10821
  "CA": {
10822
+ "score": 0.4538591979207903,
10823
  "languages": [
10824
  {
10825
  "name": "English",
 
10873
  "name": "Portuguese",
10874
  "bcp_47": "pt",
10875
  "population": 229934,
10876
+ "score": 0.45
10877
  },
10878
  {
10879
  "name": "Punjabi",
10880
  "bcp_47": "pa",
10881
  "population": 603106,
10882
+ "score": 0.43
10883
  },
10884
  {
10885
  "name": "Russian",
10886
  "bcp_47": "ru",
10887
  "population": 211087,
10888
+ "score": 0.45
10889
  },
10890
  {
10891
  "name": "German",
10892
  "bcp_47": "de",
10893
  "population": 294014,
10894
+ "score": 0.49
10895
  },
10896
  {
10897
  "name": "Japanese",
10898
  "bcp_47": "ja",
10899
  "population": 52772,
10900
+ "score": 0.46
10901
  },
10902
  {
10903
  "name": "Vietnamese",
10904
  "bcp_47": "vi",
10905
  "population": 184701,
10906
+ "score": 0.45
10907
  },
10908
  {
10909
  "name": "Tamil",
10910
  "bcp_47": "ta",
10911
  "population": 184701,
10912
+ "score": 0.41
10913
  },
10914
  {
10915
  "name": "Persian",
10916
  "bcp_47": "fa",
10917
  "population": 245012,
10918
+ "score": 0.41
10919
  },
10920
  {
10921
  "name": "Turkish",
10922
  "bcp_47": "tr",
10923
  "population": 37694,
10924
+ "score": 0.44
10925
  },
10926
  {
10927
  "name": "Cantonese",
10928
  "bcp_47": "yue",
10929
  "population": 640800,
10930
+ "score": 0.39
10931
  },
10932
  {
10933
  "name": "Korean",
10934
  "bcp_47": "ko",
10935
  "population": 169623,
10936
+ "score": 0.41
10937
  },
10938
  {
10939
  "name": "Italian",
10940
  "bcp_47": "it",
10941
  "population": 343016,
10942
+ "score": 0.47
10943
  },
10944
  {
10945
  "name": "Filipino",
10946
  "bcp_47": "fil",
10947
  "population": 565412,
10948
+ "score": 0.42
10949
  },
10950
  {
10951
  "name": "Gujarati",
10952
  "bcp_47": "gu",
10953
  "population": 135699,
10954
+ "score": 0.42
10955
  },
10956
  {
10957
  "name": "Polish",
 
11189
  ]
11190
  },
11191
  "CH": {
11192
+ "score": 0.33368138748580556,
11193
  "languages": [
11194
  {
11195
  "name": "English",
 
11207
  "name": "Portuguese",
11208
  "bcp_47": "pt",
11209
  "population": 285736,
11210
+ "score": 0.45
11211
  },
11212
  {
11213
  "name": "German",
11214
  "bcp_47": "de",
11215
  "population": 6134913,
11216
+ "score": 0.49
11217
  },
11218
  {
11219
  "name": "Italian",
11220
  "bcp_47": "it",
11221
  "population": 361372,
11222
+ "score": 0.47
11223
  },
11224
  {
11225
  "name": "Swiss German",
 
11455
  ]
11456
  },
11457
  "CN": {
11458
+ "score": 0.38724457341349466,
11459
  "languages": [
11460
  {
11461
  "name": "English",
 
11473
  "name": "Russian",
11474
  "bcp_47": "ru",
11475
  "population": 13940,
11476
+ "score": 0.45
11477
  },
11478
  {
11479
  "name": "Vietnamese",
11480
  "bcp_47": "vi",
11481
  "population": 6970,
11482
+ "score": 0.45
11483
  },
11484
  {
11485
  "name": "Wu Chinese",
 
11491
  "name": "Cantonese",
11492
  "bcp_47": "yue",
11493
  "population": 72489040,
11494
+ "score": 0.39
11495
  },
11496
  {
11497
  "name": "Korean",
11498
  "bcp_47": "ko",
11499
  "population": 2091030,
11500
+ "score": 0.41
11501
  },
11502
  {
11503
  "name": "Xiang Chinese",
 
11649
  ]
11650
  },
11651
  "CY": {
11652
+ "score": 0.2404799926753925,
11653
  "languages": [
11654
  {
11655
  "name": "English",
 
11673
  "name": "Turkish",
11674
  "bcp_47": "tr",
11675
  "population": 291336,
11676
+ "score": 0.44
11677
  },
11678
  {
11679
  "name": "Greek",
 
11690
  ]
11691
  },
11692
  "CZ": {
11693
+ "score": 0.12805930282531847,
11694
  "languages": [
11695
  {
11696
  "name": "English",
 
11702
  "name": "German",
11703
  "bcp_47": "de",
11704
  "population": 1605375,
11705
+ "score": 0.49
11706
  },
11707
  {
11708
  "name": "Polish",
 
11725
  ]
11726
  },
11727
  "DE": {
11728
+ "score": 0.3765932308207555,
11729
  "languages": [
11730
  {
11731
  "name": "English",
 
11749
  "name": "Russian",
11750
  "bcp_47": "ru",
11751
  "population": 4809582,
11752
+ "score": 0.45
11753
  },
11754
  {
11755
  "name": "German",
11756
  "bcp_47": "de",
11757
  "population": 72945327,
11758
+ "score": 0.49
11759
  },
11760
  {
11761
  "name": "Turkish",
11762
  "bcp_47": "tr",
11763
  "population": 2003992,
11764
+ "score": 0.44
11765
  },
11766
  {
11767
  "name": "Italian",
11768
  "bcp_47": "it",
11769
  "population": 5611179,
11770
+ "score": 0.47
11771
  },
11772
  {
11773
  "name": "Polish",
 
11891
  ]
11892
  },
11893
  "DK": {
11894
+ "score": 0.2649269539952979,
11895
  "languages": [
11896
  {
11897
  "name": "English",
 
11903
  "name": "German",
11904
  "bcp_47": "de",
11905
  "population": 2758623,
11906
+ "score": 0.49
11907
  },
11908
  {
11909
  "name": "Swedish",
 
12001
  ]
12002
  },
12003
  "EE": {
12004
+ "score": 0.23907703243578238,
12005
  "languages": [
12006
  {
12007
  "name": "English",
 
12013
  "name": "Russian",
12014
  "bcp_47": "ru",
12015
  "population": 688027,
12016
+ "score": 0.45
12017
  },
12018
  {
12019
  "name": "Finnish",
 
12042
  ]
12043
  },
12044
  "EG": {
12045
+ "score": 0.4156717299521135,
12046
  "languages": [
12047
  {
12048
  "name": "English",
 
12060
  "name": "Egyptian Arabic",
12061
  "bcp_47": "arz",
12062
  "population": 66639360,
12063
+ "score": 0.38
12064
  },
12065
  {
12066
  "name": "Greek",
 
12236
  ]
12237
  },
12238
  "FI": {
12239
+ "score": 0.18533875082776866,
12240
  "languages": [
12241
  {
12242
  "name": "English",
 
12248
  "name": "Russian",
12249
  "bcp_47": "ru",
12250
  "population": 45131,
12251
+ "score": 0.45
12252
  },
12253
  {
12254
  "name": "German",
12255
  "bcp_47": "de",
12256
  "population": 1002901,
12257
+ "score": 0.49
12258
  },
12259
  {
12260
  "name": "Swedish",
 
12388
  ]
12389
  },
12390
  "FR": {
12391
+ "score": 0.4436463938115849,
12392
  "languages": [
12393
  {
12394
  "name": "English",
 
12412
  "name": "Portuguese",
12413
  "bcp_47": "pt",
12414
  "population": 882027,
12415
+ "score": 0.45
12416
  },
12417
  {
12418
  "name": "German",
12419
  "bcp_47": "de",
12420
  "population": 3392410,
12421
+ "score": 0.49
12422
  },
12423
  {
12424
  "name": "Italian",
12425
  "bcp_47": "it",
12426
  "population": 1153419,
12427
+ "score": 0.47
12428
  },
12429
  {
12430
  "name": "Dutch",
 
12495
  ]
12496
  },
12497
  "GB": {
12498
+ "score": 0.43956766255639257,
12499
  "languages": [
12500
  {
12501
  "name": "English",
 
12543
  "name": "Portuguese",
12544
  "bcp_47": "pt",
12545
  "population": 131522,
12546
+ "score": 0.45
12547
  },
12548
  {
12549
  "name": "Punjabi",
12550
  "bcp_47": "pa",
12551
  "population": 2367400,
12552
+ "score": 0.43
12553
  },
12554
  {
12555
  "name": "German",
12556
  "bcp_47": "de",
12557
  "population": 5918499,
12558
+ "score": 0.49
12559
  },
12560
  {
12561
  "name": "Tamil",
12562
  "bcp_47": "ta",
12563
  "population": 2104355,
12564
+ "score": 0.41
12565
  },
12566
  {
12567
  "name": "Turkish",
12568
  "bcp_47": "tr",
12569
  "population": 131522,
12570
+ "score": 0.44
12571
  },
12572
  {
12573
  "name": "Italian",
12574
  "bcp_47": "it",
12575
  "population": 131522,
12576
+ "score": 0.47
12577
  },
12578
  {
12579
  "name": "Gujarati",
12580
  "bcp_47": "gu",
12581
  "population": 1907072,
12582
+ "score": 0.42
12583
  },
12584
  {
12585
  "name": "Polish",
 
12765
  ]
12766
  },
12767
  "GR": {
12768
+ "score": 0.18194383576443016,
12769
  "languages": [
12770
  {
12771
  "name": "English",
 
12783
  "name": "German",
12784
  "bcp_47": "de",
12785
  "population": 530355,
12786
+ "score": 0.49
12787
  },
12788
  {
12789
  "name": "Turkish",
12790
  "bcp_47": "tr",
12791
  "population": 127285,
12792
+ "score": 0.44
12793
  },
12794
  {
12795
  "name": "Greek",
 
12869
  ]
12870
  },
12871
  "HK": {
12872
+ "score": 0.4359751035397035,
12873
  "languages": [
12874
  {
12875
  "name": "English",
 
12887
  "name": "Cantonese",
12888
  "bcp_47": "yue",
12889
  "population": 6524919,
12890
+ "score": 0.39
12891
  }
12892
  ]
12893
  },
 
12920
  ]
12921
  },
12922
  "HR": {
12923
+ "score": 0.15823024946225459,
12924
  "languages": [
12925
  {
12926
  "name": "English",
 
12932
  "name": "Italian",
12933
  "bcp_47": "it",
12934
  "population": 67644,
12935
+ "score": 0.47
12936
  },
12937
  {
12938
  "name": "Croatian",
 
12949
  ]
12950
  },
12951
  "HU": {
12952
+ "score": 0.13756219151316587,
12953
  "languages": [
12954
  {
12955
  "name": "English",
 
12967
  "name": "German",
12968
  "bcp_47": "de",
12969
  "population": 1758929,
12970
+ "score": 0.49
12971
  },
12972
  {
12973
  "name": "Romanian",
 
13025
  ]
13026
  },
13027
  "IL": {
13028
+ "score": 0.21817259544999,
13029
  "languages": [
13030
  {
13031
  "name": "English",
 
13043
  "name": "Russian",
13044
  "bcp_47": "ru",
13045
  "population": 954303,
13046
+ "score": 0.45
13047
  },
13048
  {
13049
  "name": "Malayalam",
 
13125
  ]
13126
  },
13127
  "IN": {
13128
+ "score": 0.3397907454052606,
13129
  "languages": [
13130
  {
13131
  "name": "English",
 
13155
  "name": "Punjabi",
13156
  "bcp_47": "pa",
13157
  "population": 37130520,
13158
+ "score": 0.43
13159
  },
13160
  {
13161
  "name": "Telugu",
13162
  "bcp_47": "te",
13163
  "population": 95478480,
13164
+ "score": 0.41
13165
  },
13166
  {
13167
  "name": "Western Panjabi",
 
13173
  "name": "Marathi",
13174
  "bcp_47": "mr",
13175
  "population": 92826300,
13176
+ "score": 0.45
13177
  },
13178
  {
13179
  "name": "Tamil",
13180
  "bcp_47": "ta",
13181
  "population": 78239310,
13182
+ "score": 0.41
13183
  },
13184
  {
13185
  "name": "Gujarati",
13186
  "bcp_47": "gu",
13187
  "population": 59674050,
13188
+ "score": 0.42
13189
  },
13190
  {
13191
  "name": "Kannada",
 
13603
  ]
13604
  },
13605
  "IQ": {
13606
+ "score": 0.357837983423388,
13607
  "languages": [
13608
  {
13609
  "name": "English",
 
13621
  "name": "Persian",
13622
  "bcp_47": "fa",
13623
  "population": 338192,
13624
+ "score": 0.41
13625
  },
13626
  {
13627
  "name": "Azerbaijani",
 
13650
  ]
13651
  },
13652
  "IT": {
13653
+ "score": 0.43224641662655555,
13654
  "languages": [
13655
  {
13656
  "name": "English",
 
13668
  "name": "German",
13669
  "bcp_47": "de",
13670
  "population": 998443,
13671
+ "score": 0.49
13672
  },
13673
  {
13674
  "name": "Italian",
13675
  "bcp_47": "it",
13676
  "population": 59282565,
13677
+ "score": 0.47
13678
  },
13679
  {
13680
  "name": "Greek",
 
13820
  ]
13821
  },
13822
  "KE": {
13823
+ "score": 0.2501476621404106,
13824
  "languages": [
13825
  {
13826
  "name": "English",
 
13838
  "name": "Punjabi",
13839
  "bcp_47": "pa",
13840
  "population": 10170,
13841
+ "score": 0.43
13842
  },
13843
  {
13844
  "name": "Swahili",
13845
  "bcp_47": "sw",
13846
  "population": 35328414,
13847
+ "score": 0.45
13848
  },
13849
  {
13850
  "name": "Gujarati",
13851
  "bcp_47": "gu",
13852
  "population": 4978,
13853
+ "score": 0.42
13854
  },
13855
  {
13856
  "name": "Oromo",
 
13984
  ]
13985
  },
13986
  "KZ": {
13987
+ "score": 0.2671643693028198,
13988
  "languages": [
13989
  {
13990
  "name": "English",
 
13996
  "name": "Russian",
13997
  "bcp_47": "ru",
13998
  "population": 13746168,
13999
+ "score": 0.45
14000
  },
14001
  {
14002
  "name": "German",
14003
  "bcp_47": "de",
14004
  "population": 1221882,
14005
+ "score": 0.49
14006
  },
14007
  {
14008
  "name": "Kazakh",
 
14071
  ]
14072
  },
14073
  "LK": {
14074
+ "score": 0.11666666666666665,
14075
  "languages": [
14076
  {
14077
  "name": "English",
 
14083
  "name": "Tamil",
14084
  "bcp_47": "ta",
14085
  "population": 3433380,
14086
+ "score": 0.41
14087
  },
14088
  {
14089
  "name": "Sinhala",
 
14164
  ]
14165
  },
14166
  "LT": {
14167
+ "score": 0.2785320836068621,
14168
  "languages": [
14169
  {
14170
  "name": "English",
 
14176
  "name": "Russian",
14177
  "bcp_47": "ru",
14178
  "population": 2185168,
14179
+ "score": 0.45
14180
  },
14181
  {
14182
  "name": "German",
14183
  "bcp_47": "de",
14184
  "population": 382404,
14185
+ "score": 0.49
14186
  },
14187
  {
14188
  "name": "Lithuanian",
 
14199
  ]
14200
  },
14201
  "LU": {
14202
+ "score": 0.3612802832567923,
14203
  "languages": [
14204
  {
14205
  "name": "English",
 
14217
  "name": "Portuguese",
14218
  "bcp_47": "pt",
14219
  "population": 100541,
14220
+ "score": 0.45
14221
  },
14222
  {
14223
  "name": "German",
14224
  "bcp_47": "de",
14225
  "population": 395880,
14226
+ "score": 0.49
14227
  },
14228
  {
14229
  "name": "Luxembourgish",
 
14234
  ]
14235
  },
14236
  "LV": {
14237
+ "score": 0.2515919974081345,
14238
  "languages": [
14239
  {
14240
  "name": "English",
 
14246
  "name": "Russian",
14247
  "bcp_47": "ru",
14248
  "population": 714867,
14249
+ "score": 0.45
14250
  },
14251
  {
14252
  "name": "Latvian",
 
14362
  ]
14363
  },
14364
  "MO": {
14365
+ "score": 0.4597552187538731,
14366
  "languages": [
14367
  {
14368
  "name": "English",
 
14380
  "name": "Portuguese",
14381
  "bcp_47": "pt",
14382
  "population": 30723,
14383
+ "score": 0.45
14384
  }
14385
  ]
14386
  },
 
14413
  ]
14414
  },
14415
  "MT": {
14416
+ "score": 0.28525492889983195,
14417
  "languages": [
14418
  {
14419
  "name": "English",
 
14431
  "name": "Italian",
14432
  "bcp_47": "it",
14433
  "population": 256070,
14434
+ "score": 0.47
14435
  },
14436
  {
14437
  "name": "Maltese",
 
14442
  ]
14443
  },
14444
  "MU": {
14445
+ "score": 0.19243355389764255,
14446
  "languages": [
14447
  {
14448
  "name": "English",
 
14466
  "name": "Tamil",
14467
  "bcp_47": "ta",
14468
  "population": 34484,
14469
+ "score": 0.41
14470
  },
14471
  {
14472
  "name": "Bhojpuri",
 
14594
  ]
14595
  },
14596
  "MY": {
14597
+ "score": 0.1619475361727729,
14598
  "languages": [
14599
  {
14600
  "name": "English",
 
14612
  "name": "Javanese",
14613
  "bcp_47": "jv",
14614
  "population": 391825,
14615
+ "score": 0.41
14616
  },
14617
  {
14618
  "name": "Tamil",
14619
  "bcp_47": "ta",
14620
  "population": 1371388,
14621
+ "score": 0.41
14622
  },
14623
  {
14624
  "name": "Malayalam",
 
14665
  ]
14666
  },
14667
  "NA": {
14668
+ "score": 0.023383111654627774,
14669
  "languages": [
14670
  {
14671
  "name": "English",
 
14677
  "name": "German",
14678
  "bcp_47": "de",
14679
  "population": 23671,
14680
+ "score": 0.49
14681
  },
14682
  {
14683
  "name": "Afrikaans",
 
14836
  ]
14837
  },
14838
  "NL": {
14839
+ "score": 0.28688749989149553,
14840
  "languages": [
14841
  {
14842
  "name": "English",
 
14854
  "name": "Indonesian",
14855
  "bcp_47": "id",
14856
  "population": 311047,
14857
+ "score": 0.47
14858
  },
14859
  {
14860
  "name": "German",
14861
  "bcp_47": "de",
14862
  "population": 12269084,
14863
+ "score": 0.49
14864
  },
14865
  {
14866
  "name": "Turkish",
14867
  "bcp_47": "tr",
14868
  "population": 207365,
14869
+ "score": 0.44
14870
  },
14871
  {
14872
  "name": "Dutch",
 
15183
  ]
15184
  },
15185
  "PH": {
15186
+ "score": 0.32615211365536473,
15187
  "languages": [
15188
  {
15189
  "name": "English",
 
15207
  "name": "Filipino",
15208
  "bcp_47": "fil",
15209
  "population": 65508600,
15210
+ "score": 0.42
15211
  },
15212
  {
15213
  "name": "Cebuano",
 
15308
  ]
15309
  },
15310
  "PK": {
15311
+ "score": 0.30567966556461956,
15312
  "languages": [
15313
  {
15314
  "name": "English",
 
15326
  "name": "Punjabi",
15327
  "bcp_47": "pa",
15328
  "population": 163450700,
15329
+ "score": 0.43
15330
  },
15331
  {
15332
  "name": "Western Panjabi",
 
15338
  "name": "Persian",
15339
  "bcp_47": "fa",
15340
  "population": 1541107,
15341
+ "score": 0.41
15342
  },
15343
  {
15344
  "name": "Pashto",
 
15457
  ]
15458
  },
15459
  "PL": {
15460
+ "score": 0.19542647519424666,
15461
  "languages": [
15462
  {
15463
  "name": "English",
 
15469
  "name": "Russian",
15470
  "bcp_47": "ru",
15471
  "population": 6890814,
15472
+ "score": 0.45
15473
  },
15474
  {
15475
  "name": "German",
15476
  "bcp_47": "de",
15477
  "population": 7273637,
15478
+ "score": 0.49
15479
  },
15480
  {
15481
  "name": "Polish",
 
15573
  ]
15574
  },
15575
  "PT": {
15576
+ "score": 0.4542324762390237,
15577
  "languages": [
15578
  {
15579
  "name": "English",
 
15597
  "name": "Portuguese",
15598
  "bcp_47": "pt",
15599
  "population": 9890592,
15600
+ "score": 0.45
15601
  },
15602
  {
15603
  "name": "Galician",
 
15625
  ]
15626
  },
15627
  "RO": {
15628
+ "score": 0.1743772772485309,
15629
  "languages": [
15630
  {
15631
  "name": "English",
 
15649
  "name": "German",
15650
  "bcp_47": "de",
15651
  "population": 44736,
15652
+ "score": 0.49
15653
  },
15654
  {
15655
  "name": "Turkish",
15656
  "bcp_47": "tr",
15657
  "population": 27694,
15658
+ "score": 0.44
15659
  },
15660
  {
15661
  "name": "Polish",
 
15883
  ]
15884
  },
15885
  "SG": {
15886
+ "score": 0.4294592881506046,
15887
  "languages": [
15888
  {
15889
  "name": "English",
 
15901
  "name": "Punjabi",
15902
  "bcp_47": "pa",
15903
  "population": 9314,
15904
+ "score": 0.43
15905
  },
15906
  {
15907
  "name": "Tamil",
15908
  "bcp_47": "ta",
15909
  "population": 130403,
15910
+ "score": 0.41
15911
  },
15912
  {
15913
  "name": "Malayalam",
 
15935
  ]
15936
  },
15937
  "SI": {
15938
+ "score": 0.1928028123892293,
15939
  "languages": [
15940
  {
15941
  "name": "English",
 
15947
  "name": "German",
15948
  "bcp_47": "de",
15949
  "population": 883126,
15950
+ "score": 0.49
15951
  },
15952
  {
15953
  "name": "Italian",
15954
  "bcp_47": "it",
15955
  "population": 3995,
15956
+ "score": 0.47
15957
  },
15958
  {
15959
  "name": "Hungarian",
 
15982
  ]
15983
  },
15984
  "SK": {
15985
+ "score": 0.11567670853229638,
15986
  "languages": [
15987
  {
15988
  "name": "English",
 
15994
  "name": "German",
15995
  "bcp_47": "de",
15996
  "population": 1196932,
15997
+ "score": 0.49
15998
  },
15999
  {
16000
  "name": "Polish",
 
16290
  ]
16291
  },
16292
  "TR": {
16293
+ "score": 0.38853953080443926,
16294
  "languages": [
16295
  {
16296
  "name": "English",
 
16308
  "name": "Turkish",
16309
  "bcp_47": "tr",
16310
  "population": 76276275,
16311
+ "score": 0.44
16312
  },
16313
  {
16314
  "name": "North Levantine Arabic",
 
16467
  ]
16468
  },
16469
  "TZ": {
16470
+ "score": 0.3952631230768349,
16471
  "languages": [
16472
  {
16473
  "name": "English",
 
16479
  "name": "Swahili",
16480
  "bcp_47": "sw",
16481
  "population": 52697520,
16482
+ "score": 0.45
16483
  },
16484
  {
16485
  "name": "Sukuma",
 
16568
  ]
16569
  },
16570
  "UG": {
16571
+ "score": 0.2797477934487195,
16572
  "languages": [
16573
  {
16574
  "name": "English",
 
16586
  "name": "Swahili",
16587
  "bcp_47": "sw",
16588
  "population": 32439750,
16589
+ "score": 0.45
16590
  },
16591
  {
16592
  "name": "Kinyarwanda",
 
16662
  ]
16663
  },
16664
  "US": {
16665
+ "score": 0.46680423711359387,
16666
  "languages": [
16667
  {
16668
  "name": "English",
 
16692
  "name": "Russian",
16693
  "bcp_47": "ru",
16694
  "population": 798334,
16695
+ "score": 0.45
16696
  },
16697
  {
16698
  "name": "German",
16699
  "bcp_47": "de",
16700
  "population": 1563403,
16701
+ "score": 0.49
16702
  },
16703
  {
16704
  "name": "Vietnamese",
16705
  "bcp_47": "vi",
16706
  "population": 1130973,
16707
+ "score": 0.45
16708
  },
16709
  {
16710
  "name": "Korean",
16711
  "bcp_47": "ko",
16712
  "population": 997917,
16713
+ "score": 0.41
16714
  },
16715
  {
16716
  "name": "Italian",
16717
  "bcp_47": "it",
16718
  "population": 1130973,
16719
+ "score": 0.47
16720
  },
16721
  {
16722
  "name": "Filipino",
16723
  "bcp_47": "fil",
16724
  "population": 1397084,
16725
+ "score": 0.42
16726
  },
16727
  {
16728
  "name": "Yiddish",
 
16925
  ]
16926
  },
16927
  "ZA": {
16928
+ "score": 0.12442237800209865,
16929
  "languages": [
16930
  {
16931
  "name": "English",
 
16943
  "name": "Swahili",
16944
  "bcp_47": "sw",
16945
  "population": 1016,
16946
+ "score": 0.45
16947
  },
16948
  {
16949
  "name": "Zulu",
 
17125
  ]
17126
  },
17127
  "ID": {
17128
+ "score": 0.3194548673228042,
17129
  "languages": [
17130
  {
17131
  "name": "Chinese",
 
17137
  "name": "Indonesian",
17138
  "bcp_47": "id",
17139
  "population": 170896640,
17140
+ "score": 0.47
17141
  },
17142
  {
17143
  "name": "Javanese",
17144
  "bcp_47": "jv",
17145
  "population": 90788840,
17146
+ "score": 0.41
17147
  },
17148
  {
17149
  "name": "Malay",
 
17304
  ]
17305
  },
17306
  "MN": {
17307
+ "score": 0.006903243016889744,
17308
  "languages": [
17309
  {
17310
  "name": "Chinese",
 
17316
  "name": "Russian",
17317
  "bcp_47": "ru",
17318
  "population": 4118,
17319
+ "score": 0.45
17320
  },
17321
  {
17322
  "name": "Kazakh",
 
17408
  ]
17409
  },
17410
  "VN": {
17411
+ "score": 0.44527479082463184,
17412
  "languages": [
17413
  {
17414
  "name": "Chinese",
 
17420
  "name": "Vietnamese",
17421
  "bcp_47": "vi",
17422
  "population": 84900318,
17423
+ "score": 0.45
17424
  },
17425
  {
17426
  "name": "Hmong Njua",
 
17603
  ]
17604
  },
17605
  "GQ": {
17606
+ "score": 0.27923739669086073,
17607
  "languages": [
17608
  {
17609
  "name": "Spanish",
 
17621
  "name": "Portuguese",
17622
  "bcp_47": "pt",
17623
  "population": 1,
17624
+ "score": 0.45
17625
  },
17626
  {
17627
  "name": "Fang",
 
17700
  ]
17701
  },
17702
  "PY": {
17703
+ "score": 0.03322879759433273,
17704
  "languages": [
17705
  {
17706
  "name": "Spanish",
 
17712
  "name": "German",
17713
  "bcp_47": "de",
17714
  "population": 208559,
17715
+ "score": 0.49
17716
  },
17717
  {
17718
  "name": "Guarani",
 
17819
  ]
17820
  },
17821
  "IR": {
17822
+ "score": 0.23949254115959248,
17823
  "languages": [
17824
  {
17825
  "name": "Arabic",
 
17831
  "name": "Persian",
17832
  "bcp_47": "fa",
17833
  "population": 63692475,
17834
+ "score": 0.41
17835
  },
17836
  {
17837
  "name": "Pashto",
 
18166
  ]
18167
  },
18168
  "OM": {
18169
+ "score": 0.3961930102252659,
18170
  "languages": [
18171
  {
18172
  "name": "Arabic",
 
18178
  "name": "Persian",
18179
  "bcp_47": "fa",
18180
  "population": 43849,
18181
+ "score": 0.41
18182
  },
18183
  {
18184
  "name": "Baluchi",
 
18206
  ]
18207
  },
18208
  "QA": {
18209
+ "score": 0.41777205848450016,
18210
  "languages": [
18211
  {
18212
  "name": "Arabic",
 
18218
  "name": "Persian",
18219
  "bcp_47": "fa",
18220
  "population": 268859,
18221
+ "score": 0.41
18222
  },
18223
  {
18224
  "name": "Malayalam",
 
18246
  ]
18247
  },
18248
  "SO": {
18249
+ "score": 0.1326691120161243,
18250
  "languages": [
18251
  {
18252
  "name": "Arabic",
 
18258
  "name": "Swahili",
18259
  "bcp_47": "sw",
18260
  "population": 235142,
18261
+ "score": 0.45
18262
  },
18263
  {
18264
  "name": "Oromo",
 
18333
  ]
18334
  },
18335
  "TJ": {
18336
+ "score": 0.05075244729560809,
18337
  "languages": [
18338
  {
18339
  "name": "Arabic",
 
18345
  "name": "Russian",
18346
  "bcp_47": "ru",
18347
  "population": 1064840,
18348
+ "score": 0.45
18349
  },
18350
  {
18351
  "name": "Persian",
18352
  "bcp_47": "fa",
18353
  "population": 69215,
18354
+ "score": 0.41
18355
  },
18356
  {
18357
  "name": "Tajik",
 
18454
  ]
18455
  },
18456
  "CD": {
18457
+ "score": 0.34013185580025246,
18458
  "languages": [
18459
  {
18460
  "name": "French",
 
18466
  "name": "Swahili",
18467
  "bcp_47": "sw",
18468
  "population": 50890000,
18469
+ "score": 0.45
18470
  },
18471
  {
18472
  "name": "Kinyarwanda",
 
18718
  ]
18719
  },
18720
  "RE": {
18721
+ "score": 0.26908571814147125,
18722
  "languages": [
18723
  {
18724
  "name": "French",
 
18730
  "name": "Tamil",
18731
  "bcp_47": "ta",
18732
  "population": 118138,
18733
+ "score": 0.41
18734
  },
18735
  {
18736
  "name": "Réunion Creole French",
 
18887
  ]
18888
  },
18889
  "YT": {
18890
+ "score": 0.15850059031877214,
18891
  "languages": [
18892
  {
18893
  "name": "French",
 
18899
  "name": "Swahili",
18900
  "bcp_47": "sw",
18901
  "population": 2716,
18902
+ "score": 0.45
18903
  },
18904
  {
18905
  "name": "Comorian",
 
18916
  ]
18917
  },
18918
  "AO": {
18919
+ "score": 0.2478014326653792,
18920
  "languages": [
18921
  {
18922
  "name": "Portuguese",
18923
  "bcp_47": "pt",
18924
  "population": 21789941,
18925
+ "score": 0.45
18926
  },
18927
  {
18928
  "name": "Umbundu",
 
18945
  ]
18946
  },
18947
  "CV": {
18948
+ "score": 0.20479048002332564,
18949
  "languages": [
18950
  {
18951
  "name": "Portuguese",
18952
  "bcp_47": "pt",
18953
  "population": 443274,
18954
+ "score": 0.45
18955
  },
18956
  {
18957
  "name": "Kabuverdianu",
 
18962
  ]
18963
  },
18964
  "GW": {
18965
+ "score": 0.43859551519338624,
18966
  "languages": [
18967
  {
18968
  "name": "Portuguese",
18969
  "bcp_47": "pt",
18970
  "population": 1927100,
18971
+ "score": 0.45
18972
  },
18973
  {
18974
  "name": "Fula",
 
18985
  ]
18986
  },
18987
  "MZ": {
18988
+ "score": 0.1480934184335346,
18989
  "languages": [
18990
  {
18991
  "name": "Portuguese",
18992
  "bcp_47": "pt",
18993
  "population": 8126514,
18994
+ "score": 0.45
18995
  },
18996
  {
18997
  "name": "Swahili",
18998
  "bcp_47": "sw",
18999
  "population": 9330,
19000
+ "score": 0.45
19001
  },
19002
  {
19003
  "name": "Nyanja",
 
19062
  ]
19063
  },
19064
  "ST": {
19065
+ "score": 0.45,
19066
  "languages": [
19067
  {
19068
  "name": "Portuguese",
19069
  "bcp_47": "pt",
19070
  "population": 179454,
19071
+ "score": 0.45
19072
  }
19073
  ]
19074
  },
19075
  "TL": {
19076
+ "score": 0.225,
19077
  "languages": [
19078
  {
19079
  "name": "Portuguese",
19080
  "bcp_47": "pt",
19081
  "population": 816395,
19082
+ "score": 0.45
19083
  },
19084
  {
19085
  "name": "Tetum",
 
19090
  ]
19091
  },
19092
  "BY": {
19093
+ "score": 0.04821427057437069,
19094
  "languages": [
19095
  {
19096
  "name": "Russian",
19097
  "bcp_47": "ru",
19098
  "population": 1137350,
19099
+ "score": 0.45
19100
  },
19101
  {
19102
  "name": "Belarusian",
 
19107
  ]
19108
  },
19109
  "GE": {
19110
+ "score": 0.03423789210395573,
19111
  "languages": [
19112
  {
19113
  "name": "Russian",
19114
  "bcp_47": "ru",
19115
  "population": 359730,
19116
+ "score": 0.45
19117
  },
19118
  {
19119
  "name": "Kurdish",
 
19154
  ]
19155
  },
19156
  "KG": {
19157
+ "score": 0.19285714285714287,
19158
  "languages": [
19159
  {
19160
  "name": "Russian",
19161
  "bcp_47": "ru",
19162
  "population": 2147364,
19163
+ "score": 0.45
19164
  },
19165
  {
19166
  "name": "Kyrgyz",
 
19171
  ]
19172
  },
19173
  "MD": {
19174
+ "score": 0.014563109130777574,
19175
  "languages": [
19176
  {
19177
  "name": "Russian",
19178
  "bcp_47": "ru",
19179
  "population": 100935,
19180
+ "score": 0.45
19181
  },
19182
  {
19183
  "name": "Ukrainian",
 
19206
  ]
19207
  },
19208
  "RU": {
19209
+ "score": 0.4065329789745318,
19210
  "languages": [
19211
  {
19212
  "name": "Russian",
19213
  "bcp_47": "ru",
19214
  "population": 133218680,
19215
+ "score": 0.45
19216
  },
19217
  {
19218
  "name": "Azerbaijani",
 
19427
  ]
19428
  },
19429
  "SJ": {
19430
+ "score": 0.20059435364041606,
19431
  "languages": [
19432
  {
19433
  "name": "Russian",
19434
  "bcp_47": "ru",
19435
  "population": 1200,
19436
+ "score": 0.45
19437
  },
19438
  {
19439
  "name": "Norwegian Bokmål",
 
19444
  ]
19445
  },
19446
  "TM": {
19447
+ "score": 0.059080984625687366,
19448
  "languages": [
19449
  {
19450
  "name": "Russian",
19451
  "bcp_47": "ru",
19452
  "population": 663436,
19453
+ "score": 0.45
19454
  },
19455
  {
19456
  "name": "Uzbek",
 
19473
  ]
19474
  },
19475
  "UA": {
19476
+ "score": 0.17534632621240526,
19477
  "languages": [
19478
  {
19479
  "name": "Russian",
19480
  "bcp_47": "ru",
19481
  "population": 20204534,
19482
+ "score": 0.45
19483
  },
19484
  {
19485
  "name": "Turkish",
19486
  "bcp_47": "tr",
19487
  "population": 184476,
19488
+ "score": 0.44
19489
  },
19490
  {
19491
  "name": "Polish",
 
19550
  ]
19551
  },
19552
  "UZ": {
19553
+ "score": 0.05701615696541229,
19554
  "languages": [
19555
  {
19556
  "name": "Russian",
19557
  "bcp_47": "ru",
19558
  "population": 4279156,
19559
+ "score": 0.45
19560
  },
19561
  {
19562
  "name": "Turkish",
19563
  "bcp_47": "tr",
19564
  "population": 232297,
19565
+ "score": 0.44
19566
  },
19567
  {
19568
  "name": "Uzbek",
 
19579
  ]
19580
  },
19581
  "LI": {
19582
+ "score": 0.26022294592577516,
19583
  "languages": [
19584
  {
19585
  "name": "German",
19586
  "bcp_47": "de",
19587
  "population": 39137,
19588
+ "score": 0.49
19589
  },
19590
  {
19591
  "name": "Swiss German",
 
19602
  ]
19603
  },
19604
  "JP": {
19605
+ "score": 0.4560515108353953,
19606
  "languages": [
19607
  {
19608
  "name": "Japanese",
19609
  "bcp_47": "ja",
19610
  "population": 119231650,
19611
+ "score": 0.46
19612
  },
19613
  {
19614
  "name": "Korean",
19615
  "bcp_47": "ko",
19616
  "population": 652636,
19617
+ "score": 0.41
19618
  },
19619
  {
19620
  "name": "Central Okinawan",
 
19625
  ]
19626
  },
19627
  "AF": {
19628
+ "score": 0.19133182400153392,
19629
  "languages": [
19630
  {
19631
  "name": "Persian",
19632
  "bcp_47": "fa",
19633
  "population": 18321900,
19634
+ "score": 0.41
19635
  },
19636
  {
19637
  "name": "Pashto",
 
19684
  ]
19685
  },
19686
  "MK": {
19687
+ "score": 0.016125668065966572,
19688
  "languages": [
19689
  {
19690
  "name": "Turkish",
19691
  "bcp_47": "tr",
19692
  "population": 74409,
19693
+ "score": 0.44
19694
  },
19695
  {
19696
  "name": "Albanian",
 
19707
  ]
19708
  },
19709
  "KP": {
19710
+ "score": 0.41,
19711
  "languages": [
19712
  {
19713
  "name": "Korean",
19714
  "bcp_47": "ko",
19715
  "population": 22566280,
19716
+ "score": 0.41
19717
  }
19718
  ]
19719
  },
19720
  "KR": {
19721
+ "score": 0.41,
19722
  "languages": [
19723
  {
19724
  "name": "Korean",
19725
  "bcp_47": "ko",
19726
  "population": 51835100,
19727
+ "score": 0.41
19728
  }
19729
  ]
19730
  },
19731
  "SM": {
19732
+ "score": 0.4654018916371436,
19733
  "languages": [
19734
  {
19735
  "name": "Italian",
19736
  "bcp_47": "it",
19737
  "population": 30466,
19738
+ "score": 0.47
19739
  },
19740
  {
19741
  "name": "Esperanto",
 
19746
  ]
19747
  },
19748
  "VA": {
19749
+ "score": 0.235,
19750
  "languages": [
19751
  {
19752
  "name": "Italian",
19753
  "bcp_47": "it",
19754
  "population": 820,
19755
+ "score": 0.47
19756
  },
19757
  {
19758
  "name": "Latin",
results.json CHANGED
@@ -3,29 +3,29 @@
3
  {
4
  "task": "classification",
5
  "metric": "accuracy",
6
- "score": 0.5427083333333333,
7
- "bcp_47": 10,
8
  "model": 12
9
  },
10
  {
11
  "task": "language_modeling",
12
  "metric": "chrf",
13
- "score": 0.9024222998985517,
14
- "bcp_47": 10,
15
  "model": 12
16
  },
17
  {
18
  "task": "translation",
19
  "metric": "bleu",
20
- "score": 0.34325329881872996,
21
- "bcp_47": 10,
22
  "model": 12
23
  },
24
  {
25
  "task": "translation",
26
  "metric": "chrf",
27
- "score": 0.49764810942023735,
28
- "bcp_47": 10,
29
  "model": 12
30
  }
31
  ],
@@ -41,7 +41,7 @@
41
  "model": "amazon/nova-micro-v1",
42
  "task": "language_modeling",
43
  "metric": "chrf",
44
- "score": 0.9446198732700857,
45
  "bcp_47": 2
46
  },
47
  {
@@ -69,7 +69,7 @@
69
  "model": "google/gemini-2.0-flash-001",
70
  "task": "language_modeling",
71
  "metric": "chrf",
72
- "score": 0.9625160007216136,
73
  "bcp_47": 2
74
  },
75
  {
@@ -97,7 +97,7 @@
97
  "model": "google/gemini-2.0-flash-lite-001",
98
  "task": "language_modeling",
99
  "metric": "chrf",
100
- "score": 0.9710194350890375,
101
  "bcp_47": 2
102
  },
103
  {
@@ -125,7 +125,7 @@
125
  "model": "google/gemma-3-27b-it",
126
  "task": "language_modeling",
127
  "metric": "chrf",
128
- "score": 0.9567943176484227,
129
  "bcp_47": 2
130
  },
131
  {
@@ -153,7 +153,7 @@
153
  "model": "meta-llama/llama-3-70b-instruct",
154
  "task": "language_modeling",
155
  "metric": "chrf",
156
- "score": 0.9452435586756014,
157
  "bcp_47": 2
158
  },
159
  {
@@ -181,14 +181,14 @@
181
  "model": "meta-llama/llama-3.1-70b-instruct",
182
  "task": "language_modeling",
183
  "metric": "chrf",
184
- "score": 0.9203465184571391,
185
  "bcp_47": 2
186
  },
187
  {
188
  "model": "meta-llama/llama-3.1-70b-instruct",
189
  "task": "translation",
190
  "metric": "bleu",
191
- "score": 0.43182300663190504,
192
  "bcp_47": 2
193
  },
194
  {
@@ -202,29 +202,29 @@
202
  "model": "meta-llama/llama-3.3-70b-instruct",
203
  "task": "classification",
204
  "metric": "accuracy",
205
- "score": 0.5,
206
- "bcp_47": 10
207
  },
208
  {
209
  "model": "meta-llama/llama-3.3-70b-instruct",
210
  "task": "language_modeling",
211
  "metric": "chrf",
212
- "score": 0.9402702238563417,
213
- "bcp_47": 10
214
  },
215
  {
216
  "model": "meta-llama/llama-3.3-70b-instruct",
217
  "task": "translation",
218
  "metric": "bleu",
219
- "score": 0.3116623954547766,
220
- "bcp_47": 10
221
  },
222
  {
223
  "model": "meta-llama/llama-3.3-70b-instruct",
224
  "task": "translation",
225
  "metric": "chrf",
226
- "score": 0.4836914110309717,
227
- "bcp_47": 10
228
  },
229
  {
230
  "model": "microsoft/phi-4-multimodal-instruct",
@@ -237,7 +237,7 @@
237
  "model": "microsoft/phi-4-multimodal-instruct",
238
  "task": "language_modeling",
239
  "metric": "chrf",
240
- "score": 0.8700000415175042,
241
  "bcp_47": 2
242
  },
243
  {
@@ -265,7 +265,7 @@
265
  "model": "mistralai/mistral-nemo",
266
  "task": "language_modeling",
267
  "metric": "chrf",
268
- "score": 0.8815544644693022,
269
  "bcp_47": 2
270
  },
271
  {
@@ -293,7 +293,7 @@
293
  "model": "mistralai/mistral-small-24b-instruct-2501",
294
  "task": "language_modeling",
295
  "metric": "chrf",
296
- "score": 0.8557257213273853,
297
  "bcp_47": 2
298
  },
299
  {
@@ -321,7 +321,7 @@
321
  "model": "openai/gpt-4o-mini",
322
  "task": "language_modeling",
323
  "metric": "chrf",
324
- "score": 0.9482707322595748,
325
  "bcp_47": 2
326
  },
327
  {
@@ -349,7 +349,7 @@
349
  "model": "qwen/qwq-32b",
350
  "task": "language_modeling",
351
  "metric": "chrf",
352
- "score": 0.4813150156594517,
353
  "bcp_47": 2
354
  },
355
  {
@@ -701,7 +701,7 @@
701
  "in_benchmark": true,
702
  "task": "language_modeling",
703
  "metric": "chrf",
704
- "score": 0.9307208363594199,
705
  "model": 1.0
706
  },
707
  {
@@ -827,10 +827,58 @@
827
  "commonvoice_hours": null,
828
  "commonvoice_locale": null,
829
  "in_benchmark": true,
830
- "task": null,
831
- "metric": null,
832
- "score": null,
833
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
834
  },
835
  {
836
  "bcp_47": "as",
@@ -1613,7 +1661,7 @@
1613
  "in_benchmark": true,
1614
  "task": "language_modeling",
1615
  "metric": "chrf",
1616
- "score": 0.8990036074617607,
1617
  "model": 1.0
1618
  },
1619
  {
@@ -1992,7 +2040,7 @@
1992
  "family": "Indo-European",
1993
  "flores_path": "cat_Latn",
1994
  "fleurs_tag": "ca_es",
1995
- "commonvoice_hours": 2844.0,
1996
  "commonvoice_locale": "ca",
1997
  "in_benchmark": true,
1998
  "task": null,
@@ -2587,10 +2635,58 @@
2587
  "commonvoice_hours": 1360.0,
2588
  "commonvoice_locale": "de",
2589
  "in_benchmark": true,
2590
- "task": null,
2591
- "metric": null,
2592
- "score": null,
2593
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2594
  },
2595
  {
2596
  "bcp_47": "den",
@@ -2925,7 +3021,7 @@
2925
  "in_benchmark": true,
2926
  "task": "language_modeling",
2927
  "metric": "chrf",
2928
- "score": 0.9222343234934963,
2929
  "model": 12.0
2930
  },
2931
  {
@@ -2941,7 +3037,7 @@
2941
  "in_benchmark": true,
2942
  "task": "translation",
2943
  "metric": "bleu",
2944
- "score": 0.37035746903842287,
2945
  "model": 12.0
2946
  },
2947
  {
@@ -3005,7 +3101,7 @@
3005
  "in_benchmark": true,
3006
  "task": "language_modeling",
3007
  "metric": "chrf",
3008
- "score": 0.9602736376353148,
3009
  "model": 1.0
3010
  },
3011
  {
@@ -3080,7 +3176,7 @@
3080
  "family": null,
3081
  "flores_path": "eus_Latn",
3082
  "fleurs_tag": null,
3083
- "commonvoice_hours": 335.0,
3084
  "commonvoice_locale": "eu",
3085
  "in_benchmark": true,
3086
  "task": null,
@@ -3131,10 +3227,58 @@
3131
  "commonvoice_hours": 370.0,
3132
  "commonvoice_locale": "fa",
3133
  "in_benchmark": true,
3134
- "task": null,
3135
- "metric": null,
3136
- "score": null,
3137
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3138
  },
3139
  {
3140
  "bcp_47": "fan",
@@ -3243,10 +3387,58 @@
3243
  "commonvoice_hours": 0.0,
3244
  "commonvoice_locale": "tl",
3245
  "in_benchmark": true,
3246
- "task": null,
3247
- "metric": null,
3248
- "score": null,
3249
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3250
  },
3251
  {
3252
  "bcp_47": "fit",
@@ -3341,7 +3533,7 @@
3341
  "in_benchmark": true,
3342
  "task": "language_modeling",
3343
  "metric": "chrf",
3344
- "score": 0.9756346055321089,
3345
  "model": 1.0
3346
  },
3347
  {
@@ -3544,7 +3736,7 @@
3544
  "family": "Indo-European",
3545
  "flores_path": "gle_Latn",
3546
  "fleurs_tag": "ga_ie",
3547
- "commonvoice_hours": 5.9,
3548
  "commonvoice_locale": "ga-IE",
3549
  "in_benchmark": true,
3550
  "task": null,
@@ -3899,36 +4091,84 @@
3899
  "commonvoice_hours": 0.0,
3900
  "commonvoice_locale": "gu-IN",
3901
  "in_benchmark": true,
3902
- "task": null,
3903
- "metric": null,
3904
- "score": null,
3905
- "model": null
3906
  },
3907
  {
3908
- "bcp_47": "gub",
3909
- "speakers": 17784,
3910
- "language_name": "Guajajára",
3911
- "autonym": "Guajajára",
3912
- "family": "Tupian",
3913
- "flores_path": null,
3914
- "fleurs_tag": null,
3915
- "commonvoice_hours": null,
3916
- "commonvoice_locale": null,
3917
- "in_benchmark": false,
3918
- "task": null,
3919
- "metric": null,
3920
- "score": null,
3921
- "model": null
3922
  },
3923
  {
3924
- "bcp_47": "guc",
3925
- "speakers": 132529,
3926
- "language_name": "Wayuu",
3927
- "autonym": "Wayuu",
3928
- "family": "Arawakan",
3929
- "flores_path": null,
3930
- "fleurs_tag": null,
3931
- "commonvoice_hours": 0.0,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3932
  "commonvoice_locale": "guc",
3933
  "in_benchmark": false,
3934
  "task": null,
@@ -4125,7 +4365,7 @@
4125
  "in_benchmark": true,
4126
  "task": "language_modeling",
4127
  "metric": "chrf",
4128
- "score": 0.9489245079595486,
4129
  "model": 1.0
4130
  },
4131
  {
@@ -4507,10 +4747,58 @@
4507
  "commonvoice_hours": 33.0,
4508
  "commonvoice_locale": "id",
4509
  "in_benchmark": true,
4510
- "task": null,
4511
- "metric": null,
4512
- "score": null,
4513
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4514
  },
4515
  {
4516
  "bcp_47": "ie",
@@ -4667,10 +4955,58 @@
4667
  "commonvoice_hours": 362.0,
4668
  "commonvoice_locale": "it",
4669
  "in_benchmark": true,
4670
- "task": null,
4671
- "metric": null,
4672
- "score": null,
4673
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4674
  },
4675
  {
4676
  "bcp_47": "iu",
@@ -4715,10 +5051,58 @@
4715
  "commonvoice_hours": 222.0,
4716
  "commonvoice_locale": "ja",
4717
  "in_benchmark": true,
4718
- "task": null,
4719
- "metric": null,
4720
- "score": null,
4721
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4722
  },
4723
  {
4724
  "bcp_47": "jam",
@@ -4827,39 +5211,87 @@
4827
  "commonvoice_hours": 0.0,
4828
  "commonvoice_locale": "jv",
4829
  "in_benchmark": true,
4830
- "task": null,
4831
- "metric": null,
4832
- "score": null,
4833
- "model": null
4834
  },
4835
  {
4836
- "bcp_47": "ka",
4837
- "speakers": 3543646,
4838
- "language_name": "Georgian",
4839
- "autonym": "ქართული",
4840
- "family": "Kartvelian",
4841
- "flores_path": "kat_Geor",
4842
- "fleurs_tag": "ka_ge",
4843
- "commonvoice_hours": 158.0,
4844
- "commonvoice_locale": "ka",
4845
  "in_benchmark": true,
4846
- "task": null,
4847
- "metric": null,
4848
- "score": null,
4849
- "model": null
4850
  },
4851
  {
4852
- "bcp_47": "kaa",
4853
- "speakers": 489046,
4854
- "language_name": "Kara-Kalpak",
4855
- "autonym": "Kara-Kalpak",
4856
- "family": "Turkic",
4857
- "flores_path": null,
4858
- "fleurs_tag": null,
4859
- "commonvoice_hours": 0.0,
4860
- "commonvoice_locale": "kaa",
4861
- "in_benchmark": false,
4862
- "task": null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4863
  "metric": null,
4864
  "score": null,
4865
  "model": null
@@ -4952,7 +5384,7 @@
4952
  "family": "Abkhaz-Adyge",
4953
  "flores_path": null,
4954
  "fleurs_tag": null,
4955
- "commonvoice_hours": 18.0,
4956
  "commonvoice_locale": "kbd",
4957
  "in_benchmark": false,
4958
  "task": null,
@@ -5451,10 +5883,58 @@
5451
  "commonvoice_hours": 1.7,
5452
  "commonvoice_locale": "ko",
5453
  "in_benchmark": true,
5454
- "task": null,
5455
- "metric": null,
5456
- "score": null,
5457
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5458
  },
5459
  {
5460
  "bcp_47": "koi",
@@ -5752,7 +6232,7 @@
5752
  "family": "Indo-European",
5753
  "flores_path": null,
5754
  "fleurs_tag": null,
5755
- "commonvoice_hours": 5.3,
5756
  "commonvoice_locale": "kw",
5757
  "in_benchmark": false,
5758
  "task": null,
@@ -6872,7 +7352,7 @@
6872
  "family": "Indo-European",
6873
  "flores_path": "mkd_Cyrl",
6874
  "fleurs_tag": "mk_mk",
6875
- "commonvoice_hours": 18.0,
6876
  "commonvoice_locale": "mk",
6877
  "in_benchmark": true,
6878
  "task": null,
@@ -7019,10 +7499,58 @@
7019
  "commonvoice_hours": 20.0,
7020
  "commonvoice_locale": "mr",
7021
  "in_benchmark": true,
7022
- "task": null,
7023
- "metric": null,
7024
- "score": null,
7025
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7026
  },
7027
  {
7028
  "bcp_47": "mrd",
@@ -7976,7 +8504,7 @@
7976
  "family": "Indo-European",
7977
  "flores_path": null,
7978
  "fleurs_tag": null,
7979
- "commonvoice_hours": 0.7,
7980
  "commonvoice_locale": "os",
7981
  "in_benchmark": false,
7982
  "task": null,
@@ -8029,7 +8557,7 @@
8029
  "in_benchmark": true,
8030
  "task": "language_modeling",
8031
  "metric": "chrf",
8032
- "score": 0.8692673671947869,
8033
  "model": 1.0
8034
  },
8035
  {
@@ -8397,7 +8925,7 @@
8397
  "in_benchmark": true,
8398
  "task": "language_modeling",
8399
  "metric": "chrf",
8400
- "score": 0.9723487188655754,
8401
  "model": 1.0
8402
  },
8403
  {
@@ -8824,13 +9352,61 @@
8824
  "family": "Indo-European",
8825
  "flores_path": "rus_Cyrl",
8826
  "fleurs_tag": "ru_ru",
8827
- "commonvoice_hours": 242.0,
8828
  "commonvoice_locale": "ru",
8829
  "in_benchmark": true,
8830
- "task": null,
8831
- "metric": null,
8832
- "score": null,
8833
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8834
  },
8835
  {
8836
  "bcp_47": "rue",
@@ -9224,7 +9800,7 @@
9224
  "family": null,
9225
  "flores_path": null,
9226
  "fleurs_tag": null,
9227
- "commonvoice_hours": 1.8,
9228
  "commonvoice_locale": "sei",
9229
  "in_benchmark": false,
9230
  "task": null,
@@ -9803,32 +10379,80 @@
9803
  "commonvoice_hours": 411.0,
9804
  "commonvoice_locale": "sw",
9805
  "in_benchmark": true,
9806
- "task": null,
9807
- "metric": null,
9808
- "score": null,
9809
- "model": null
9810
  },
9811
  {
9812
- "bcp_47": "swb",
9813
- "speakers": 170720,
9814
- "language_name": "Comorian",
9815
- "autonym": "Comorian",
9816
  "family": "Atlantic-Congo",
9817
- "flores_path": null,
9818
- "fleurs_tag": null,
9819
- "commonvoice_hours": null,
9820
- "commonvoice_locale": null,
9821
- "in_benchmark": false,
9822
- "task": null,
9823
- "metric": null,
9824
- "score": null,
9825
- "model": null
9826
  },
9827
  {
9828
- "bcp_47": "swg",
9829
- "speakers": 801597,
9830
- "language_name": "Swabian",
9831
- "autonym": "Swabian",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9832
  "family": "Indo-European",
9833
  "flores_path": null,
9834
  "fleurs_tag": null,
@@ -9931,10 +10555,58 @@
9931
  "commonvoice_hours": 234.0,
9932
  "commonvoice_locale": "ta",
9933
  "in_benchmark": true,
9934
- "task": null,
9935
- "metric": null,
9936
- "score": null,
9937
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9938
  },
9939
  {
9940
  "bcp_47": "taj",
@@ -10043,10 +10715,58 @@
10043
  "commonvoice_hours": 0.3,
10044
  "commonvoice_locale": "te",
10045
  "in_benchmark": true,
10046
- "task": null,
10047
- "metric": null,
10048
- "score": null,
10049
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10050
  },
10051
  {
10052
  "bcp_47": "tem",
@@ -10411,10 +11131,58 @@
10411
  "commonvoice_hours": 128.0,
10412
  "commonvoice_locale": "tr",
10413
  "in_benchmark": true,
10414
- "task": null,
10415
- "metric": null,
10416
- "score": null,
10417
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10418
  },
10419
  {
10420
  "bcp_47": "tru",
@@ -10829,7 +11597,7 @@
10829
  "in_benchmark": true,
10830
  "task": "language_modeling",
10831
  "metric": "chrf",
10832
- "score": 0.9345902038028003,
10833
  "model": 1.0
10834
  },
10835
  {
@@ -10845,7 +11613,7 @@
10845
  "in_benchmark": true,
10846
  "task": "translation",
10847
  "metric": "bleu",
10848
- "score": 0.2433585957791825,
10849
  "model": 1.0
10850
  },
10851
  {
@@ -10955,42 +11723,90 @@
10955
  "commonvoice_hours": 6.0,
10956
  "commonvoice_locale": "vi",
10957
  "in_benchmark": true,
10958
- "task": null,
10959
- "metric": null,
10960
- "score": null,
10961
- "model": null
10962
  },
10963
  {
10964
- "bcp_47": "vic",
10965
- "speakers": 3113,
10966
- "language_name": "Virgin Islands Creole English",
10967
- "autonym": "Virgin Islands Creole English",
10968
- "family": "Indo-European",
10969
- "flores_path": null,
10970
- "fleurs_tag": null,
10971
- "commonvoice_hours": null,
10972
- "commonvoice_locale": null,
10973
- "in_benchmark": false,
10974
- "task": null,
10975
- "metric": null,
10976
- "score": null,
10977
- "model": null
10978
  },
10979
  {
10980
- "bcp_47": "vls",
10981
- "speakers": 1172070,
10982
- "language_name": "West Flemish",
10983
- "autonym": "West Flemish",
10984
- "family": "Indo-European",
10985
- "flores_path": null,
10986
- "fleurs_tag": null,
10987
- "commonvoice_hours": null,
10988
- "commonvoice_locale": null,
10989
- "in_benchmark": false,
10990
- "task": null,
10991
- "metric": null,
10992
- "score": null,
10993
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10994
  },
10995
  {
10996
  "bcp_47": "vmf",
@@ -11499,10 +12315,58 @@
11499
  "commonvoice_hours": 203.0,
11500
  "commonvoice_locale": "yue",
11501
  "in_benchmark": true,
11502
- "task": null,
11503
- "metric": null,
11504
- "score": null,
11505
- "model": null
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11506
  },
11507
  {
11508
  "bcp_47": "za",
@@ -11613,7 +12477,7 @@
11613
  "in_benchmark": true,
11614
  "task": "language_modeling",
11615
  "metric": "chrf",
11616
- "score": 0.8599948525016986,
11617
  "model": 12.0
11618
  },
11619
  {
@@ -11711,7 +12575,7 @@
11711
  "bcp_47": "en",
11712
  "task": "language_modeling",
11713
  "metric": "chrf",
11714
- "score": 0.9725001956658679,
11715
  "sentence_nr": 14.5
11716
  },
11717
  {
@@ -11743,7 +12607,7 @@
11743
  "bcp_47": "zh",
11744
  "task": "language_modeling",
11745
  "metric": "chrf",
11746
- "score": 0.9167395508743035,
11747
  "sentence_nr": 14.5
11748
  },
11749
  {
@@ -11775,7 +12639,7 @@
11775
  "bcp_47": "en",
11776
  "task": "language_modeling",
11777
  "metric": "chrf",
11778
- "score": 0.9775327885540744,
11779
  "sentence_nr": 14.5
11780
  },
11781
  {
@@ -11807,7 +12671,7 @@
11807
  "bcp_47": "zh",
11808
  "task": "language_modeling",
11809
  "metric": "chrf",
11810
- "score": 0.9474992128891527,
11811
  "sentence_nr": 14.5
11812
  },
11813
  {
@@ -11839,7 +12703,7 @@
11839
  "bcp_47": "en",
11840
  "task": "language_modeling",
11841
  "metric": "chrf",
11842
- "score": 0.990925430282282,
11843
  "sentence_nr": 14.5
11844
  },
11845
  {
@@ -11871,7 +12735,7 @@
11871
  "bcp_47": "zh",
11872
  "task": "language_modeling",
11873
  "metric": "chrf",
11874
- "score": 0.9511134398957932,
11875
  "sentence_nr": 14.5
11876
  },
11877
  {
@@ -11903,7 +12767,7 @@
11903
  "bcp_47": "en",
11904
  "task": "language_modeling",
11905
  "metric": "chrf",
11906
- "score": 0.9904802851977837,
11907
  "sentence_nr": 14.5
11908
  },
11909
  {
@@ -11935,7 +12799,7 @@
11935
  "bcp_47": "zh",
11936
  "task": "language_modeling",
11937
  "metric": "chrf",
11938
- "score": 0.9231083500990617,
11939
  "sentence_nr": 14.5
11940
  },
11941
  {
@@ -11967,7 +12831,7 @@
11967
  "bcp_47": "en",
11968
  "task": "language_modeling",
11969
  "metric": "chrf",
11970
- "score": 0.9674315682816375,
11971
  "sentence_nr": 14.5
11972
  },
11973
  {
@@ -11999,7 +12863,7 @@
11999
  "bcp_47": "zh",
12000
  "task": "language_modeling",
12001
  "metric": "chrf",
12002
- "score": 0.9230555490695652,
12003
  "sentence_nr": 14.5
12004
  },
12005
  {
@@ -12031,7 +12895,7 @@
12031
  "bcp_47": "en",
12032
  "task": "language_modeling",
12033
  "metric": "chrf",
12034
- "score": 0.9701295103188484,
12035
  "sentence_nr": 14.5
12036
  },
12037
  {
@@ -12039,7 +12903,7 @@
12039
  "bcp_47": "en",
12040
  "task": "translation",
12041
  "metric": "bleu",
12042
- "score": 0.44443705644214526,
12043
  "sentence_nr": 14.5
12044
  },
12045
  {
@@ -12063,7 +12927,7 @@
12063
  "bcp_47": "zh",
12064
  "task": "language_modeling",
12065
  "metric": "chrf",
12066
- "score": 0.8705635265954298,
12067
  "sentence_nr": 14.5
12068
  },
12069
  {
@@ -12095,7 +12959,7 @@
12095
  "bcp_47": "ar",
12096
  "task": "language_modeling",
12097
  "metric": "chrf",
12098
- "score": 0.9307208363594199,
12099
  "sentence_nr": 14.5
12100
  },
12101
  {
@@ -12114,6 +12978,38 @@
12114
  "score": 0.4684314458952127,
12115
  "sentence_nr": 14.5
12116
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12117
  {
12118
  "model": "meta-llama/llama-3.3-70b-instruct",
12119
  "bcp_47": "bn",
@@ -12127,7 +13023,7 @@
12127
  "bcp_47": "bn",
12128
  "task": "language_modeling",
12129
  "metric": "chrf",
12130
- "score": 0.8990036074617607,
12131
  "sentence_nr": 14.5
12132
  },
12133
  {
@@ -12146,6 +13042,38 @@
12146
  "score": 0.4076175886917154,
12147
  "sentence_nr": 14.5
12148
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12149
  {
12150
  "model": "meta-llama/llama-3.3-70b-instruct",
12151
  "bcp_47": "en",
@@ -12159,7 +13087,7 @@
12159
  "bcp_47": "en",
12160
  "task": "language_modeling",
12161
  "metric": "chrf",
12162
- "score": 0.9708732257334283,
12163
  "sentence_nr": 14.5
12164
  },
12165
  {
@@ -12191,7 +13119,7 @@
12191
  "bcp_47": "es",
12192
  "task": "language_modeling",
12193
  "metric": "chrf",
12194
- "score": 0.9602736376353148,
12195
  "sentence_nr": 14.5
12196
  },
12197
  {
@@ -12212,162 +13140,674 @@
12212
  },
12213
  {
12214
  "model": "meta-llama/llama-3.3-70b-instruct",
12215
- "bcp_47": "fr",
12216
  "task": "classification",
12217
  "metric": "accuracy",
12218
- "score": 0.5333333333333333,
12219
  "sentence_nr": 14.5
12220
  },
12221
  {
12222
  "model": "meta-llama/llama-3.3-70b-instruct",
12223
- "bcp_47": "fr",
12224
  "task": "language_modeling",
12225
  "metric": "chrf",
12226
- "score": 0.9756346055321089,
12227
  "sentence_nr": 14.5
12228
  },
12229
  {
12230
  "model": "meta-llama/llama-3.3-70b-instruct",
12231
- "bcp_47": "fr",
12232
  "task": "translation",
12233
  "metric": "bleu",
12234
- "score": 0.3193235920661593,
12235
  "sentence_nr": 14.5
12236
  },
12237
  {
12238
  "model": "meta-llama/llama-3.3-70b-instruct",
12239
- "bcp_47": "fr",
12240
  "task": "translation",
12241
  "metric": "chrf",
12242
- "score": 0.4875691290722964,
12243
  "sentence_nr": 14.5
12244
  },
12245
  {
12246
  "model": "meta-llama/llama-3.3-70b-instruct",
12247
- "bcp_47": "hi",
12248
  "task": "classification",
12249
  "metric": "accuracy",
12250
- "score": 0.5333333333333333,
12251
  "sentence_nr": 14.5
12252
  },
12253
  {
12254
  "model": "meta-llama/llama-3.3-70b-instruct",
12255
- "bcp_47": "hi",
12256
  "task": "language_modeling",
12257
  "metric": "chrf",
12258
- "score": 0.9489245079595486,
12259
  "sentence_nr": 14.5
12260
  },
12261
  {
12262
  "model": "meta-llama/llama-3.3-70b-instruct",
12263
- "bcp_47": "hi",
12264
  "task": "translation",
12265
  "metric": "bleu",
12266
- "score": 0.31956422674397006,
12267
  "sentence_nr": 14.5
12268
  },
12269
  {
12270
  "model": "meta-llama/llama-3.3-70b-instruct",
12271
- "bcp_47": "hi",
12272
  "task": "translation",
12273
  "metric": "chrf",
12274
- "score": 0.4896277852320754,
12275
  "sentence_nr": 14.5
12276
  },
12277
  {
12278
  "model": "meta-llama/llama-3.3-70b-instruct",
12279
- "bcp_47": "pa",
12280
  "task": "classification",
12281
  "metric": "accuracy",
12282
- "score": 0.4,
12283
  "sentence_nr": 14.5
12284
  },
12285
  {
12286
  "model": "meta-llama/llama-3.3-70b-instruct",
12287
- "bcp_47": "pa",
12288
  "task": "language_modeling",
12289
  "metric": "chrf",
12290
- "score": 0.8692673671947869,
12291
  "sentence_nr": 14.5
12292
  },
12293
  {
12294
  "model": "meta-llama/llama-3.3-70b-instruct",
12295
- "bcp_47": "pa",
12296
  "task": "translation",
12297
  "metric": "bleu",
12298
- "score": 0.3368333727390049,
12299
  "sentence_nr": 14.5
12300
  },
12301
  {
12302
  "model": "meta-llama/llama-3.3-70b-instruct",
12303
- "bcp_47": "pa",
12304
  "task": "translation",
12305
  "metric": "chrf",
12306
- "score": 0.4873541452250132,
12307
  "sentence_nr": 14.5
12308
  },
12309
  {
12310
  "model": "meta-llama/llama-3.3-70b-instruct",
12311
- "bcp_47": "pt",
12312
  "task": "classification",
12313
  "metric": "accuracy",
12314
- "score": 0.5,
12315
  "sentence_nr": 14.5
12316
  },
12317
  {
12318
  "model": "meta-llama/llama-3.3-70b-instruct",
12319
- "bcp_47": "pt",
12320
  "task": "language_modeling",
12321
  "metric": "chrf",
12322
- "score": 0.9723487188655754,
12323
  "sentence_nr": 14.5
12324
  },
12325
  {
12326
  "model": "meta-llama/llama-3.3-70b-instruct",
12327
- "bcp_47": "pt",
12328
  "task": "translation",
12329
  "metric": "bleu",
12330
- "score": 0.3110105331834714,
12331
  "sentence_nr": 14.5
12332
  },
12333
  {
12334
  "model": "meta-llama/llama-3.3-70b-instruct",
12335
- "bcp_47": "pt",
12336
  "task": "translation",
12337
  "metric": "chrf",
12338
- "score": 0.49172080600981716,
12339
  "sentence_nr": 14.5
12340
  },
12341
  {
12342
  "model": "meta-llama/llama-3.3-70b-instruct",
12343
- "bcp_47": "ur",
12344
  "task": "classification",
12345
  "metric": "accuracy",
12346
- "score": 0.5,
12347
  "sentence_nr": 14.5
12348
  },
12349
  {
12350
  "model": "meta-llama/llama-3.3-70b-instruct",
12351
- "bcp_47": "ur",
12352
  "task": "language_modeling",
12353
  "metric": "chrf",
12354
- "score": 0.9345902038028003,
12355
  "sentence_nr": 14.5
12356
  },
12357
  {
12358
  "model": "meta-llama/llama-3.3-70b-instruct",
12359
- "bcp_47": "ur",
12360
  "task": "translation",
12361
  "metric": "bleu",
12362
- "score": 0.2433585957791825,
12363
  "sentence_nr": 14.5
12364
  },
12365
  {
12366
  "model": "meta-llama/llama-3.3-70b-instruct",
12367
- "bcp_47": "ur",
12368
  "task": "translation",
12369
  "metric": "chrf",
12370
- "score": 0.42196914378741973,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12371
  "sentence_nr": 14.5
12372
  },
12373
  {
@@ -12383,7 +13823,7 @@
12383
  "bcp_47": "zh",
12384
  "task": "language_modeling",
12385
  "metric": "chrf",
12386
- "score": 0.9410655280186742,
12387
  "sentence_nr": 14.5
12388
  },
12389
  {
@@ -12415,7 +13855,7 @@
12415
  "bcp_47": "en",
12416
  "task": "language_modeling",
12417
  "metric": "chrf",
12418
- "score": 0.9268050965065061,
12419
  "sentence_nr": 14.5
12420
  },
12421
  {
@@ -12447,7 +13887,7 @@
12447
  "bcp_47": "zh",
12448
  "task": "language_modeling",
12449
  "metric": "chrf",
12450
- "score": 0.8131949865285024,
12451
  "sentence_nr": 14.5
12452
  },
12453
  {
@@ -12479,7 +13919,7 @@
12479
  "bcp_47": "en",
12480
  "task": "language_modeling",
12481
  "metric": "chrf",
12482
- "score": 0.9383955895073849,
12483
  "sentence_nr": 14.5
12484
  },
12485
  {
@@ -12511,7 +13951,7 @@
12511
  "bcp_47": "zh",
12512
  "task": "language_modeling",
12513
  "metric": "chrf",
12514
- "score": 0.8247133394312195,
12515
  "sentence_nr": 14.5
12516
  },
12517
  {
@@ -12543,7 +13983,7 @@
12543
  "bcp_47": "en",
12544
  "task": "language_modeling",
12545
  "metric": "chrf",
12546
- "score": 0.7898342718049297,
12547
  "sentence_nr": 14.5
12548
  },
12549
  {
@@ -12575,7 +14015,7 @@
12575
  "bcp_47": "zh",
12576
  "task": "language_modeling",
12577
  "metric": "chrf",
12578
- "score": 0.921617170849841,
12579
  "sentence_nr": 14.5
12580
  },
12581
  {
@@ -12607,7 +14047,7 @@
12607
  "bcp_47": "en",
12608
  "task": "language_modeling",
12609
  "metric": "chrf",
12610
- "score": 0.9671581799852296,
12611
  "sentence_nr": 14.5
12612
  },
12613
  {
@@ -12639,7 +14079,7 @@
12639
  "bcp_47": "zh",
12640
  "task": "language_modeling",
12641
  "metric": "chrf",
12642
- "score": 0.92938328453392,
12643
  "sentence_nr": 14.5
12644
  },
12645
  {
@@ -12671,7 +14111,7 @@
12671
  "bcp_47": "en",
12672
  "task": "language_modeling",
12673
  "metric": "chrf",
12674
- "score": 0.6047457400839834,
12675
  "sentence_nr": 14.5
12676
  },
12677
  {
@@ -12703,7 +14143,7 @@
12703
  "bcp_47": "zh",
12704
  "task": "language_modeling",
12705
  "metric": "chrf",
12706
- "score": 0.35788429123492,
12707
  "sentence_nr": 14.5
12708
  },
12709
  {
 
3
  {
4
  "task": "classification",
5
  "metric": "accuracy",
6
+ "score": 0.5353333333333333,
7
+ "bcp_47": 28,
8
  "model": 12
9
  },
10
  {
11
  "task": "language_modeling",
12
  "metric": "chrf",
13
+ "score": 0.9172787041570468,
14
+ "bcp_47": 28,
15
  "model": 12
16
  },
17
  {
18
  "task": "translation",
19
  "metric": "bleu",
20
+ "score": 0.31440758611811165,
21
+ "bcp_47": 28,
22
  "model": 12
23
  },
24
  {
25
  "task": "translation",
26
  "metric": "chrf",
27
+ "score": 0.4776446463431595,
28
+ "bcp_47": 28,
29
  "model": 12
30
  }
31
  ],
 
41
  "model": "amazon/nova-micro-v1",
42
  "task": "language_modeling",
43
  "metric": "chrf",
44
+ "score": 0.9358428899682786,
45
  "bcp_47": 2
46
  },
47
  {
 
69
  "model": "google/gemini-2.0-flash-001",
70
  "task": "language_modeling",
71
  "metric": "chrf",
72
+ "score": 0.9585325034195884,
73
  "bcp_47": 2
74
  },
75
  {
 
97
  "model": "google/gemini-2.0-flash-lite-001",
98
  "task": "language_modeling",
99
  "metric": "chrf",
100
+ "score": 0.9574729426945592,
101
  "bcp_47": 2
102
  },
103
  {
 
125
  "model": "google/gemma-3-27b-it",
126
  "task": "language_modeling",
127
  "metric": "chrf",
128
+ "score": 0.9402106879094536,
129
  "bcp_47": 2
130
  },
131
  {
 
153
  "model": "meta-llama/llama-3-70b-instruct",
154
  "task": "language_modeling",
155
  "metric": "chrf",
156
+ "score": 0.9555990324827045,
157
  "bcp_47": 2
158
  },
159
  {
 
181
  "model": "meta-llama/llama-3.1-70b-instruct",
182
  "task": "language_modeling",
183
  "metric": "chrf",
184
+ "score": 0.9458265879125298,
185
  "bcp_47": 2
186
  },
187
  {
188
  "model": "meta-llama/llama-3.1-70b-instruct",
189
  "task": "translation",
190
  "metric": "bleu",
191
+ "score": 0.4318584195195329,
192
  "bcp_47": 2
193
  },
194
  {
 
202
  "model": "meta-llama/llama-3.3-70b-instruct",
203
  "task": "classification",
204
  "metric": "accuracy",
205
+ "score": 0.5142857142857143,
206
+ "bcp_47": 28
207
  },
208
  {
209
  "model": "meta-llama/llama-3.3-70b-instruct",
210
  "task": "language_modeling",
211
  "metric": "chrf",
212
+ "score": 0.9422717613037961,
213
+ "bcp_47": 28
214
  },
215
  {
216
  "model": "meta-llama/llama-3.3-70b-instruct",
217
  "task": "translation",
218
  "metric": "bleu",
219
+ "score": 0.28045810258852616,
220
+ "bcp_47": 28
221
  },
222
  {
223
  "model": "meta-llama/llama-3.3-70b-instruct",
224
  "task": "translation",
225
  "metric": "chrf",
226
+ "score": 0.45694310450071773,
227
+ "bcp_47": 28
228
  },
229
  {
230
  "model": "microsoft/phi-4-multimodal-instruct",
 
237
  "model": "microsoft/phi-4-multimodal-instruct",
238
  "task": "language_modeling",
239
  "metric": "chrf",
240
+ "score": 0.8811352896333067,
241
  "bcp_47": 2
242
  },
243
  {
 
265
  "model": "mistralai/mistral-nemo",
266
  "task": "language_modeling",
267
  "metric": "chrf",
268
+ "score": 0.8612477844203897,
269
  "bcp_47": 2
270
  },
271
  {
 
293
  "model": "mistralai/mistral-small-24b-instruct-2501",
294
  "task": "language_modeling",
295
  "metric": "chrf",
296
+ "score": 0.8782400543225595,
297
  "bcp_47": 2
298
  },
299
  {
 
321
  "model": "openai/gpt-4o-mini",
322
  "task": "language_modeling",
323
  "metric": "chrf",
324
+ "score": 0.9560369064537906,
325
  "bcp_47": 2
326
  },
327
  {
 
349
  "model": "qwen/qwq-32b",
350
  "task": "language_modeling",
351
  "metric": "chrf",
352
+ "score": 0.47001826645586636,
353
  "bcp_47": 2
354
  },
355
  {
 
701
  "in_benchmark": true,
702
  "task": "language_modeling",
703
  "metric": "chrf",
704
+ "score": 0.9392314289764625,
705
  "model": 1.0
706
  },
707
  {
 
827
  "commonvoice_hours": null,
828
  "commonvoice_locale": null,
829
  "in_benchmark": true,
830
+ "task": "classification",
831
+ "metric": "accuracy",
832
+ "score": 0.4,
833
+ "model": 1.0
834
+ },
835
+ {
836
+ "bcp_47": "arz",
837
+ "speakers": 66639360,
838
+ "language_name": "Egyptian Arabic",
839
+ "autonym": "Egyptian Arabic",
840
+ "family": "Afro-Asiatic",
841
+ "flores_path": "arz_Arab",
842
+ "fleurs_tag": null,
843
+ "commonvoice_hours": null,
844
+ "commonvoice_locale": null,
845
+ "in_benchmark": true,
846
+ "task": "language_modeling",
847
+ "metric": "chrf",
848
+ "score": 0.930329195667362,
849
+ "model": 1.0
850
+ },
851
+ {
852
+ "bcp_47": "arz",
853
+ "speakers": 66639360,
854
+ "language_name": "Egyptian Arabic",
855
+ "autonym": "Egyptian Arabic",
856
+ "family": "Afro-Asiatic",
857
+ "flores_path": "arz_Arab",
858
+ "fleurs_tag": null,
859
+ "commonvoice_hours": null,
860
+ "commonvoice_locale": null,
861
+ "in_benchmark": true,
862
+ "task": "translation",
863
+ "metric": "bleu",
864
+ "score": 0.19793415292805128,
865
+ "model": 1.0
866
+ },
867
+ {
868
+ "bcp_47": "arz",
869
+ "speakers": 66639360,
870
+ "language_name": "Egyptian Arabic",
871
+ "autonym": "Egyptian Arabic",
872
+ "family": "Afro-Asiatic",
873
+ "flores_path": "arz_Arab",
874
+ "fleurs_tag": null,
875
+ "commonvoice_hours": null,
876
+ "commonvoice_locale": null,
877
+ "in_benchmark": true,
878
+ "task": "translation",
879
+ "metric": "chrf",
880
+ "score": 0.3881278724939126,
881
+ "model": 1.0
882
  },
883
  {
884
  "bcp_47": "as",
 
1661
  "in_benchmark": true,
1662
  "task": "language_modeling",
1663
  "metric": "chrf",
1664
+ "score": 0.9097658392566466,
1665
  "model": 1.0
1666
  },
1667
  {
 
2040
  "family": "Indo-European",
2041
  "flores_path": "cat_Latn",
2042
  "fleurs_tag": "ca_es",
2043
+ "commonvoice_hours": 2845.0,
2044
  "commonvoice_locale": "ca",
2045
  "in_benchmark": true,
2046
  "task": null,
 
2635
  "commonvoice_hours": 1360.0,
2636
  "commonvoice_locale": "de",
2637
  "in_benchmark": true,
2638
+ "task": "classification",
2639
+ "metric": "accuracy",
2640
+ "score": 0.6666666666666666,
2641
+ "model": 1.0
2642
+ },
2643
+ {
2644
+ "bcp_47": "de",
2645
+ "speakers": 136350226,
2646
+ "language_name": "German",
2647
+ "autonym": "Deutsch",
2648
+ "family": "Indo-European",
2649
+ "flores_path": "deu_Latn",
2650
+ "fleurs_tag": "de_de",
2651
+ "commonvoice_hours": 1360.0,
2652
+ "commonvoice_locale": "de",
2653
+ "in_benchmark": true,
2654
+ "task": "language_modeling",
2655
+ "metric": "chrf",
2656
+ "score": 0.9594656177914042,
2657
+ "model": 1.0
2658
+ },
2659
+ {
2660
+ "bcp_47": "de",
2661
+ "speakers": 136350226,
2662
+ "language_name": "German",
2663
+ "autonym": "Deutsch",
2664
+ "family": "Indo-European",
2665
+ "flores_path": "deu_Latn",
2666
+ "fleurs_tag": "de_de",
2667
+ "commonvoice_hours": 1360.0,
2668
+ "commonvoice_locale": "de",
2669
+ "in_benchmark": true,
2670
+ "task": "translation",
2671
+ "metric": "bleu",
2672
+ "score": 0.3207642359472324,
2673
+ "model": 1.0
2674
+ },
2675
+ {
2676
+ "bcp_47": "de",
2677
+ "speakers": 136350226,
2678
+ "language_name": "German",
2679
+ "autonym": "Deutsch",
2680
+ "family": "Indo-European",
2681
+ "flores_path": "deu_Latn",
2682
+ "fleurs_tag": "de_de",
2683
+ "commonvoice_hours": 1360.0,
2684
+ "commonvoice_locale": "de",
2685
+ "in_benchmark": true,
2686
+ "task": "translation",
2687
+ "metric": "chrf",
2688
+ "score": 0.49973270743869647,
2689
+ "model": 1.0
2690
  },
2691
  {
2692
  "bcp_47": "den",
 
3021
  "in_benchmark": true,
3022
  "task": "language_modeling",
3023
  "metric": "chrf",
3024
+ "score": 0.9180269549823046,
3025
  "model": 12.0
3026
  },
3027
  {
 
3037
  "in_benchmark": true,
3038
  "task": "translation",
3039
  "metric": "bleu",
3040
+ "score": 0.3703633711863608,
3041
  "model": 12.0
3042
  },
3043
  {
 
3101
  "in_benchmark": true,
3102
  "task": "language_modeling",
3103
  "metric": "chrf",
3104
+ "score": 0.9569342865902168,
3105
  "model": 1.0
3106
  },
3107
  {
 
3176
  "family": null,
3177
  "flores_path": "eus_Latn",
3178
  "fleurs_tag": null,
3179
+ "commonvoice_hours": 336.0,
3180
  "commonvoice_locale": "eu",
3181
  "in_benchmark": true,
3182
  "task": null,
 
3227
  "commonvoice_hours": 370.0,
3228
  "commonvoice_locale": "fa",
3229
  "in_benchmark": true,
3230
+ "task": "classification",
3231
+ "metric": "accuracy",
3232
+ "score": 0.4,
3233
+ "model": 1.0
3234
+ },
3235
+ {
3236
+ "bcp_47": "fa",
3237
+ "speakers": 84710459,
3238
+ "language_name": "Persian",
3239
+ "autonym": "فارسی",
3240
+ "family": "Indo-European",
3241
+ "flores_path": "pes_Arab",
3242
+ "fleurs_tag": "fa_ir",
3243
+ "commonvoice_hours": 370.0,
3244
+ "commonvoice_locale": "fa",
3245
+ "in_benchmark": true,
3246
+ "task": "language_modeling",
3247
+ "metric": "chrf",
3248
+ "score": 0.9414698824984596,
3249
+ "model": 1.0
3250
+ },
3251
+ {
3252
+ "bcp_47": "fa",
3253
+ "speakers": 84710459,
3254
+ "language_name": "Persian",
3255
+ "autonym": "فارسی",
3256
+ "family": "Indo-European",
3257
+ "flores_path": "pes_Arab",
3258
+ "fleurs_tag": "fa_ir",
3259
+ "commonvoice_hours": 370.0,
3260
+ "commonvoice_locale": "fa",
3261
+ "in_benchmark": true,
3262
+ "task": "translation",
3263
+ "metric": "bleu",
3264
+ "score": 0.26232478733341374,
3265
+ "model": 1.0
3266
+ },
3267
+ {
3268
+ "bcp_47": "fa",
3269
+ "speakers": 84710459,
3270
+ "language_name": "Persian",
3271
+ "autonym": "فارسی",
3272
+ "family": "Indo-European",
3273
+ "flores_path": "pes_Arab",
3274
+ "fleurs_tag": "fa_ir",
3275
+ "commonvoice_hours": 370.0,
3276
+ "commonvoice_locale": "fa",
3277
+ "in_benchmark": true,
3278
+ "task": "translation",
3279
+ "metric": "chrf",
3280
+ "score": 0.44641220608314985,
3281
+ "model": 1.0
3282
  },
3283
  {
3284
  "bcp_47": "fan",
 
3387
  "commonvoice_hours": 0.0,
3388
  "commonvoice_locale": "tl",
3389
  "in_benchmark": true,
3390
+ "task": "classification",
3391
+ "metric": "accuracy",
3392
+ "score": 0.43333333333333335,
3393
+ "model": 1.0
3394
+ },
3395
+ {
3396
+ "bcp_47": "fil",
3397
+ "speakers": 67471096,
3398
+ "language_name": "Filipino",
3399
+ "autonym": "Filipino",
3400
+ "family": "Austronesian",
3401
+ "flores_path": "fil_Latn",
3402
+ "fleurs_tag": "fil_ph",
3403
+ "commonvoice_hours": 0.0,
3404
+ "commonvoice_locale": "tl",
3405
+ "in_benchmark": true,
3406
+ "task": "language_modeling",
3407
+ "metric": "chrf",
3408
+ "score": 0.9402707475255596,
3409
+ "model": 1.0
3410
+ },
3411
+ {
3412
+ "bcp_47": "fil",
3413
+ "speakers": 67471096,
3414
+ "language_name": "Filipino",
3415
+ "autonym": "Filipino",
3416
+ "family": "Austronesian",
3417
+ "flores_path": "fil_Latn",
3418
+ "fleurs_tag": "fil_ph",
3419
+ "commonvoice_hours": 0.0,
3420
+ "commonvoice_locale": "tl",
3421
+ "in_benchmark": true,
3422
+ "task": "translation",
3423
+ "metric": "bleu",
3424
+ "score": 0.29097818784870333,
3425
+ "model": 1.0
3426
+ },
3427
+ {
3428
+ "bcp_47": "fil",
3429
+ "speakers": 67471096,
3430
+ "language_name": "Filipino",
3431
+ "autonym": "Filipino",
3432
+ "family": "Austronesian",
3433
+ "flores_path": "fil_Latn",
3434
+ "fleurs_tag": "fil_ph",
3435
+ "commonvoice_hours": 0.0,
3436
+ "commonvoice_locale": "tl",
3437
+ "in_benchmark": true,
3438
+ "task": "translation",
3439
+ "metric": "chrf",
3440
+ "score": 0.44978114149245985,
3441
+ "model": 1.0
3442
  },
3443
  {
3444
  "bcp_47": "fit",
 
3533
  "in_benchmark": true,
3534
  "task": "language_modeling",
3535
  "metric": "chrf",
3536
+ "score": 0.9815706066541411,
3537
  "model": 1.0
3538
  },
3539
  {
 
3736
  "family": "Indo-European",
3737
  "flores_path": "gle_Latn",
3738
  "fleurs_tag": "ga_ie",
3739
+ "commonvoice_hours": 6.0,
3740
  "commonvoice_locale": "ga-IE",
3741
  "in_benchmark": true,
3742
  "task": null,
 
4091
  "commonvoice_hours": 0.0,
4092
  "commonvoice_locale": "gu-IN",
4093
  "in_benchmark": true,
4094
+ "task": "classification",
4095
+ "metric": "accuracy",
4096
+ "score": 0.43333333333333335,
4097
+ "model": 1.0
4098
  },
4099
  {
4100
+ "bcp_47": "gu",
4101
+ "speakers": 61721799,
4102
+ "language_name": "Gujarati",
4103
+ "autonym": "ગુજરાતી",
4104
+ "family": "Indo-European",
4105
+ "flores_path": "guj_Gujr",
4106
+ "fleurs_tag": "gu_in",
4107
+ "commonvoice_hours": 0.0,
4108
+ "commonvoice_locale": "gu-IN",
4109
+ "in_benchmark": true,
4110
+ "task": "language_modeling",
4111
+ "metric": "chrf",
4112
+ "score": 0.938086045460355,
4113
+ "model": 1.0
4114
  },
4115
  {
4116
+ "bcp_47": "gu",
4117
+ "speakers": 61721799,
4118
+ "language_name": "Gujarati",
4119
+ "autonym": "ગુજરાતી",
4120
+ "family": "Indo-European",
4121
+ "flores_path": "guj_Gujr",
4122
+ "fleurs_tag": "gu_in",
4123
+ "commonvoice_hours": 0.0,
4124
+ "commonvoice_locale": "gu-IN",
4125
+ "in_benchmark": true,
4126
+ "task": "translation",
4127
+ "metric": "bleu",
4128
+ "score": 0.26442484966880464,
4129
+ "model": 1.0
4130
+ },
4131
+ {
4132
+ "bcp_47": "gu",
4133
+ "speakers": 61721799,
4134
+ "language_name": "Gujarati",
4135
+ "autonym": "ગુજરાતી",
4136
+ "family": "Indo-European",
4137
+ "flores_path": "guj_Gujr",
4138
+ "fleurs_tag": "gu_in",
4139
+ "commonvoice_hours": 0.0,
4140
+ "commonvoice_locale": "gu-IN",
4141
+ "in_benchmark": true,
4142
+ "task": "translation",
4143
+ "metric": "chrf",
4144
+ "score": 0.44452182973195975,
4145
+ "model": 1.0
4146
+ },
4147
+ {
4148
+ "bcp_47": "gub",
4149
+ "speakers": 17784,
4150
+ "language_name": "Guajajára",
4151
+ "autonym": "Guajajára",
4152
+ "family": "Tupian",
4153
+ "flores_path": null,
4154
+ "fleurs_tag": null,
4155
+ "commonvoice_hours": null,
4156
+ "commonvoice_locale": null,
4157
+ "in_benchmark": false,
4158
+ "task": null,
4159
+ "metric": null,
4160
+ "score": null,
4161
+ "model": null
4162
+ },
4163
+ {
4164
+ "bcp_47": "guc",
4165
+ "speakers": 132529,
4166
+ "language_name": "Wayuu",
4167
+ "autonym": "Wayuu",
4168
+ "family": "Arawakan",
4169
+ "flores_path": null,
4170
+ "fleurs_tag": null,
4171
+ "commonvoice_hours": 0.0,
4172
  "commonvoice_locale": "guc",
4173
  "in_benchmark": false,
4174
  "task": null,
 
4365
  "in_benchmark": true,
4366
  "task": "language_modeling",
4367
  "metric": "chrf",
4368
+ "score": 0.9428185393832219,
4369
  "model": 1.0
4370
  },
4371
  {
 
4747
  "commonvoice_hours": 33.0,
4748
  "commonvoice_locale": "id",
4749
  "in_benchmark": true,
4750
+ "task": "classification",
4751
+ "metric": "accuracy",
4752
+ "score": 0.6333333333333333,
4753
+ "model": 1.0
4754
+ },
4755
+ {
4756
+ "bcp_47": "id",
4757
+ "speakers": 171207687,
4758
+ "language_name": "Indonesian",
4759
+ "autonym": "Bahasa Indonesia",
4760
+ "family": "Austronesian",
4761
+ "flores_path": "ind_Latn",
4762
+ "fleurs_tag": "id_id",
4763
+ "commonvoice_hours": 33.0,
4764
+ "commonvoice_locale": "id",
4765
+ "in_benchmark": true,
4766
+ "task": "language_modeling",
4767
+ "metric": "chrf",
4768
+ "score": 0.9598314474300775,
4769
+ "model": 1.0
4770
+ },
4771
+ {
4772
+ "bcp_47": "id",
4773
+ "speakers": 171207687,
4774
+ "language_name": "Indonesian",
4775
+ "autonym": "Bahasa Indonesia",
4776
+ "family": "Austronesian",
4777
+ "flores_path": "ind_Latn",
4778
+ "fleurs_tag": "id_id",
4779
+ "commonvoice_hours": 33.0,
4780
+ "commonvoice_locale": "id",
4781
+ "in_benchmark": true,
4782
+ "task": "translation",
4783
+ "metric": "bleu",
4784
+ "score": 0.29354203311552335,
4785
+ "model": 1.0
4786
+ },
4787
+ {
4788
+ "bcp_47": "id",
4789
+ "speakers": 171207687,
4790
+ "language_name": "Indonesian",
4791
+ "autonym": "Bahasa Indonesia",
4792
+ "family": "Austronesian",
4793
+ "flores_path": "ind_Latn",
4794
+ "fleurs_tag": "id_id",
4795
+ "commonvoice_hours": 33.0,
4796
+ "commonvoice_locale": "id",
4797
+ "in_benchmark": true,
4798
+ "task": "translation",
4799
+ "metric": "chrf",
4800
+ "score": 0.4723493656022861,
4801
+ "model": 1.0
4802
  },
4803
  {
4804
  "bcp_47": "ie",
 
4955
  "commonvoice_hours": 362.0,
4956
  "commonvoice_locale": "it",
4957
  "in_benchmark": true,
4958
+ "task": "classification",
4959
+ "metric": "accuracy",
4960
+ "score": 0.6666666666666666,
4961
+ "model": 1.0
4962
+ },
4963
+ {
4964
+ "bcp_47": "it",
4965
+ "speakers": 70247060,
4966
+ "language_name": "Italian",
4967
+ "autonym": "Italiano",
4968
+ "family": "Indo-European",
4969
+ "flores_path": "ita_Latn",
4970
+ "fleurs_tag": "it_it",
4971
+ "commonvoice_hours": 362.0,
4972
+ "commonvoice_locale": "it",
4973
+ "in_benchmark": true,
4974
+ "task": "language_modeling",
4975
+ "metric": "chrf",
4976
+ "score": 0.9439490413212892,
4977
+ "model": 1.0
4978
+ },
4979
+ {
4980
+ "bcp_47": "it",
4981
+ "speakers": 70247060,
4982
+ "language_name": "Italian",
4983
+ "autonym": "Italiano",
4984
+ "family": "Indo-European",
4985
+ "flores_path": "ita_Latn",
4986
+ "fleurs_tag": "it_it",
4987
+ "commonvoice_hours": 362.0,
4988
+ "commonvoice_locale": "it",
4989
+ "in_benchmark": true,
4990
+ "task": "translation",
4991
+ "metric": "bleu",
4992
+ "score": 0.28142583904826096,
4993
+ "model": 1.0
4994
+ },
4995
+ {
4996
+ "bcp_47": "it",
4997
+ "speakers": 70247060,
4998
+ "language_name": "Italian",
4999
+ "autonym": "Italiano",
5000
+ "family": "Indo-European",
5001
+ "flores_path": "ita_Latn",
5002
+ "fleurs_tag": "it_it",
5003
+ "commonvoice_hours": 362.0,
5004
+ "commonvoice_locale": "it",
5005
+ "in_benchmark": true,
5006
+ "task": "translation",
5007
+ "metric": "chrf",
5008
+ "score": 0.4707591889357925,
5009
+ "model": 1.0
5010
  },
5011
  {
5012
  "bcp_47": "iu",
 
5051
  "commonvoice_hours": 222.0,
5052
  "commonvoice_locale": "ja",
5053
  "in_benchmark": true,
5054
+ "task": "classification",
5055
+ "metric": "accuracy",
5056
+ "score": 0.6333333333333333,
5057
+ "model": 1.0
5058
+ },
5059
+ {
5060
+ "bcp_47": "ja",
5061
+ "speakers": 119729026,
5062
+ "language_name": "Japanese",
5063
+ "autonym": "日本語",
5064
+ "family": "Japonic",
5065
+ "flores_path": "jpn_Jpan",
5066
+ "fleurs_tag": "ja_jp",
5067
+ "commonvoice_hours": 222.0,
5068
+ "commonvoice_locale": "ja",
5069
+ "in_benchmark": true,
5070
+ "task": "language_modeling",
5071
+ "metric": "chrf",
5072
+ "score": 0.9371132855221468,
5073
+ "model": 1.0
5074
+ },
5075
+ {
5076
+ "bcp_47": "ja",
5077
+ "speakers": 119729026,
5078
+ "language_name": "Japanese",
5079
+ "autonym": "日本語",
5080
+ "family": "Japonic",
5081
+ "flores_path": "jpn_Jpan",
5082
+ "fleurs_tag": "ja_jp",
5083
+ "commonvoice_hours": 222.0,
5084
+ "commonvoice_locale": "ja",
5085
+ "in_benchmark": true,
5086
+ "task": "translation",
5087
+ "metric": "bleu",
5088
+ "score": 0.2723410893967824,
5089
+ "model": 1.0
5090
+ },
5091
+ {
5092
+ "bcp_47": "ja",
5093
+ "speakers": 119729026,
5094
+ "language_name": "Japanese",
5095
+ "autonym": "日本語",
5096
+ "family": "Japonic",
5097
+ "flores_path": "jpn_Jpan",
5098
+ "fleurs_tag": "ja_jp",
5099
+ "commonvoice_hours": 222.0,
5100
+ "commonvoice_locale": "ja",
5101
+ "in_benchmark": true,
5102
+ "task": "translation",
5103
+ "metric": "chrf",
5104
+ "score": 0.43929453749366865,
5105
+ "model": 1.0
5106
  },
5107
  {
5108
  "bcp_47": "jam",
 
5211
  "commonvoice_hours": 0.0,
5212
  "commonvoice_locale": "jv",
5213
  "in_benchmark": true,
5214
+ "task": "classification",
5215
+ "metric": "accuracy",
5216
+ "score": 0.4666666666666667,
5217
+ "model": 1.0
5218
  },
5219
  {
5220
+ "bcp_47": "jv",
5221
+ "speakers": 91180665,
5222
+ "language_name": "Javanese",
5223
+ "autonym": "Jawa",
5224
+ "family": "Austronesian",
5225
+ "flores_path": "jav_Latn",
5226
+ "fleurs_tag": "jv_id",
5227
+ "commonvoice_hours": 0.0,
5228
+ "commonvoice_locale": "jv",
5229
  "in_benchmark": true,
5230
+ "task": "language_modeling",
5231
+ "metric": "chrf",
5232
+ "score": 0.9298143194922116,
5233
+ "model": 1.0
5234
  },
5235
  {
5236
+ "bcp_47": "jv",
5237
+ "speakers": 91180665,
5238
+ "language_name": "Javanese",
5239
+ "autonym": "Jawa",
5240
+ "family": "Austronesian",
5241
+ "flores_path": "jav_Latn",
5242
+ "fleurs_tag": "jv_id",
5243
+ "commonvoice_hours": 0.0,
5244
+ "commonvoice_locale": "jv",
5245
+ "in_benchmark": true,
5246
+ "task": "translation",
5247
+ "metric": "bleu",
5248
+ "score": 0.23729186537968905,
5249
+ "model": 1.0
5250
+ },
5251
+ {
5252
+ "bcp_47": "jv",
5253
+ "speakers": 91180665,
5254
+ "language_name": "Javanese",
5255
+ "autonym": "Jawa",
5256
+ "family": "Austronesian",
5257
+ "flores_path": "jav_Latn",
5258
+ "fleurs_tag": "jv_id",
5259
+ "commonvoice_hours": 0.0,
5260
+ "commonvoice_locale": "jv",
5261
+ "in_benchmark": true,
5262
+ "task": "translation",
5263
+ "metric": "chrf",
5264
+ "score": 0.4198940727847352,
5265
+ "model": 1.0
5266
+ },
5267
+ {
5268
+ "bcp_47": "ka",
5269
+ "speakers": 3543646,
5270
+ "language_name": "Georgian",
5271
+ "autonym": "ქართული",
5272
+ "family": "Kartvelian",
5273
+ "flores_path": "kat_Geor",
5274
+ "fleurs_tag": "ka_ge",
5275
+ "commonvoice_hours": 158.0,
5276
+ "commonvoice_locale": "ka",
5277
+ "in_benchmark": true,
5278
+ "task": null,
5279
+ "metric": null,
5280
+ "score": null,
5281
+ "model": null
5282
+ },
5283
+ {
5284
+ "bcp_47": "kaa",
5285
+ "speakers": 489046,
5286
+ "language_name": "Kara-Kalpak",
5287
+ "autonym": "Kara-Kalpak",
5288
+ "family": "Turkic",
5289
+ "flores_path": null,
5290
+ "fleurs_tag": null,
5291
+ "commonvoice_hours": 0.0,
5292
+ "commonvoice_locale": "kaa",
5293
+ "in_benchmark": false,
5294
+ "task": null,
5295
  "metric": null,
5296
  "score": null,
5297
  "model": null
 
5384
  "family": "Abkhaz-Adyge",
5385
  "flores_path": null,
5386
  "fleurs_tag": null,
5387
+ "commonvoice_hours": 19.0,
5388
  "commonvoice_locale": "kbd",
5389
  "in_benchmark": false,
5390
  "task": null,
 
5883
  "commonvoice_hours": 1.7,
5884
  "commonvoice_locale": "ko",
5885
  "in_benchmark": true,
5886
+ "task": "classification",
5887
+ "metric": "accuracy",
5888
+ "score": 0.5333333333333333,
5889
+ "model": 1.0
5890
+ },
5891
+ {
5892
+ "bcp_47": "ko",
5893
+ "speakers": 78357046,
5894
+ "language_name": "Korean",
5895
+ "autonym": "한국어",
5896
+ "family": "Koreanic",
5897
+ "flores_path": "kor_Hang",
5898
+ "fleurs_tag": "ko_kr",
5899
+ "commonvoice_hours": 1.7,
5900
+ "commonvoice_locale": "ko",
5901
+ "in_benchmark": true,
5902
+ "task": "language_modeling",
5903
+ "metric": "chrf",
5904
+ "score": 0.9355445912073929,
5905
+ "model": 1.0
5906
+ },
5907
+ {
5908
+ "bcp_47": "ko",
5909
+ "speakers": 78357046,
5910
+ "language_name": "Korean",
5911
+ "autonym": "한국어",
5912
+ "family": "Koreanic",
5913
+ "flores_path": "kor_Hang",
5914
+ "fleurs_tag": "ko_kr",
5915
+ "commonvoice_hours": 1.7,
5916
+ "commonvoice_locale": "ko",
5917
+ "in_benchmark": true,
5918
+ "task": "translation",
5919
+ "metric": "bleu",
5920
+ "score": 0.20332074778330964,
5921
+ "model": 1.0
5922
+ },
5923
+ {
5924
+ "bcp_47": "ko",
5925
+ "speakers": 78357046,
5926
+ "language_name": "Korean",
5927
+ "autonym": "한국어",
5928
+ "family": "Koreanic",
5929
+ "flores_path": "kor_Hang",
5930
+ "fleurs_tag": "ko_kr",
5931
+ "commonvoice_hours": 1.7,
5932
+ "commonvoice_locale": "ko",
5933
+ "in_benchmark": true,
5934
+ "task": "translation",
5935
+ "metric": "chrf",
5936
+ "score": 0.4005255477730261,
5937
+ "model": 1.0
5938
  },
5939
  {
5940
  "bcp_47": "koi",
 
6232
  "family": "Indo-European",
6233
  "flores_path": null,
6234
  "fleurs_tag": null,
6235
+ "commonvoice_hours": 8.1,
6236
  "commonvoice_locale": "kw",
6237
  "in_benchmark": false,
6238
  "task": null,
 
7352
  "family": "Indo-European",
7353
  "flores_path": "mkd_Cyrl",
7354
  "fleurs_tag": "mk_mk",
7355
+ "commonvoice_hours": 19.0,
7356
  "commonvoice_locale": "mk",
7357
  "in_benchmark": true,
7358
  "task": null,
 
7499
  "commonvoice_hours": 20.0,
7500
  "commonvoice_locale": "mr",
7501
  "in_benchmark": true,
7502
+ "task": "classification",
7503
+ "metric": "accuracy",
7504
+ "score": 0.6333333333333333,
7505
+ "model": 1.0
7506
+ },
7507
+ {
7508
+ "bcp_47": "mr",
7509
+ "speakers": 92826300,
7510
+ "language_name": "Marathi",
7511
+ "autonym": "मराठी",
7512
+ "family": "Indo-European",
7513
+ "flores_path": "mar_Deva",
7514
+ "fleurs_tag": "mr_in",
7515
+ "commonvoice_hours": 20.0,
7516
+ "commonvoice_locale": "mr",
7517
+ "in_benchmark": true,
7518
+ "task": "language_modeling",
7519
+ "metric": "chrf",
7520
+ "score": 0.9440892312053646,
7521
+ "model": 1.0
7522
+ },
7523
+ {
7524
+ "bcp_47": "mr",
7525
+ "speakers": 92826300,
7526
+ "language_name": "Marathi",
7527
+ "autonym": "मराठी",
7528
+ "family": "Indo-European",
7529
+ "flores_path": "mar_Deva",
7530
+ "fleurs_tag": "mr_in",
7531
+ "commonvoice_hours": 20.0,
7532
+ "commonvoice_locale": "mr",
7533
+ "in_benchmark": true,
7534
+ "task": "translation",
7535
+ "metric": "bleu",
7536
+ "score": 0.24903049799655144,
7537
+ "model": 1.0
7538
+ },
7539
+ {
7540
+ "bcp_47": "mr",
7541
+ "speakers": 92826300,
7542
+ "language_name": "Marathi",
7543
+ "autonym": "मराठी",
7544
+ "family": "Indo-European",
7545
+ "flores_path": "mar_Deva",
7546
+ "fleurs_tag": "mr_in",
7547
+ "commonvoice_hours": 20.0,
7548
+ "commonvoice_locale": "mr",
7549
+ "in_benchmark": true,
7550
+ "task": "translation",
7551
+ "metric": "chrf",
7552
+ "score": 0.42489125861884175,
7553
+ "model": 1.0
7554
  },
7555
  {
7556
  "bcp_47": "mrd",
 
8504
  "family": "Indo-European",
8505
  "flores_path": null,
8506
  "fleurs_tag": null,
8507
+ "commonvoice_hours": 0.8,
8508
  "commonvoice_locale": "os",
8509
  "in_benchmark": false,
8510
  "task": null,
 
8557
  "in_benchmark": true,
8558
  "task": "language_modeling",
8559
  "metric": "chrf",
8560
+ "score": 0.9025298113664532,
8561
  "model": 1.0
8562
  },
8563
  {
 
8925
  "in_benchmark": true,
8926
  "task": "language_modeling",
8927
  "metric": "chrf",
8928
+ "score": 0.9641423549595803,
8929
  "model": 1.0
8930
  },
8931
  {
 
9352
  "family": "Indo-European",
9353
  "flores_path": "rus_Cyrl",
9354
  "fleurs_tag": "ru_ru",
9355
+ "commonvoice_hours": 243.0,
9356
  "commonvoice_locale": "ru",
9357
  "in_benchmark": true,
9358
+ "task": "classification",
9359
+ "metric": "accuracy",
9360
+ "score": 0.5666666666666667,
9361
+ "model": 1.0
9362
+ },
9363
+ {
9364
+ "bcp_47": "ru",
9365
+ "speakers": 195841151,
9366
+ "language_name": "Russian",
9367
+ "autonym": "Русский",
9368
+ "family": "Indo-European",
9369
+ "flores_path": "rus_Cyrl",
9370
+ "fleurs_tag": "ru_ru",
9371
+ "commonvoice_hours": 243.0,
9372
+ "commonvoice_locale": "ru",
9373
+ "in_benchmark": true,
9374
+ "task": "language_modeling",
9375
+ "metric": "chrf",
9376
+ "score": 0.9663696817874857,
9377
+ "model": 1.0
9378
+ },
9379
+ {
9380
+ "bcp_47": "ru",
9381
+ "speakers": 195841151,
9382
+ "language_name": "Russian",
9383
+ "autonym": "Русский",
9384
+ "family": "Indo-European",
9385
+ "flores_path": "rus_Cyrl",
9386
+ "fleurs_tag": "ru_ru",
9387
+ "commonvoice_hours": 243.0,
9388
+ "commonvoice_locale": "ru",
9389
+ "in_benchmark": true,
9390
+ "task": "translation",
9391
+ "metric": "bleu",
9392
+ "score": 0.26015179309825326,
9393
+ "model": 1.0
9394
+ },
9395
+ {
9396
+ "bcp_47": "ru",
9397
+ "speakers": 195841151,
9398
+ "language_name": "Russian",
9399
+ "autonym": "Русский",
9400
+ "family": "Indo-European",
9401
+ "flores_path": "rus_Cyrl",
9402
+ "fleurs_tag": "ru_ru",
9403
+ "commonvoice_hours": 243.0,
9404
+ "commonvoice_locale": "ru",
9405
+ "in_benchmark": true,
9406
+ "task": "translation",
9407
+ "metric": "chrf",
9408
+ "score": 0.4525762744858351,
9409
+ "model": 1.0
9410
  },
9411
  {
9412
  "bcp_47": "rue",
 
9800
  "family": null,
9801
  "flores_path": null,
9802
  "fleurs_tag": null,
9803
+ "commonvoice_hours": 2.5,
9804
  "commonvoice_locale": "sei",
9805
  "in_benchmark": false,
9806
  "task": null,
 
10379
  "commonvoice_hours": 411.0,
10380
  "commonvoice_locale": "sw",
10381
  "in_benchmark": true,
10382
+ "task": "classification",
10383
+ "metric": "accuracy",
10384
+ "score": 0.5666666666666667,
10385
+ "model": 1.0
10386
  },
10387
  {
10388
+ "bcp_47": "sw",
10389
+ "speakers": 171610296,
10390
+ "language_name": "Swahili",
10391
+ "autonym": "Kiswahili",
10392
  "family": "Atlantic-Congo",
10393
+ "flores_path": "swh_Latn",
10394
+ "fleurs_tag": "sw_ke",
10395
+ "commonvoice_hours": 411.0,
10396
+ "commonvoice_locale": "sw",
10397
+ "in_benchmark": true,
10398
+ "task": "language_modeling",
10399
+ "metric": "chrf",
10400
+ "score": 0.9401745263817055,
10401
+ "model": 1.0
10402
  },
10403
  {
10404
+ "bcp_47": "sw",
10405
+ "speakers": 171610296,
10406
+ "language_name": "Swahili",
10407
+ "autonym": "Kiswahili",
10408
+ "family": "Atlantic-Congo",
10409
+ "flores_path": "swh_Latn",
10410
+ "fleurs_tag": "sw_ke",
10411
+ "commonvoice_hours": 411.0,
10412
+ "commonvoice_locale": "sw",
10413
+ "in_benchmark": true,
10414
+ "task": "translation",
10415
+ "metric": "bleu",
10416
+ "score": 0.30022614000139736,
10417
+ "model": 1.0
10418
+ },
10419
+ {
10420
+ "bcp_47": "sw",
10421
+ "speakers": 171610296,
10422
+ "language_name": "Swahili",
10423
+ "autonym": "Kiswahili",
10424
+ "family": "Atlantic-Congo",
10425
+ "flores_path": "swh_Latn",
10426
+ "fleurs_tag": "sw_ke",
10427
+ "commonvoice_hours": 411.0,
10428
+ "commonvoice_locale": "sw",
10429
+ "in_benchmark": true,
10430
+ "task": "translation",
10431
+ "metric": "chrf",
10432
+ "score": 0.46620999112028233,
10433
+ "model": 1.0
10434
+ },
10435
+ {
10436
+ "bcp_47": "swb",
10437
+ "speakers": 170720,
10438
+ "language_name": "Comorian",
10439
+ "autonym": "Comorian",
10440
+ "family": "Atlantic-Congo",
10441
+ "flores_path": null,
10442
+ "fleurs_tag": null,
10443
+ "commonvoice_hours": null,
10444
+ "commonvoice_locale": null,
10445
+ "in_benchmark": false,
10446
+ "task": null,
10447
+ "metric": null,
10448
+ "score": null,
10449
+ "model": null
10450
+ },
10451
+ {
10452
+ "bcp_47": "swg",
10453
+ "speakers": 801597,
10454
+ "language_name": "Swabian",
10455
+ "autonym": "Swabian",
10456
  "family": "Indo-European",
10457
  "flores_path": null,
10458
  "fleurs_tag": null,
 
10555
  "commonvoice_hours": 234.0,
10556
  "commonvoice_locale": "ta",
10557
  "in_benchmark": true,
10558
+ "task": "classification",
10559
+ "metric": "accuracy",
10560
+ "score": 0.43333333333333335,
10561
+ "model": 1.0
10562
+ },
10563
+ {
10564
+ "bcp_47": "ta",
10565
+ "speakers": 85616159,
10566
+ "language_name": "Tamil",
10567
+ "autonym": "தமிழ்",
10568
+ "family": "Dravidian",
10569
+ "flores_path": "tam_Taml",
10570
+ "fleurs_tag": "ta_in",
10571
+ "commonvoice_hours": 234.0,
10572
+ "commonvoice_locale": "ta",
10573
+ "in_benchmark": true,
10574
+ "task": "language_modeling",
10575
+ "metric": "chrf",
10576
+ "score": 0.9641464401452432,
10577
+ "model": 1.0
10578
+ },
10579
+ {
10580
+ "bcp_47": "ta",
10581
+ "speakers": 85616159,
10582
+ "language_name": "Tamil",
10583
+ "autonym": "தமிழ்",
10584
+ "family": "Dravidian",
10585
+ "flores_path": "tam_Taml",
10586
+ "fleurs_tag": "ta_in",
10587
+ "commonvoice_hours": 234.0,
10588
+ "commonvoice_locale": "ta",
10589
+ "in_benchmark": true,
10590
+ "task": "translation",
10591
+ "metric": "bleu",
10592
+ "score": 0.2528104486727614,
10593
+ "model": 1.0
10594
+ },
10595
+ {
10596
+ "bcp_47": "ta",
10597
+ "speakers": 85616159,
10598
+ "language_name": "Tamil",
10599
+ "autonym": "தமிழ்",
10600
+ "family": "Dravidian",
10601
+ "flores_path": "tam_Taml",
10602
+ "fleurs_tag": "ta_in",
10603
+ "commonvoice_hours": 234.0,
10604
+ "commonvoice_locale": "ta",
10605
+ "in_benchmark": true,
10606
+ "task": "translation",
10607
+ "metric": "chrf",
10608
+ "score": 0.42077045938882934,
10609
+ "model": 1.0
10610
  },
10611
  {
10612
  "bcp_47": "taj",
 
10715
  "commonvoice_hours": 0.3,
10716
  "commonvoice_locale": "te",
10717
  "in_benchmark": true,
10718
+ "task": "classification",
10719
+ "metric": "accuracy",
10720
+ "score": 0.36666666666666664,
10721
+ "model": 1.0
10722
+ },
10723
+ {
10724
+ "bcp_47": "te",
10725
+ "speakers": 95478480,
10726
+ "language_name": "Telugu",
10727
+ "autonym": "తెలుగు",
10728
+ "family": "Dravidian",
10729
+ "flores_path": "tel_Telu",
10730
+ "fleurs_tag": "te_in",
10731
+ "commonvoice_hours": 0.3,
10732
+ "commonvoice_locale": "te",
10733
+ "in_benchmark": true,
10734
+ "task": "language_modeling",
10735
+ "metric": "chrf",
10736
+ "score": 0.9513838296654142,
10737
+ "model": 1.0
10738
+ },
10739
+ {
10740
+ "bcp_47": "te",
10741
+ "speakers": 95478480,
10742
+ "language_name": "Telugu",
10743
+ "autonym": "తెలుగు",
10744
+ "family": "Dravidian",
10745
+ "flores_path": "tel_Telu",
10746
+ "fleurs_tag": "te_in",
10747
+ "commonvoice_hours": 0.3,
10748
+ "commonvoice_locale": "te",
10749
+ "in_benchmark": true,
10750
+ "task": "translation",
10751
+ "metric": "bleu",
10752
+ "score": 0.28338449781147135,
10753
+ "model": 1.0
10754
+ },
10755
+ {
10756
+ "bcp_47": "te",
10757
+ "speakers": 95478480,
10758
+ "language_name": "Telugu",
10759
+ "autonym": "తెలుగు",
10760
+ "family": "Dravidian",
10761
+ "flores_path": "tel_Telu",
10762
+ "fleurs_tag": "te_in",
10763
+ "commonvoice_hours": 0.3,
10764
+ "commonvoice_locale": "te",
10765
+ "in_benchmark": true,
10766
+ "task": "translation",
10767
+ "metric": "chrf",
10768
+ "score": 0.467003606031036,
10769
+ "model": 1.0
10770
  },
10771
  {
10772
  "bcp_47": "tem",
 
11131
  "commonvoice_hours": 128.0,
11132
  "commonvoice_locale": "tr",
11133
  "in_benchmark": true,
11134
+ "task": "classification",
11135
+ "metric": "accuracy",
11136
+ "score": 0.5333333333333333,
11137
+ "model": 1.0
11138
+ },
11139
+ {
11140
+ "bcp_47": "tr",
11141
+ "speakers": 80360704,
11142
+ "language_name": "Turkish",
11143
+ "autonym": "Türkçe",
11144
+ "family": "Turkic",
11145
+ "flores_path": "tur_Latn",
11146
+ "fleurs_tag": "tr_tr",
11147
+ "commonvoice_hours": 128.0,
11148
+ "commonvoice_locale": "tr",
11149
+ "in_benchmark": true,
11150
+ "task": "language_modeling",
11151
+ "metric": "chrf",
11152
+ "score": 0.9446670623712353,
11153
+ "model": 1.0
11154
+ },
11155
+ {
11156
+ "bcp_47": "tr",
11157
+ "speakers": 80360704,
11158
+ "language_name": "Turkish",
11159
+ "autonym": "Türkçe",
11160
+ "family": "Turkic",
11161
+ "flores_path": "tur_Latn",
11162
+ "fleurs_tag": "tr_tr",
11163
+ "commonvoice_hours": 128.0,
11164
+ "commonvoice_locale": "tr",
11165
+ "in_benchmark": true,
11166
+ "task": "translation",
11167
+ "metric": "bleu",
11168
+ "score": 0.2844596261435892,
11169
+ "model": 1.0
11170
+ },
11171
+ {
11172
+ "bcp_47": "tr",
11173
+ "speakers": 80360704,
11174
+ "language_name": "Turkish",
11175
+ "autonym": "Türkçe",
11176
+ "family": "Turkic",
11177
+ "flores_path": "tur_Latn",
11178
+ "fleurs_tag": "tr_tr",
11179
+ "commonvoice_hours": 128.0,
11180
+ "commonvoice_locale": "tr",
11181
+ "in_benchmark": true,
11182
+ "task": "translation",
11183
+ "metric": "chrf",
11184
+ "score": 0.4525478264239361,
11185
+ "model": 1.0
11186
  },
11187
  {
11188
  "bcp_47": "tru",
 
11597
  "in_benchmark": true,
11598
  "task": "language_modeling",
11599
  "metric": "chrf",
11600
+ "score": 0.9182703887696211,
11601
  "model": 1.0
11602
  },
11603
  {
 
11613
  "in_benchmark": true,
11614
  "task": "translation",
11615
  "metric": "bleu",
11616
+ "score": 0.2434522914619727,
11617
  "model": 1.0
11618
  },
11619
  {
 
11723
  "commonvoice_hours": 6.0,
11724
  "commonvoice_locale": "vi",
11725
  "in_benchmark": true,
11726
+ "task": "classification",
11727
+ "metric": "accuracy",
11728
+ "score": 0.6,
11729
+ "model": 1.0
11730
  },
11731
  {
11732
+ "bcp_47": "vi",
11733
+ "speakers": 86222962,
11734
+ "language_name": "Vietnamese",
11735
+ "autonym": "Tiếng Việt",
11736
+ "family": "Austroasiatic",
11737
+ "flores_path": "vie_Latn",
11738
+ "fleurs_tag": "vi_vn",
11739
+ "commonvoice_hours": 6.0,
11740
+ "commonvoice_locale": "vi",
11741
+ "in_benchmark": true,
11742
+ "task": "language_modeling",
11743
+ "metric": "chrf",
11744
+ "score": 0.9580044761495575,
11745
+ "model": 1.0
11746
  },
11747
  {
11748
+ "bcp_47": "vi",
11749
+ "speakers": 86222962,
11750
+ "language_name": "Vietnamese",
11751
+ "autonym": "Tiếng Việt",
11752
+ "family": "Austroasiatic",
11753
+ "flores_path": "vie_Latn",
11754
+ "fleurs_tag": "vi_vn",
11755
+ "commonvoice_hours": 6.0,
11756
+ "commonvoice_locale": "vi",
11757
+ "in_benchmark": true,
11758
+ "task": "translation",
11759
+ "metric": "bleu",
11760
+ "score": 0.25541664062319624,
11761
+ "model": 1.0
11762
+ },
11763
+ {
11764
+ "bcp_47": "vi",
11765
+ "speakers": 86222962,
11766
+ "language_name": "Vietnamese",
11767
+ "autonym": "Tiếng Việt",
11768
+ "family": "Austroasiatic",
11769
+ "flores_path": "vie_Latn",
11770
+ "fleurs_tag": "vi_vn",
11771
+ "commonvoice_hours": 6.0,
11772
+ "commonvoice_locale": "vi",
11773
+ "in_benchmark": true,
11774
+ "task": "translation",
11775
+ "metric": "chrf",
11776
+ "score": 0.43688984396841446,
11777
+ "model": 1.0
11778
+ },
11779
+ {
11780
+ "bcp_47": "vic",
11781
+ "speakers": 3113,
11782
+ "language_name": "Virgin Islands Creole English",
11783
+ "autonym": "Virgin Islands Creole English",
11784
+ "family": "Indo-European",
11785
+ "flores_path": null,
11786
+ "fleurs_tag": null,
11787
+ "commonvoice_hours": null,
11788
+ "commonvoice_locale": null,
11789
+ "in_benchmark": false,
11790
+ "task": null,
11791
+ "metric": null,
11792
+ "score": null,
11793
+ "model": null
11794
+ },
11795
+ {
11796
+ "bcp_47": "vls",
11797
+ "speakers": 1172070,
11798
+ "language_name": "West Flemish",
11799
+ "autonym": "West Flemish",
11800
+ "family": "Indo-European",
11801
+ "flores_path": null,
11802
+ "fleurs_tag": null,
11803
+ "commonvoice_hours": null,
11804
+ "commonvoice_locale": null,
11805
+ "in_benchmark": false,
11806
+ "task": null,
11807
+ "metric": null,
11808
+ "score": null,
11809
+ "model": null
11810
  },
11811
  {
11812
  "bcp_47": "vmf",
 
12315
  "commonvoice_hours": 203.0,
12316
  "commonvoice_locale": "yue",
12317
  "in_benchmark": true,
12318
+ "task": "classification",
12319
+ "metric": "accuracy",
12320
+ "score": 0.43333333333333335,
12321
+ "model": 1.0
12322
+ },
12323
+ {
12324
+ "bcp_47": "yue",
12325
+ "speakers": 79654759,
12326
+ "language_name": "Cantonese",
12327
+ "autonym": "粵語",
12328
+ "family": "Sino-Tibetan",
12329
+ "flores_path": "yue_Hant",
12330
+ "fleurs_tag": "yue_hant_hk",
12331
+ "commonvoice_hours": 203.0,
12332
+ "commonvoice_locale": "yue",
12333
+ "in_benchmark": true,
12334
+ "task": "language_modeling",
12335
+ "metric": "chrf",
12336
+ "score": 0.9022415223117748,
12337
+ "model": 1.0
12338
+ },
12339
+ {
12340
+ "bcp_47": "yue",
12341
+ "speakers": 79654759,
12342
+ "language_name": "Cantonese",
12343
+ "autonym": "粵語",
12344
+ "family": "Sino-Tibetan",
12345
+ "flores_path": "yue_Hant",
12346
+ "fleurs_tag": "yue_hant_hk",
12347
+ "commonvoice_hours": 203.0,
12348
+ "commonvoice_locale": "yue",
12349
+ "in_benchmark": true,
12350
+ "task": "translation",
12351
+ "metric": "bleu",
12352
+ "score": 0.22628178945118504,
12353
+ "model": 1.0
12354
+ },
12355
+ {
12356
+ "bcp_47": "yue",
12357
+ "speakers": 79654759,
12358
+ "language_name": "Cantonese",
12359
+ "autonym": "粵語",
12360
+ "family": "Sino-Tibetan",
12361
+ "flores_path": "yue_Hant",
12362
+ "fleurs_tag": "yue_hant_hk",
12363
+ "commonvoice_hours": 203.0,
12364
+ "commonvoice_locale": "yue",
12365
+ "in_benchmark": true,
12366
+ "task": "translation",
12367
+ "metric": "chrf",
12368
+ "score": 0.4052050858435178,
12369
+ "model": 1.0
12370
  },
12371
  {
12372
  "bcp_47": "za",
 
12477
  "in_benchmark": true,
12478
  "task": "language_modeling",
12479
  "metric": "chrf",
12480
+ "score": 0.862116462347859,
12481
  "model": 12.0
12482
  },
12483
  {
 
12575
  "bcp_47": "en",
12576
  "task": "language_modeling",
12577
  "metric": "chrf",
12578
+ "score": 0.9596433057062642,
12579
  "sentence_nr": 14.5
12580
  },
12581
  {
 
12607
  "bcp_47": "zh",
12608
  "task": "language_modeling",
12609
  "metric": "chrf",
12610
+ "score": 0.9120424742302929,
12611
  "sentence_nr": 14.5
12612
  },
12613
  {
 
12639
  "bcp_47": "en",
12640
  "task": "language_modeling",
12641
  "metric": "chrf",
12642
+ "score": 0.9854618933889567,
12643
  "sentence_nr": 14.5
12644
  },
12645
  {
 
12671
  "bcp_47": "zh",
12672
  "task": "language_modeling",
12673
  "metric": "chrf",
12674
+ "score": 0.93160311345022,
12675
  "sentence_nr": 14.5
12676
  },
12677
  {
 
12703
  "bcp_47": "en",
12704
  "task": "language_modeling",
12705
  "metric": "chrf",
12706
+ "score": 0.9840731165453181,
12707
  "sentence_nr": 14.5
12708
  },
12709
  {
 
12735
  "bcp_47": "zh",
12736
  "task": "language_modeling",
12737
  "metric": "chrf",
12738
+ "score": 0.9308727688438002,
12739
  "sentence_nr": 14.5
12740
  },
12741
  {
 
12767
  "bcp_47": "en",
12768
  "task": "language_modeling",
12769
  "metric": "chrf",
12770
+ "score": 0.9705999747171945,
12771
  "sentence_nr": 14.5
12772
  },
12773
  {
 
12799
  "bcp_47": "zh",
12800
  "task": "language_modeling",
12801
  "metric": "chrf",
12802
+ "score": 0.9098214011017126,
12803
  "sentence_nr": 14.5
12804
  },
12805
  {
 
12831
  "bcp_47": "en",
12832
  "task": "language_modeling",
12833
  "metric": "chrf",
12834
+ "score": 0.9802918604410554,
12835
  "sentence_nr": 14.5
12836
  },
12837
  {
 
12863
  "bcp_47": "zh",
12864
  "task": "language_modeling",
12865
  "metric": "chrf",
12866
+ "score": 0.9309062045243536,
12867
  "sentence_nr": 14.5
12868
  },
12869
  {
 
12895
  "bcp_47": "en",
12896
  "task": "language_modeling",
12897
  "metric": "chrf",
12898
+ "score": 0.9683113542489836,
12899
  "sentence_nr": 14.5
12900
  },
12901
  {
 
12903
  "bcp_47": "en",
12904
  "task": "translation",
12905
  "metric": "bleu",
12906
+ "score": 0.444507882217401,
12907
  "sentence_nr": 14.5
12908
  },
12909
  {
 
12927
  "bcp_47": "zh",
12928
  "task": "language_modeling",
12929
  "metric": "chrf",
12930
+ "score": 0.9233418215760759,
12931
  "sentence_nr": 14.5
12932
  },
12933
  {
 
12959
  "bcp_47": "ar",
12960
  "task": "language_modeling",
12961
  "metric": "chrf",
12962
+ "score": 0.9392314289764625,
12963
  "sentence_nr": 14.5
12964
  },
12965
  {
 
12978
  "score": 0.4684314458952127,
12979
  "sentence_nr": 14.5
12980
  },
12981
+ {
12982
+ "model": "meta-llama/llama-3.3-70b-instruct",
12983
+ "bcp_47": "arz",
12984
+ "task": "classification",
12985
+ "metric": "accuracy",
12986
+ "score": 0.4,
12987
+ "sentence_nr": 14.5
12988
+ },
12989
+ {
12990
+ "model": "meta-llama/llama-3.3-70b-instruct",
12991
+ "bcp_47": "arz",
12992
+ "task": "language_modeling",
12993
+ "metric": "chrf",
12994
+ "score": 0.930329195667362,
12995
+ "sentence_nr": 14.5
12996
+ },
12997
+ {
12998
+ "model": "meta-llama/llama-3.3-70b-instruct",
12999
+ "bcp_47": "arz",
13000
+ "task": "translation",
13001
+ "metric": "bleu",
13002
+ "score": 0.19793415292805128,
13003
+ "sentence_nr": 14.5
13004
+ },
13005
+ {
13006
+ "model": "meta-llama/llama-3.3-70b-instruct",
13007
+ "bcp_47": "arz",
13008
+ "task": "translation",
13009
+ "metric": "chrf",
13010
+ "score": 0.3881278724939126,
13011
+ "sentence_nr": 14.5
13012
+ },
13013
  {
13014
  "model": "meta-llama/llama-3.3-70b-instruct",
13015
  "bcp_47": "bn",
 
13023
  "bcp_47": "bn",
13024
  "task": "language_modeling",
13025
  "metric": "chrf",
13026
+ "score": 0.9097658392566466,
13027
  "sentence_nr": 14.5
13028
  },
13029
  {
 
13042
  "score": 0.4076175886917154,
13043
  "sentence_nr": 14.5
13044
  },
13045
+ {
13046
+ "model": "meta-llama/llama-3.3-70b-instruct",
13047
+ "bcp_47": "de",
13048
+ "task": "classification",
13049
+ "metric": "accuracy",
13050
+ "score": 0.6666666666666666,
13051
+ "sentence_nr": 14.5
13052
+ },
13053
+ {
13054
+ "model": "meta-llama/llama-3.3-70b-instruct",
13055
+ "bcp_47": "de",
13056
+ "task": "language_modeling",
13057
+ "metric": "chrf",
13058
+ "score": 0.9594656177914042,
13059
+ "sentence_nr": 14.5
13060
+ },
13061
+ {
13062
+ "model": "meta-llama/llama-3.3-70b-instruct",
13063
+ "bcp_47": "de",
13064
+ "task": "translation",
13065
+ "metric": "bleu",
13066
+ "score": 0.3207642359472324,
13067
+ "sentence_nr": 14.5
13068
+ },
13069
+ {
13070
+ "model": "meta-llama/llama-3.3-70b-instruct",
13071
+ "bcp_47": "de",
13072
+ "task": "translation",
13073
+ "metric": "chrf",
13074
+ "score": 0.49973270743869647,
13075
+ "sentence_nr": 14.5
13076
+ },
13077
  {
13078
  "model": "meta-llama/llama-3.3-70b-instruct",
13079
  "bcp_47": "en",
 
13087
  "bcp_47": "en",
13088
  "task": "language_modeling",
13089
  "metric": "chrf",
13090
+ "score": 0.9810108607325073,
13091
  "sentence_nr": 14.5
13092
  },
13093
  {
 
13119
  "bcp_47": "es",
13120
  "task": "language_modeling",
13121
  "metric": "chrf",
13122
+ "score": 0.9569342865902168,
13123
  "sentence_nr": 14.5
13124
  },
13125
  {
 
13140
  },
13141
  {
13142
  "model": "meta-llama/llama-3.3-70b-instruct",
13143
+ "bcp_47": "fa",
13144
  "task": "classification",
13145
  "metric": "accuracy",
13146
+ "score": 0.4,
13147
  "sentence_nr": 14.5
13148
  },
13149
  {
13150
  "model": "meta-llama/llama-3.3-70b-instruct",
13151
+ "bcp_47": "fa",
13152
  "task": "language_modeling",
13153
  "metric": "chrf",
13154
+ "score": 0.9414698824984596,
13155
  "sentence_nr": 14.5
13156
  },
13157
  {
13158
  "model": "meta-llama/llama-3.3-70b-instruct",
13159
+ "bcp_47": "fa",
13160
  "task": "translation",
13161
  "metric": "bleu",
13162
+ "score": 0.26232478733341374,
13163
  "sentence_nr": 14.5
13164
  },
13165
  {
13166
  "model": "meta-llama/llama-3.3-70b-instruct",
13167
+ "bcp_47": "fa",
13168
  "task": "translation",
13169
  "metric": "chrf",
13170
+ "score": 0.44641220608314985,
13171
  "sentence_nr": 14.5
13172
  },
13173
  {
13174
  "model": "meta-llama/llama-3.3-70b-instruct",
13175
+ "bcp_47": "fil",
13176
  "task": "classification",
13177
  "metric": "accuracy",
13178
+ "score": 0.43333333333333335,
13179
  "sentence_nr": 14.5
13180
  },
13181
  {
13182
  "model": "meta-llama/llama-3.3-70b-instruct",
13183
+ "bcp_47": "fil",
13184
  "task": "language_modeling",
13185
  "metric": "chrf",
13186
+ "score": 0.9402707475255596,
13187
  "sentence_nr": 14.5
13188
  },
13189
  {
13190
  "model": "meta-llama/llama-3.3-70b-instruct",
13191
+ "bcp_47": "fil",
13192
  "task": "translation",
13193
  "metric": "bleu",
13194
+ "score": 0.29097818784870333,
13195
  "sentence_nr": 14.5
13196
  },
13197
  {
13198
  "model": "meta-llama/llama-3.3-70b-instruct",
13199
+ "bcp_47": "fil",
13200
  "task": "translation",
13201
  "metric": "chrf",
13202
+ "score": 0.44978114149245985,
13203
  "sentence_nr": 14.5
13204
  },
13205
  {
13206
  "model": "meta-llama/llama-3.3-70b-instruct",
13207
+ "bcp_47": "fr",
13208
  "task": "classification",
13209
  "metric": "accuracy",
13210
+ "score": 0.5333333333333333,
13211
  "sentence_nr": 14.5
13212
  },
13213
  {
13214
  "model": "meta-llama/llama-3.3-70b-instruct",
13215
+ "bcp_47": "fr",
13216
  "task": "language_modeling",
13217
  "metric": "chrf",
13218
+ "score": 0.9815706066541411,
13219
  "sentence_nr": 14.5
13220
  },
13221
  {
13222
  "model": "meta-llama/llama-3.3-70b-instruct",
13223
+ "bcp_47": "fr",
13224
  "task": "translation",
13225
  "metric": "bleu",
13226
+ "score": 0.3193235920661593,
13227
  "sentence_nr": 14.5
13228
  },
13229
  {
13230
  "model": "meta-llama/llama-3.3-70b-instruct",
13231
+ "bcp_47": "fr",
13232
  "task": "translation",
13233
  "metric": "chrf",
13234
+ "score": 0.4875691290722964,
13235
  "sentence_nr": 14.5
13236
  },
13237
  {
13238
  "model": "meta-llama/llama-3.3-70b-instruct",
13239
+ "bcp_47": "gu",
13240
  "task": "classification",
13241
  "metric": "accuracy",
13242
+ "score": 0.43333333333333335,
13243
  "sentence_nr": 14.5
13244
  },
13245
  {
13246
  "model": "meta-llama/llama-3.3-70b-instruct",
13247
+ "bcp_47": "gu",
13248
  "task": "language_modeling",
13249
  "metric": "chrf",
13250
+ "score": 0.938086045460355,
13251
  "sentence_nr": 14.5
13252
  },
13253
  {
13254
  "model": "meta-llama/llama-3.3-70b-instruct",
13255
+ "bcp_47": "gu",
13256
  "task": "translation",
13257
  "metric": "bleu",
13258
+ "score": 0.26442484966880464,
13259
  "sentence_nr": 14.5
13260
  },
13261
  {
13262
  "model": "meta-llama/llama-3.3-70b-instruct",
13263
+ "bcp_47": "gu",
13264
  "task": "translation",
13265
  "metric": "chrf",
13266
+ "score": 0.44452182973195975,
13267
  "sentence_nr": 14.5
13268
  },
13269
  {
13270
  "model": "meta-llama/llama-3.3-70b-instruct",
13271
+ "bcp_47": "hi",
13272
  "task": "classification",
13273
  "metric": "accuracy",
13274
+ "score": 0.5333333333333333,
13275
  "sentence_nr": 14.5
13276
  },
13277
  {
13278
  "model": "meta-llama/llama-3.3-70b-instruct",
13279
+ "bcp_47": "hi",
13280
  "task": "language_modeling",
13281
  "metric": "chrf",
13282
+ "score": 0.9428185393832219,
13283
  "sentence_nr": 14.5
13284
  },
13285
  {
13286
  "model": "meta-llama/llama-3.3-70b-instruct",
13287
+ "bcp_47": "hi",
13288
  "task": "translation",
13289
  "metric": "bleu",
13290
+ "score": 0.31956422674397006,
13291
  "sentence_nr": 14.5
13292
  },
13293
  {
13294
  "model": "meta-llama/llama-3.3-70b-instruct",
13295
+ "bcp_47": "hi",
13296
  "task": "translation",
13297
  "metric": "chrf",
13298
+ "score": 0.4896277852320754,
13299
+ "sentence_nr": 14.5
13300
+ },
13301
+ {
13302
+ "model": "meta-llama/llama-3.3-70b-instruct",
13303
+ "bcp_47": "id",
13304
+ "task": "classification",
13305
+ "metric": "accuracy",
13306
+ "score": 0.6333333333333333,
13307
+ "sentence_nr": 14.5
13308
+ },
13309
+ {
13310
+ "model": "meta-llama/llama-3.3-70b-instruct",
13311
+ "bcp_47": "id",
13312
+ "task": "language_modeling",
13313
+ "metric": "chrf",
13314
+ "score": 0.9598314474300775,
13315
+ "sentence_nr": 14.5
13316
+ },
13317
+ {
13318
+ "model": "meta-llama/llama-3.3-70b-instruct",
13319
+ "bcp_47": "id",
13320
+ "task": "translation",
13321
+ "metric": "bleu",
13322
+ "score": 0.29354203311552335,
13323
+ "sentence_nr": 14.5
13324
+ },
13325
+ {
13326
+ "model": "meta-llama/llama-3.3-70b-instruct",
13327
+ "bcp_47": "id",
13328
+ "task": "translation",
13329
+ "metric": "chrf",
13330
+ "score": 0.4723493656022861,
13331
+ "sentence_nr": 14.5
13332
+ },
13333
+ {
13334
+ "model": "meta-llama/llama-3.3-70b-instruct",
13335
+ "bcp_47": "it",
13336
+ "task": "classification",
13337
+ "metric": "accuracy",
13338
+ "score": 0.6666666666666666,
13339
+ "sentence_nr": 14.5
13340
+ },
13341
+ {
13342
+ "model": "meta-llama/llama-3.3-70b-instruct",
13343
+ "bcp_47": "it",
13344
+ "task": "language_modeling",
13345
+ "metric": "chrf",
13346
+ "score": 0.9439490413212892,
13347
+ "sentence_nr": 14.5
13348
+ },
13349
+ {
13350
+ "model": "meta-llama/llama-3.3-70b-instruct",
13351
+ "bcp_47": "it",
13352
+ "task": "translation",
13353
+ "metric": "bleu",
13354
+ "score": 0.28142583904826096,
13355
+ "sentence_nr": 14.5
13356
+ },
13357
+ {
13358
+ "model": "meta-llama/llama-3.3-70b-instruct",
13359
+ "bcp_47": "it",
13360
+ "task": "translation",
13361
+ "metric": "chrf",
13362
+ "score": 0.4707591889357925,
13363
+ "sentence_nr": 14.5
13364
+ },
13365
+ {
13366
+ "model": "meta-llama/llama-3.3-70b-instruct",
13367
+ "bcp_47": "ja",
13368
+ "task": "classification",
13369
+ "metric": "accuracy",
13370
+ "score": 0.6333333333333333,
13371
+ "sentence_nr": 14.5
13372
+ },
13373
+ {
13374
+ "model": "meta-llama/llama-3.3-70b-instruct",
13375
+ "bcp_47": "ja",
13376
+ "task": "language_modeling",
13377
+ "metric": "chrf",
13378
+ "score": 0.9371132855221468,
13379
+ "sentence_nr": 14.5
13380
+ },
13381
+ {
13382
+ "model": "meta-llama/llama-3.3-70b-instruct",
13383
+ "bcp_47": "ja",
13384
+ "task": "translation",
13385
+ "metric": "bleu",
13386
+ "score": 0.2723410893967824,
13387
+ "sentence_nr": 14.5
13388
+ },
13389
+ {
13390
+ "model": "meta-llama/llama-3.3-70b-instruct",
13391
+ "bcp_47": "ja",
13392
+ "task": "translation",
13393
+ "metric": "chrf",
13394
+ "score": 0.43929453749366865,
13395
+ "sentence_nr": 14.5
13396
+ },
13397
+ {
13398
+ "model": "meta-llama/llama-3.3-70b-instruct",
13399
+ "bcp_47": "jv",
13400
+ "task": "classification",
13401
+ "metric": "accuracy",
13402
+ "score": 0.4666666666666667,
13403
+ "sentence_nr": 14.5
13404
+ },
13405
+ {
13406
+ "model": "meta-llama/llama-3.3-70b-instruct",
13407
+ "bcp_47": "jv",
13408
+ "task": "language_modeling",
13409
+ "metric": "chrf",
13410
+ "score": 0.9298143194922116,
13411
+ "sentence_nr": 14.5
13412
+ },
13413
+ {
13414
+ "model": "meta-llama/llama-3.3-70b-instruct",
13415
+ "bcp_47": "jv",
13416
+ "task": "translation",
13417
+ "metric": "bleu",
13418
+ "score": 0.23729186537968905,
13419
+ "sentence_nr": 14.5
13420
+ },
13421
+ {
13422
+ "model": "meta-llama/llama-3.3-70b-instruct",
13423
+ "bcp_47": "jv",
13424
+ "task": "translation",
13425
+ "metric": "chrf",
13426
+ "score": 0.4198940727847352,
13427
+ "sentence_nr": 14.5
13428
+ },
13429
+ {
13430
+ "model": "meta-llama/llama-3.3-70b-instruct",
13431
+ "bcp_47": "ko",
13432
+ "task": "classification",
13433
+ "metric": "accuracy",
13434
+ "score": 0.5333333333333333,
13435
+ "sentence_nr": 14.5
13436
+ },
13437
+ {
13438
+ "model": "meta-llama/llama-3.3-70b-instruct",
13439
+ "bcp_47": "ko",
13440
+ "task": "language_modeling",
13441
+ "metric": "chrf",
13442
+ "score": 0.9355445912073929,
13443
+ "sentence_nr": 14.5
13444
+ },
13445
+ {
13446
+ "model": "meta-llama/llama-3.3-70b-instruct",
13447
+ "bcp_47": "ko",
13448
+ "task": "translation",
13449
+ "metric": "bleu",
13450
+ "score": 0.20332074778330964,
13451
+ "sentence_nr": 14.5
13452
+ },
13453
+ {
13454
+ "model": "meta-llama/llama-3.3-70b-instruct",
13455
+ "bcp_47": "ko",
13456
+ "task": "translation",
13457
+ "metric": "chrf",
13458
+ "score": 0.4005255477730261,
13459
+ "sentence_nr": 14.5
13460
+ },
13461
+ {
13462
+ "model": "meta-llama/llama-3.3-70b-instruct",
13463
+ "bcp_47": "mr",
13464
+ "task": "classification",
13465
+ "metric": "accuracy",
13466
+ "score": 0.6333333333333333,
13467
+ "sentence_nr": 14.5
13468
+ },
13469
+ {
13470
+ "model": "meta-llama/llama-3.3-70b-instruct",
13471
+ "bcp_47": "mr",
13472
+ "task": "language_modeling",
13473
+ "metric": "chrf",
13474
+ "score": 0.9440892312053646,
13475
+ "sentence_nr": 14.5
13476
+ },
13477
+ {
13478
+ "model": "meta-llama/llama-3.3-70b-instruct",
13479
+ "bcp_47": "mr",
13480
+ "task": "translation",
13481
+ "metric": "bleu",
13482
+ "score": 0.24903049799655144,
13483
+ "sentence_nr": 14.5
13484
+ },
13485
+ {
13486
+ "model": "meta-llama/llama-3.3-70b-instruct",
13487
+ "bcp_47": "mr",
13488
+ "task": "translation",
13489
+ "metric": "chrf",
13490
+ "score": 0.42489125861884175,
13491
+ "sentence_nr": 14.5
13492
+ },
13493
+ {
13494
+ "model": "meta-llama/llama-3.3-70b-instruct",
13495
+ "bcp_47": "pa",
13496
+ "task": "classification",
13497
+ "metric": "accuracy",
13498
+ "score": 0.4,
13499
+ "sentence_nr": 14.5
13500
+ },
13501
+ {
13502
+ "model": "meta-llama/llama-3.3-70b-instruct",
13503
+ "bcp_47": "pa",
13504
+ "task": "language_modeling",
13505
+ "metric": "chrf",
13506
+ "score": 0.9025298113664532,
13507
+ "sentence_nr": 14.5
13508
+ },
13509
+ {
13510
+ "model": "meta-llama/llama-3.3-70b-instruct",
13511
+ "bcp_47": "pa",
13512
+ "task": "translation",
13513
+ "metric": "bleu",
13514
+ "score": 0.3368333727390049,
13515
+ "sentence_nr": 14.5
13516
+ },
13517
+ {
13518
+ "model": "meta-llama/llama-3.3-70b-instruct",
13519
+ "bcp_47": "pa",
13520
+ "task": "translation",
13521
+ "metric": "chrf",
13522
+ "score": 0.4873541452250132,
13523
+ "sentence_nr": 14.5
13524
+ },
13525
+ {
13526
+ "model": "meta-llama/llama-3.3-70b-instruct",
13527
+ "bcp_47": "pt",
13528
+ "task": "classification",
13529
+ "metric": "accuracy",
13530
+ "score": 0.5,
13531
+ "sentence_nr": 14.5
13532
+ },
13533
+ {
13534
+ "model": "meta-llama/llama-3.3-70b-instruct",
13535
+ "bcp_47": "pt",
13536
+ "task": "language_modeling",
13537
+ "metric": "chrf",
13538
+ "score": 0.9641423549595803,
13539
+ "sentence_nr": 14.5
13540
+ },
13541
+ {
13542
+ "model": "meta-llama/llama-3.3-70b-instruct",
13543
+ "bcp_47": "pt",
13544
+ "task": "translation",
13545
+ "metric": "bleu",
13546
+ "score": 0.3110105331834714,
13547
+ "sentence_nr": 14.5
13548
+ },
13549
+ {
13550
+ "model": "meta-llama/llama-3.3-70b-instruct",
13551
+ "bcp_47": "pt",
13552
+ "task": "translation",
13553
+ "metric": "chrf",
13554
+ "score": 0.49172080600981716,
13555
+ "sentence_nr": 14.5
13556
+ },
13557
+ {
13558
+ "model": "meta-llama/llama-3.3-70b-instruct",
13559
+ "bcp_47": "ru",
13560
+ "task": "classification",
13561
+ "metric": "accuracy",
13562
+ "score": 0.5666666666666667,
13563
+ "sentence_nr": 14.5
13564
+ },
13565
+ {
13566
+ "model": "meta-llama/llama-3.3-70b-instruct",
13567
+ "bcp_47": "ru",
13568
+ "task": "language_modeling",
13569
+ "metric": "chrf",
13570
+ "score": 0.9663696817874857,
13571
+ "sentence_nr": 14.5
13572
+ },
13573
+ {
13574
+ "model": "meta-llama/llama-3.3-70b-instruct",
13575
+ "bcp_47": "ru",
13576
+ "task": "translation",
13577
+ "metric": "bleu",
13578
+ "score": 0.26015179309825326,
13579
+ "sentence_nr": 14.5
13580
+ },
13581
+ {
13582
+ "model": "meta-llama/llama-3.3-70b-instruct",
13583
+ "bcp_47": "ru",
13584
+ "task": "translation",
13585
+ "metric": "chrf",
13586
+ "score": 0.4525762744858351,
13587
+ "sentence_nr": 14.5
13588
+ },
13589
+ {
13590
+ "model": "meta-llama/llama-3.3-70b-instruct",
13591
+ "bcp_47": "sw",
13592
+ "task": "classification",
13593
+ "metric": "accuracy",
13594
+ "score": 0.5666666666666667,
13595
+ "sentence_nr": 14.5
13596
+ },
13597
+ {
13598
+ "model": "meta-llama/llama-3.3-70b-instruct",
13599
+ "bcp_47": "sw",
13600
+ "task": "language_modeling",
13601
+ "metric": "chrf",
13602
+ "score": 0.9401745263817055,
13603
+ "sentence_nr": 14.5
13604
+ },
13605
+ {
13606
+ "model": "meta-llama/llama-3.3-70b-instruct",
13607
+ "bcp_47": "sw",
13608
+ "task": "translation",
13609
+ "metric": "bleu",
13610
+ "score": 0.30022614000139736,
13611
+ "sentence_nr": 14.5
13612
+ },
13613
+ {
13614
+ "model": "meta-llama/llama-3.3-70b-instruct",
13615
+ "bcp_47": "sw",
13616
+ "task": "translation",
13617
+ "metric": "chrf",
13618
+ "score": 0.46620999112028233,
13619
+ "sentence_nr": 14.5
13620
+ },
13621
+ {
13622
+ "model": "meta-llama/llama-3.3-70b-instruct",
13623
+ "bcp_47": "ta",
13624
+ "task": "classification",
13625
+ "metric": "accuracy",
13626
+ "score": 0.43333333333333335,
13627
+ "sentence_nr": 14.5
13628
+ },
13629
+ {
13630
+ "model": "meta-llama/llama-3.3-70b-instruct",
13631
+ "bcp_47": "ta",
13632
+ "task": "language_modeling",
13633
+ "metric": "chrf",
13634
+ "score": 0.9641464401452432,
13635
+ "sentence_nr": 14.5
13636
+ },
13637
+ {
13638
+ "model": "meta-llama/llama-3.3-70b-instruct",
13639
+ "bcp_47": "ta",
13640
+ "task": "translation",
13641
+ "metric": "bleu",
13642
+ "score": 0.2528104486727614,
13643
+ "sentence_nr": 14.5
13644
+ },
13645
+ {
13646
+ "model": "meta-llama/llama-3.3-70b-instruct",
13647
+ "bcp_47": "ta",
13648
+ "task": "translation",
13649
+ "metric": "chrf",
13650
+ "score": 0.42077045938882934,
13651
+ "sentence_nr": 14.5
13652
+ },
13653
+ {
13654
+ "model": "meta-llama/llama-3.3-70b-instruct",
13655
+ "bcp_47": "te",
13656
+ "task": "classification",
13657
+ "metric": "accuracy",
13658
+ "score": 0.36666666666666664,
13659
+ "sentence_nr": 14.5
13660
+ },
13661
+ {
13662
+ "model": "meta-llama/llama-3.3-70b-instruct",
13663
+ "bcp_47": "te",
13664
+ "task": "language_modeling",
13665
+ "metric": "chrf",
13666
+ "score": 0.9513838296654142,
13667
+ "sentence_nr": 14.5
13668
+ },
13669
+ {
13670
+ "model": "meta-llama/llama-3.3-70b-instruct",
13671
+ "bcp_47": "te",
13672
+ "task": "translation",
13673
+ "metric": "bleu",
13674
+ "score": 0.28338449781147135,
13675
+ "sentence_nr": 14.5
13676
+ },
13677
+ {
13678
+ "model": "meta-llama/llama-3.3-70b-instruct",
13679
+ "bcp_47": "te",
13680
+ "task": "translation",
13681
+ "metric": "chrf",
13682
+ "score": 0.467003606031036,
13683
+ "sentence_nr": 14.5
13684
+ },
13685
+ {
13686
+ "model": "meta-llama/llama-3.3-70b-instruct",
13687
+ "bcp_47": "tr",
13688
+ "task": "classification",
13689
+ "metric": "accuracy",
13690
+ "score": 0.5333333333333333,
13691
+ "sentence_nr": 14.5
13692
+ },
13693
+ {
13694
+ "model": "meta-llama/llama-3.3-70b-instruct",
13695
+ "bcp_47": "tr",
13696
+ "task": "language_modeling",
13697
+ "metric": "chrf",
13698
+ "score": 0.9446670623712353,
13699
+ "sentence_nr": 14.5
13700
+ },
13701
+ {
13702
+ "model": "meta-llama/llama-3.3-70b-instruct",
13703
+ "bcp_47": "tr",
13704
+ "task": "translation",
13705
+ "metric": "bleu",
13706
+ "score": 0.2844596261435892,
13707
+ "sentence_nr": 14.5
13708
+ },
13709
+ {
13710
+ "model": "meta-llama/llama-3.3-70b-instruct",
13711
+ "bcp_47": "tr",
13712
+ "task": "translation",
13713
+ "metric": "chrf",
13714
+ "score": 0.4525478264239361,
13715
+ "sentence_nr": 14.5
13716
+ },
13717
+ {
13718
+ "model": "meta-llama/llama-3.3-70b-instruct",
13719
+ "bcp_47": "ur",
13720
+ "task": "classification",
13721
+ "metric": "accuracy",
13722
+ "score": 0.5,
13723
+ "sentence_nr": 14.5
13724
+ },
13725
+ {
13726
+ "model": "meta-llama/llama-3.3-70b-instruct",
13727
+ "bcp_47": "ur",
13728
+ "task": "language_modeling",
13729
+ "metric": "chrf",
13730
+ "score": 0.9182703887696211,
13731
+ "sentence_nr": 14.5
13732
+ },
13733
+ {
13734
+ "model": "meta-llama/llama-3.3-70b-instruct",
13735
+ "bcp_47": "ur",
13736
+ "task": "translation",
13737
+ "metric": "bleu",
13738
+ "score": 0.2434522914619727,
13739
+ "sentence_nr": 14.5
13740
+ },
13741
+ {
13742
+ "model": "meta-llama/llama-3.3-70b-instruct",
13743
+ "bcp_47": "ur",
13744
+ "task": "translation",
13745
+ "metric": "chrf",
13746
+ "score": 0.42196914378741973,
13747
+ "sentence_nr": 14.5
13748
+ },
13749
+ {
13750
+ "model": "meta-llama/llama-3.3-70b-instruct",
13751
+ "bcp_47": "vi",
13752
+ "task": "classification",
13753
+ "metric": "accuracy",
13754
+ "score": 0.6,
13755
+ "sentence_nr": 14.5
13756
+ },
13757
+ {
13758
+ "model": "meta-llama/llama-3.3-70b-instruct",
13759
+ "bcp_47": "vi",
13760
+ "task": "language_modeling",
13761
+ "metric": "chrf",
13762
+ "score": 0.9580044761495575,
13763
+ "sentence_nr": 14.5
13764
+ },
13765
+ {
13766
+ "model": "meta-llama/llama-3.3-70b-instruct",
13767
+ "bcp_47": "vi",
13768
+ "task": "translation",
13769
+ "metric": "bleu",
13770
+ "score": 0.25541664062319624,
13771
+ "sentence_nr": 14.5
13772
+ },
13773
+ {
13774
+ "model": "meta-llama/llama-3.3-70b-instruct",
13775
+ "bcp_47": "vi",
13776
+ "task": "translation",
13777
+ "metric": "chrf",
13778
+ "score": 0.43688984396841446,
13779
+ "sentence_nr": 14.5
13780
+ },
13781
+ {
13782
+ "model": "meta-llama/llama-3.3-70b-instruct",
13783
+ "bcp_47": "yue",
13784
+ "task": "classification",
13785
+ "metric": "accuracy",
13786
+ "score": 0.43333333333333335,
13787
+ "sentence_nr": 14.5
13788
+ },
13789
+ {
13790
+ "model": "meta-llama/llama-3.3-70b-instruct",
13791
+ "bcp_47": "yue",
13792
+ "task": "language_modeling",
13793
+ "metric": "chrf",
13794
+ "score": 0.9022415223117748,
13795
+ "sentence_nr": 14.5
13796
+ },
13797
+ {
13798
+ "model": "meta-llama/llama-3.3-70b-instruct",
13799
+ "bcp_47": "yue",
13800
+ "task": "translation",
13801
+ "metric": "bleu",
13802
+ "score": 0.22628178945118504,
13803
+ "sentence_nr": 14.5
13804
+ },
13805
+ {
13806
+ "model": "meta-llama/llama-3.3-70b-instruct",
13807
+ "bcp_47": "yue",
13808
+ "task": "translation",
13809
+ "metric": "chrf",
13810
+ "score": 0.4052050858435178,
13811
  "sentence_nr": 14.5
13812
  },
13813
  {
 
13823
  "bcp_47": "zh",
13824
  "task": "language_modeling",
13825
  "metric": "chrf",
13826
+ "score": 0.9003842558834025,
13827
  "sentence_nr": 14.5
13828
  },
13829
  {
 
13855
  "bcp_47": "en",
13856
  "task": "language_modeling",
13857
  "metric": "chrf",
13858
+ "score": 0.9312514772455793,
13859
  "sentence_nr": 14.5
13860
  },
13861
  {
 
13887
  "bcp_47": "zh",
13888
  "task": "language_modeling",
13889
  "metric": "chrf",
13890
+ "score": 0.831019102021034,
13891
  "sentence_nr": 14.5
13892
  },
13893
  {
 
13919
  "bcp_47": "en",
13920
  "task": "language_modeling",
13921
  "metric": "chrf",
13922
+ "score": 0.9126664788853867,
13923
  "sentence_nr": 14.5
13924
  },
13925
  {
 
13951
  "bcp_47": "zh",
13952
  "task": "language_modeling",
13953
  "metric": "chrf",
13954
+ "score": 0.8098290899553928,
13955
  "sentence_nr": 14.5
13956
  },
13957
  {
 
13983
  "bcp_47": "en",
13984
  "task": "language_modeling",
13985
  "metric": "chrf",
13986
+ "score": 0.8397325387031247,
13987
  "sentence_nr": 14.5
13988
  },
13989
  {
 
14015
  "bcp_47": "zh",
14016
  "task": "language_modeling",
14017
  "metric": "chrf",
14018
+ "score": 0.9167475699419941,
14019
  "sentence_nr": 14.5
14020
  },
14021
  {
 
14047
  "bcp_47": "en",
14048
  "task": "language_modeling",
14049
  "metric": "chrf",
14050
+ "score": 0.9807297060840695,
14051
  "sentence_nr": 14.5
14052
  },
14053
  {
 
14079
  "bcp_47": "zh",
14080
  "task": "language_modeling",
14081
  "metric": "chrf",
14082
+ "score": 0.9313441068235117,
14083
  "sentence_nr": 14.5
14084
  },
14085
  {
 
14111
  "bcp_47": "en",
14112
  "task": "language_modeling",
14113
  "metric": "chrf",
14114
+ "score": 0.5225508930892153,
14115
  "sentence_nr": 14.5
14116
  },
14117
  {
 
14143
  "bcp_47": "zh",
14144
  "task": "language_modeling",
14145
  "metric": "chrf",
14146
+ "score": 0.4174856398225174,
14147
  "sentence_nr": 14.5
14148
  },
14149
  {