davidpomerenke commited on
Commit
95c4e14
·
verified ·
1 Parent(s): 088f96f

Upload from GitHub Actions: Update evaluation results

Browse files
Files changed (3) hide show
  1. languages.json +2 -2
  2. models.json +118 -178
  3. results.json +2 -2
languages.json CHANGED
@@ -79,7 +79,7 @@
79
  "family":"Indo-European",
80
  "flores_path":"fra_Latn",
81
  "fleurs_tag":"fr_fr",
82
- "commonvoice_hours":1072.0,
83
  "commonvoice_locale":"fr",
84
  "in_benchmark":true
85
  },
@@ -2167,7 +2167,7 @@
2167
  "family":"Indo-European",
2168
  "flores_path":"glg_Latn",
2169
  "fleurs_tag":"gl_es",
2170
- "commonvoice_hours":163.0,
2171
  "commonvoice_locale":"gl",
2172
  "in_benchmark":true
2173
  },
 
79
  "family":"Indo-European",
80
  "flores_path":"fra_Latn",
81
  "fleurs_tag":"fr_fr",
82
+ "commonvoice_hours":1073.0,
83
  "commonvoice_locale":"fr",
84
  "in_benchmark":true
85
  },
 
2167
  "family":"Indo-European",
2168
  "flores_path":"glg_Latn",
2169
  "fleurs_tag":"gl_es",
2170
+ "commonvoice_hours":164.0,
2171
  "commonvoice_locale":"gl",
2172
  "in_benchmark":true
2173
  },
models.json CHANGED
@@ -1,24 +1,4 @@
1
  [
2
- {
3
- "id":"ai21\/jamba-large-1.7",
4
- "name":"Jamba Large 1.7",
5
- "provider_name":"AI21",
6
- "cost":8.0,
7
- "hf_id":"ai21labs\/AI21-Jamba-Large-1.7",
8
- "size":398555145696.0,
9
- "type":"open-source",
10
- "license":"Other",
11
- "creation_date":1751414400000,
12
- "tasks":[
13
- "translation_from",
14
- "translation_to",
15
- "classification",
16
- "mmlu",
17
- "arc",
18
- "truthfulqa",
19
- "mgsm"
20
- ]
21
- },
22
  {
23
  "id":"amazon\/nova-micro-v1",
24
  "name":"Nova Micro 1.0",
@@ -40,15 +20,15 @@
40
  ]
41
  },
42
  {
43
- "id":"anthracite-org\/magnum-v4-72b",
44
- "name":"Magnum v4 72B",
45
- "provider_name":"Magnum v4 72B",
46
- "cost":5.0,
47
- "hf_id":"anthracite-org\/magnum-v4-72b",
48
- "size":72706203648.0,
49
- "type":"open-source",
50
- "license":"Apache 2.0",
51
- "creation_date":1726790400000,
52
  "tasks":[
53
  "translation_from",
54
  "translation_to",
@@ -99,26 +79,6 @@
99
  "mgsm"
100
  ]
101
  },
102
- {
103
- "id":"arcee-ai\/virtuoso-large",
104
- "name":"Virtuoso Large",
105
- "provider_name":"Arcee AI",
106
- "cost":1.2,
107
- "hf_id":"arcee-ai\/Virtuoso-Large",
108
- "size":72706203648.0,
109
- "type":"open-source",
110
- "license":"Other",
111
- "creation_date":1749427200000,
112
- "tasks":[
113
- "translation_from",
114
- "translation_to",
115
- "classification",
116
- "mmlu",
117
- "arc",
118
- "truthfulqa",
119
- "mgsm"
120
- ]
121
- },
122
  {
123
  "id":"arliai\/qwq-32b-arliai-rpr-v1",
124
  "name":"QwQ 32B RpR v1",
@@ -140,15 +100,15 @@
140
  ]
141
  },
142
  {
143
- "id":"baidu\/ernie-4.5-300b-a47b",
144
- "name":"ERNIE 4.5 300B A47B ",
145
- "provider_name":"Baidu",
146
- "cost":1.1,
147
- "hf_id":"baidu\/ERNIE-4.5-300B-A47B-PT",
148
- "size":300474051776.0,
149
- "type":"open-source",
150
- "license":"Apache 2.0",
151
- "creation_date":1751068800000,
152
  "tasks":[
153
  "translation_from",
154
  "translation_to",
@@ -220,15 +180,35 @@
220
  ]
221
  },
222
  {
223
- "id":"eleutherai\/llemma_7b",
224
- "name":"Llemma 7b",
225
- "provider_name":"EleutherAI",
226
- "cost":1.2,
227
- "hf_id":"EleutherAI\/llemma_7b",
228
- "size":null,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
229
  "type":"open-source",
230
- "license":"Llama2",
231
- "creation_date":1694476800000,
232
  "tasks":[
233
  "translation_from",
234
  "translation_to",
@@ -299,26 +279,6 @@
299
  "mgsm"
300
  ]
301
  },
302
- {
303
- "id":"google\/gemma-2-9b-it",
304
- "name":"Gemma 2 9B",
305
- "provider_name":"Google",
306
- "cost":0.0,
307
- "hf_id":"google\/gemma-2-9b-it",
308
- "size":9241705984.0,
309
- "type":"open-source",
310
- "license":"Gemma",
311
- "creation_date":1719187200000,
312
- "tasks":[
313
- "translation_from",
314
- "translation_to",
315
- "classification",
316
- "mmlu",
317
- "arc",
318
- "truthfulqa",
319
- "mgsm"
320
- ]
321
- },
322
  {
323
  "id":"google\/gemma-3-12b-it",
324
  "name":"Gemma 3 12B",
@@ -359,46 +319,6 @@
359
  "mgsm"
360
  ]
361
  },
362
- {
363
- "id":"google\/gemma-3-4b-it",
364
- "name":"Gemma 3 4B",
365
- "provider_name":"Google",
366
- "cost":0.0,
367
- "hf_id":"google\/gemma-3-4b-it",
368
- "size":4300079472.0,
369
- "type":"open-source",
370
- "license":"Gemma",
371
- "creation_date":1740009600000,
372
- "tasks":[
373
- "translation_from",
374
- "translation_to",
375
- "classification",
376
- "mmlu",
377
- "arc",
378
- "truthfulqa",
379
- "mgsm"
380
- ]
381
- },
382
- {
383
- "id":"liquid\/lfm-7b",
384
- "name":"LFM 7B",
385
- "provider_name":"Liquid",
386
- "cost":0.01,
387
- "hf_id":null,
388
- "size":null,
389
- "type":"closed-source",
390
- "license":null,
391
- "creation_date":1737763200000,
392
- "tasks":[
393
- "translation_from",
394
- "translation_to",
395
- "classification",
396
- "mmlu",
397
- "arc",
398
- "truthfulqa",
399
- "mgsm"
400
- ]
401
- },
402
  {
403
  "id":"meta-llama\/llama-3-70b-instruct",
404
  "name":"Llama 3 70B Instruct",
@@ -519,6 +439,26 @@
519
  "mgsm"
520
  ]
521
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
522
  {
523
  "id":"mistralai\/mistral-nemo",
524
  "name":"Mistral Nemo",
@@ -580,15 +520,15 @@
580
  ]
581
  },
582
  {
583
- "id":"mistralai\/mixtral-8x7b-instruct",
584
- "name":"Mixtral 8x7B Instruct",
585
- "provider_name":"Mistral",
586
- "cost":0.24,
587
- "hf_id":"mistralai\/Mixtral-8x7B-Instruct-v0.1",
588
- "size":46702792704.0,
589
  "type":"open-source",
590
- "license":"Apache 2.0",
591
- "creation_date":1702166400000,
592
  "tasks":[
593
  "translation_from",
594
  "translation_to",
@@ -600,15 +540,15 @@
600
  ]
601
  },
602
  {
603
- "id":"moonshotai\/kimi-k2",
604
- "name":"Kimi K2",
605
- "provider_name":"MoonshotAI",
606
- "cost":0.0,
607
- "hf_id":"moonshotai\/Kimi-K2-Instruct",
608
- "size":null,
609
  "type":"open-source",
610
- "license":"Other",
611
- "creation_date":1752192000000,
612
  "tasks":[
613
  "translation_from",
614
  "translation_to",
@@ -620,15 +560,15 @@
620
  ]
621
  },
622
  {
623
- "id":"nousresearch\/deephermes-3-llama-3-8b-preview",
624
- "name":"DeepHermes 3 Llama 3 8B Preview",
625
- "provider_name":"Nous",
626
- "cost":0.0,
627
- "hf_id":"NousResearch\/DeepHermes-3-Llama-3-8B-Preview",
628
- "size":8030261248.0,
629
  "type":"open-source",
630
- "license":"Llama3",
631
- "creation_date":1739318400000,
632
  "tasks":[
633
  "translation_from",
634
  "translation_to",
@@ -799,26 +739,6 @@
799
  "mgsm"
800
  ]
801
  },
802
- {
803
- "id":"qwen\/qwen-2.5-72b-instruct",
804
- "name":"Qwen2.5 72B Instruct",
805
- "provider_name":"Qwen2.5 72B Instruct (free)",
806
- "cost":0.0,
807
- "hf_id":"Qwen\/Qwen2.5-72B-Instruct",
808
- "size":72706203648.0,
809
- "type":"open-source",
810
- "license":"Other",
811
- "creation_date":1726444800000,
812
- "tasks":[
813
- "translation_from",
814
- "translation_to",
815
- "classification",
816
- "mmlu",
817
- "arc",
818
- "truthfulqa",
819
- "mgsm"
820
- ]
821
- },
822
  {
823
  "id":"qwen\/qwen-2.5-coder-32b-instruct",
824
  "name":"Qwen2.5 Coder 32B Instruct",
@@ -899,6 +819,26 @@
899
  "mgsm"
900
  ]
901
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
902
  {
903
  "id":"tencent\/hunyuan-a13b-instruct",
904
  "name":"Hunyuan A13B Instruct",
@@ -920,15 +860,15 @@
920
  ]
921
  },
922
  {
923
- "id":"undi95\/remm-slerp-l2-13b",
924
- "name":"ReMM SLERP 13B",
925
- "provider_name":"ReMM SLERP 13B",
926
- "cost":0.65,
927
- "hf_id":"Undi95\/ReMM-SLERP-L2-13B",
928
- "size":null,
929
  "type":"open-source",
930
- "license":"Cc By Nc 4.0",
931
- "creation_date":1693785600000,
932
  "tasks":[
933
  "translation_from",
934
  "translation_to",
 
1
  [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  {
3
  "id":"amazon\/nova-micro-v1",
4
  "name":"Nova Micro 1.0",
 
20
  ]
21
  },
22
  {
23
+ "id":"anthropic\/claude-3-haiku",
24
+ "name":"Claude 3 Haiku",
25
+ "provider_name":"Anthropic",
26
+ "cost":1.25,
27
+ "hf_id":null,
28
+ "size":null,
29
+ "type":"closed-source",
30
+ "license":null,
31
+ "creation_date":1710288000000,
32
  "tasks":[
33
  "translation_from",
34
  "translation_to",
 
79
  "mgsm"
80
  ]
81
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
82
  {
83
  "id":"arliai\/qwq-32b-arliai-rpr-v1",
84
  "name":"QwQ 32B RpR v1",
 
100
  ]
101
  },
102
  {
103
+ "id":"cohere\/command-r-08-2024",
104
+ "name":"Command R (08-2024)",
105
+ "provider_name":"Cohere",
106
+ "cost":0.6,
107
+ "hf_id":null,
108
+ "size":null,
109
+ "type":"closed-source",
110
+ "license":null,
111
+ "creation_date":1724976000000,
112
  "tasks":[
113
  "translation_from",
114
  "translation_to",
 
180
  ]
181
  },
182
  {
183
+ "id":"deepseek\/deepseek-r1",
184
+ "name":"R1",
185
+ "provider_name":"DeepSeek",
186
+ "cost":0.0,
187
+ "hf_id":"deepseek-ai\/DeepSeek-R1",
188
+ "size":684531386000.0,
189
+ "type":"open-source",
190
+ "license":"Mit",
191
+ "creation_date":1737331200000,
192
+ "tasks":[
193
+ "translation_from",
194
+ "translation_to",
195
+ "classification",
196
+ "mmlu",
197
+ "arc",
198
+ "truthfulqa",
199
+ "mgsm"
200
+ ]
201
+ },
202
+ {
203
+ "id":"deepseek\/deepseek-r1-0528-qwen3-8b",
204
+ "name":"Deepseek R1 0528 Qwen3 8B",
205
+ "provider_name":"DeepSeek",
206
+ "cost":0.0,
207
+ "hf_id":"deepseek-ai\/DeepSeek-R1-0528-Qwen3-8B",
208
+ "size":8190735360.0,
209
  "type":"open-source",
210
+ "license":"Mit",
211
+ "creation_date":1748476800000,
212
  "tasks":[
213
  "translation_from",
214
  "translation_to",
 
279
  "mgsm"
280
  ]
281
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
282
  {
283
  "id":"google\/gemma-3-12b-it",
284
  "name":"Gemma 3 12B",
 
319
  "mgsm"
320
  ]
321
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
322
  {
323
  "id":"meta-llama\/llama-3-70b-instruct",
324
  "name":"Llama 3 70B Instruct",
 
439
  "mgsm"
440
  ]
441
  },
442
+ {
443
+ "id":"mistralai\/mistral-7b-instruct-v0.3",
444
+ "name":"Mistral 7B Instruct v0.3",
445
+ "provider_name":"Mistral",
446
+ "cost":0.05,
447
+ "hf_id":"mistralai\/Mistral-7B-Instruct-v0.3",
448
+ "size":7248023552.0,
449
+ "type":"open-source",
450
+ "license":"Apache 2.0",
451
+ "creation_date":1716336000000,
452
+ "tasks":[
453
+ "translation_from",
454
+ "translation_to",
455
+ "classification",
456
+ "mmlu",
457
+ "arc",
458
+ "truthfulqa",
459
+ "mgsm"
460
+ ]
461
+ },
462
  {
463
  "id":"mistralai\/mistral-nemo",
464
  "name":"Mistral Nemo",
 
520
  ]
521
  },
522
  {
523
+ "id":"moonshotai\/kimi-k2",
524
+ "name":"Kimi K2",
525
+ "provider_name":"MoonshotAI",
526
+ "cost":0.0,
527
+ "hf_id":"moonshotai\/Kimi-K2-Instruct",
528
+ "size":null,
529
  "type":"open-source",
530
+ "license":"Other",
531
+ "creation_date":1752192000000,
532
  "tasks":[
533
  "translation_from",
534
  "translation_to",
 
540
  ]
541
  },
542
  {
543
+ "id":"neversleep\/llama-3-lumimaid-70b",
544
+ "name":"Llama 3 Lumimaid 70B",
545
+ "provider_name":"NeverSleep",
546
+ "cost":6.0,
547
+ "hf_id":"NeverSleep\/Llama-3-Lumimaid-70B-v0.1",
548
+ "size":70553706496.0,
549
  "type":"open-source",
550
+ "license":"Cc By Nc 4.0",
551
+ "creation_date":1714262400000,
552
  "tasks":[
553
  "translation_from",
554
  "translation_to",
 
560
  ]
561
  },
562
  {
563
+ "id":"nvidia\/llama-3.1-nemotron-70b-instruct",
564
+ "name":"Llama 3.1 Nemotron 70B Instruct",
565
+ "provider_name":"NVIDIA",
566
+ "cost":0.3,
567
+ "hf_id":"nvidia\/Llama-3.1-Nemotron-70B-Instruct-HF",
568
+ "size":70553706496.0,
569
  "type":"open-source",
570
+ "license":"Llama3.1",
571
+ "creation_date":1728691200000,
572
  "tasks":[
573
  "translation_from",
574
  "translation_to",
 
739
  "mgsm"
740
  ]
741
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
742
  {
743
  "id":"qwen\/qwen-2.5-coder-32b-instruct",
744
  "name":"Qwen2.5 Coder 32B Instruct",
 
819
  "mgsm"
820
  ]
821
  },
822
+ {
823
+ "id":"scb10x\/llama3.1-typhoon2-70b-instruct",
824
+ "name":"Typhoon2 70B Instruct",
825
+ "provider_name":"Typhoon2 70B Instruct",
826
+ "cost":0.88,
827
+ "hf_id":"scb10x\/llama3.1-typhoon2-70b-instruct",
828
+ "size":70553706496.0,
829
+ "type":"open-source",
830
+ "license":"Llama3.1",
831
+ "creation_date":1734220800000,
832
+ "tasks":[
833
+ "translation_from",
834
+ "translation_to",
835
+ "classification",
836
+ "mmlu",
837
+ "arc",
838
+ "truthfulqa",
839
+ "mgsm"
840
+ ]
841
+ },
842
  {
843
  "id":"tencent\/hunyuan-a13b-instruct",
844
  "name":"Hunyuan A13B Instruct",
 
860
  ]
861
  },
862
  {
863
+ "id":"thedrummer\/anubis-pro-105b-v1",
864
+ "name":"Anubis Pro 105B V1",
865
+ "provider_name":"TheDrummer",
866
+ "cost":1.0,
867
+ "hf_id":"TheDrummer\/Anubis-Pro-105B-v1",
868
+ "size":104779882496.0,
869
  "type":"open-source",
870
+ "license":"Other",
871
+ "creation_date":1738454400000,
872
  "tasks":[
873
  "translation_from",
874
  "translation_to",
results.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce3638aedf7fd3bd28f92814be7c10a5a8f748c5cc601ab6041be798710dff54
3
- size 11677172
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:649509b8373b76e51a79809fdab77badff44e5536ca3bd8e3eb409f406b6ecda
3
+ size 13260774