Spaces:
Runtime error
Runtime error
Upload from GitHub Actions: Update evaluation results
Browse files- languages.json +2 -2
- models.json +118 -178
- results.json +2 -2
languages.json
CHANGED
@@ -79,7 +79,7 @@
|
|
79 |
"family":"Indo-European",
|
80 |
"flores_path":"fra_Latn",
|
81 |
"fleurs_tag":"fr_fr",
|
82 |
-
"commonvoice_hours":
|
83 |
"commonvoice_locale":"fr",
|
84 |
"in_benchmark":true
|
85 |
},
|
@@ -2167,7 +2167,7 @@
|
|
2167 |
"family":"Indo-European",
|
2168 |
"flores_path":"glg_Latn",
|
2169 |
"fleurs_tag":"gl_es",
|
2170 |
-
"commonvoice_hours":
|
2171 |
"commonvoice_locale":"gl",
|
2172 |
"in_benchmark":true
|
2173 |
},
|
|
|
79 |
"family":"Indo-European",
|
80 |
"flores_path":"fra_Latn",
|
81 |
"fleurs_tag":"fr_fr",
|
82 |
+
"commonvoice_hours":1073.0,
|
83 |
"commonvoice_locale":"fr",
|
84 |
"in_benchmark":true
|
85 |
},
|
|
|
2167 |
"family":"Indo-European",
|
2168 |
"flores_path":"glg_Latn",
|
2169 |
"fleurs_tag":"gl_es",
|
2170 |
+
"commonvoice_hours":164.0,
|
2171 |
"commonvoice_locale":"gl",
|
2172 |
"in_benchmark":true
|
2173 |
},
|
models.json
CHANGED
@@ -1,24 +1,4 @@
|
|
1 |
[
|
2 |
-
{
|
3 |
-
"id":"ai21\/jamba-large-1.7",
|
4 |
-
"name":"Jamba Large 1.7",
|
5 |
-
"provider_name":"AI21",
|
6 |
-
"cost":8.0,
|
7 |
-
"hf_id":"ai21labs\/AI21-Jamba-Large-1.7",
|
8 |
-
"size":398555145696.0,
|
9 |
-
"type":"open-source",
|
10 |
-
"license":"Other",
|
11 |
-
"creation_date":1751414400000,
|
12 |
-
"tasks":[
|
13 |
-
"translation_from",
|
14 |
-
"translation_to",
|
15 |
-
"classification",
|
16 |
-
"mmlu",
|
17 |
-
"arc",
|
18 |
-
"truthfulqa",
|
19 |
-
"mgsm"
|
20 |
-
]
|
21 |
-
},
|
22 |
{
|
23 |
"id":"amazon\/nova-micro-v1",
|
24 |
"name":"Nova Micro 1.0",
|
@@ -40,15 +20,15 @@
|
|
40 |
]
|
41 |
},
|
42 |
{
|
43 |
-
"id":"
|
44 |
-
"name":"
|
45 |
-
"provider_name":"
|
46 |
-
"cost":
|
47 |
-
"hf_id":
|
48 |
-
"size":
|
49 |
-
"type":"
|
50 |
-
"license":
|
51 |
-
"creation_date":
|
52 |
"tasks":[
|
53 |
"translation_from",
|
54 |
"translation_to",
|
@@ -99,26 +79,6 @@
|
|
99 |
"mgsm"
|
100 |
]
|
101 |
},
|
102 |
-
{
|
103 |
-
"id":"arcee-ai\/virtuoso-large",
|
104 |
-
"name":"Virtuoso Large",
|
105 |
-
"provider_name":"Arcee AI",
|
106 |
-
"cost":1.2,
|
107 |
-
"hf_id":"arcee-ai\/Virtuoso-Large",
|
108 |
-
"size":72706203648.0,
|
109 |
-
"type":"open-source",
|
110 |
-
"license":"Other",
|
111 |
-
"creation_date":1749427200000,
|
112 |
-
"tasks":[
|
113 |
-
"translation_from",
|
114 |
-
"translation_to",
|
115 |
-
"classification",
|
116 |
-
"mmlu",
|
117 |
-
"arc",
|
118 |
-
"truthfulqa",
|
119 |
-
"mgsm"
|
120 |
-
]
|
121 |
-
},
|
122 |
{
|
123 |
"id":"arliai\/qwq-32b-arliai-rpr-v1",
|
124 |
"name":"QwQ 32B RpR v1",
|
@@ -140,15 +100,15 @@
|
|
140 |
]
|
141 |
},
|
142 |
{
|
143 |
-
"id":"
|
144 |
-
"name":"
|
145 |
-
"provider_name":"
|
146 |
-
"cost":
|
147 |
-
"hf_id":
|
148 |
-
"size":
|
149 |
-
"type":"
|
150 |
-
"license":
|
151 |
-
"creation_date":
|
152 |
"tasks":[
|
153 |
"translation_from",
|
154 |
"translation_to",
|
@@ -220,15 +180,35 @@
|
|
220 |
]
|
221 |
},
|
222 |
{
|
223 |
-
"id":"
|
224 |
-
"name":"
|
225 |
-
"provider_name":"
|
226 |
-
"cost":
|
227 |
-
"hf_id":"
|
228 |
-
"size":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
229 |
"type":"open-source",
|
230 |
-
"license":"
|
231 |
-
"creation_date":
|
232 |
"tasks":[
|
233 |
"translation_from",
|
234 |
"translation_to",
|
@@ -299,26 +279,6 @@
|
|
299 |
"mgsm"
|
300 |
]
|
301 |
},
|
302 |
-
{
|
303 |
-
"id":"google\/gemma-2-9b-it",
|
304 |
-
"name":"Gemma 2 9B",
|
305 |
-
"provider_name":"Google",
|
306 |
-
"cost":0.0,
|
307 |
-
"hf_id":"google\/gemma-2-9b-it",
|
308 |
-
"size":9241705984.0,
|
309 |
-
"type":"open-source",
|
310 |
-
"license":"Gemma",
|
311 |
-
"creation_date":1719187200000,
|
312 |
-
"tasks":[
|
313 |
-
"translation_from",
|
314 |
-
"translation_to",
|
315 |
-
"classification",
|
316 |
-
"mmlu",
|
317 |
-
"arc",
|
318 |
-
"truthfulqa",
|
319 |
-
"mgsm"
|
320 |
-
]
|
321 |
-
},
|
322 |
{
|
323 |
"id":"google\/gemma-3-12b-it",
|
324 |
"name":"Gemma 3 12B",
|
@@ -359,46 +319,6 @@
|
|
359 |
"mgsm"
|
360 |
]
|
361 |
},
|
362 |
-
{
|
363 |
-
"id":"google\/gemma-3-4b-it",
|
364 |
-
"name":"Gemma 3 4B",
|
365 |
-
"provider_name":"Google",
|
366 |
-
"cost":0.0,
|
367 |
-
"hf_id":"google\/gemma-3-4b-it",
|
368 |
-
"size":4300079472.0,
|
369 |
-
"type":"open-source",
|
370 |
-
"license":"Gemma",
|
371 |
-
"creation_date":1740009600000,
|
372 |
-
"tasks":[
|
373 |
-
"translation_from",
|
374 |
-
"translation_to",
|
375 |
-
"classification",
|
376 |
-
"mmlu",
|
377 |
-
"arc",
|
378 |
-
"truthfulqa",
|
379 |
-
"mgsm"
|
380 |
-
]
|
381 |
-
},
|
382 |
-
{
|
383 |
-
"id":"liquid\/lfm-7b",
|
384 |
-
"name":"LFM 7B",
|
385 |
-
"provider_name":"Liquid",
|
386 |
-
"cost":0.01,
|
387 |
-
"hf_id":null,
|
388 |
-
"size":null,
|
389 |
-
"type":"closed-source",
|
390 |
-
"license":null,
|
391 |
-
"creation_date":1737763200000,
|
392 |
-
"tasks":[
|
393 |
-
"translation_from",
|
394 |
-
"translation_to",
|
395 |
-
"classification",
|
396 |
-
"mmlu",
|
397 |
-
"arc",
|
398 |
-
"truthfulqa",
|
399 |
-
"mgsm"
|
400 |
-
]
|
401 |
-
},
|
402 |
{
|
403 |
"id":"meta-llama\/llama-3-70b-instruct",
|
404 |
"name":"Llama 3 70B Instruct",
|
@@ -519,6 +439,26 @@
|
|
519 |
"mgsm"
|
520 |
]
|
521 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
522 |
{
|
523 |
"id":"mistralai\/mistral-nemo",
|
524 |
"name":"Mistral Nemo",
|
@@ -580,15 +520,15 @@
|
|
580 |
]
|
581 |
},
|
582 |
{
|
583 |
-
"id":"
|
584 |
-
"name":"
|
585 |
-
"provider_name":"
|
586 |
-
"cost":0.
|
587 |
-
"hf_id":"
|
588 |
-
"size":
|
589 |
"type":"open-source",
|
590 |
-
"license":"
|
591 |
-
"creation_date":
|
592 |
"tasks":[
|
593 |
"translation_from",
|
594 |
"translation_to",
|
@@ -600,15 +540,15 @@
|
|
600 |
]
|
601 |
},
|
602 |
{
|
603 |
-
"id":"
|
604 |
-
"name":"
|
605 |
-
"provider_name":"
|
606 |
-
"cost":
|
607 |
-
"hf_id":"
|
608 |
-
"size":
|
609 |
"type":"open-source",
|
610 |
-
"license":"
|
611 |
-
"creation_date":
|
612 |
"tasks":[
|
613 |
"translation_from",
|
614 |
"translation_to",
|
@@ -620,15 +560,15 @@
|
|
620 |
]
|
621 |
},
|
622 |
{
|
623 |
-
"id":"
|
624 |
-
"name":"
|
625 |
-
"provider_name":"
|
626 |
-
"cost":0.
|
627 |
-
"hf_id":"
|
628 |
-
"size":
|
629 |
"type":"open-source",
|
630 |
-
"license":"Llama3",
|
631 |
-
"creation_date":
|
632 |
"tasks":[
|
633 |
"translation_from",
|
634 |
"translation_to",
|
@@ -799,26 +739,6 @@
|
|
799 |
"mgsm"
|
800 |
]
|
801 |
},
|
802 |
-
{
|
803 |
-
"id":"qwen\/qwen-2.5-72b-instruct",
|
804 |
-
"name":"Qwen2.5 72B Instruct",
|
805 |
-
"provider_name":"Qwen2.5 72B Instruct (free)",
|
806 |
-
"cost":0.0,
|
807 |
-
"hf_id":"Qwen\/Qwen2.5-72B-Instruct",
|
808 |
-
"size":72706203648.0,
|
809 |
-
"type":"open-source",
|
810 |
-
"license":"Other",
|
811 |
-
"creation_date":1726444800000,
|
812 |
-
"tasks":[
|
813 |
-
"translation_from",
|
814 |
-
"translation_to",
|
815 |
-
"classification",
|
816 |
-
"mmlu",
|
817 |
-
"arc",
|
818 |
-
"truthfulqa",
|
819 |
-
"mgsm"
|
820 |
-
]
|
821 |
-
},
|
822 |
{
|
823 |
"id":"qwen\/qwen-2.5-coder-32b-instruct",
|
824 |
"name":"Qwen2.5 Coder 32B Instruct",
|
@@ -899,6 +819,26 @@
|
|
899 |
"mgsm"
|
900 |
]
|
901 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
902 |
{
|
903 |
"id":"tencent\/hunyuan-a13b-instruct",
|
904 |
"name":"Hunyuan A13B Instruct",
|
@@ -920,15 +860,15 @@
|
|
920 |
]
|
921 |
},
|
922 |
{
|
923 |
-
"id":"
|
924 |
-
"name":"
|
925 |
-
"provider_name":"
|
926 |
-
"cost":0
|
927 |
-
"hf_id":"
|
928 |
-
"size":
|
929 |
"type":"open-source",
|
930 |
-
"license":"
|
931 |
-
"creation_date":
|
932 |
"tasks":[
|
933 |
"translation_from",
|
934 |
"translation_to",
|
|
|
1 |
[
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2 |
{
|
3 |
"id":"amazon\/nova-micro-v1",
|
4 |
"name":"Nova Micro 1.0",
|
|
|
20 |
]
|
21 |
},
|
22 |
{
|
23 |
+
"id":"anthropic\/claude-3-haiku",
|
24 |
+
"name":"Claude 3 Haiku",
|
25 |
+
"provider_name":"Anthropic",
|
26 |
+
"cost":1.25,
|
27 |
+
"hf_id":null,
|
28 |
+
"size":null,
|
29 |
+
"type":"closed-source",
|
30 |
+
"license":null,
|
31 |
+
"creation_date":1710288000000,
|
32 |
"tasks":[
|
33 |
"translation_from",
|
34 |
"translation_to",
|
|
|
79 |
"mgsm"
|
80 |
]
|
81 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
82 |
{
|
83 |
"id":"arliai\/qwq-32b-arliai-rpr-v1",
|
84 |
"name":"QwQ 32B RpR v1",
|
|
|
100 |
]
|
101 |
},
|
102 |
{
|
103 |
+
"id":"cohere\/command-r-08-2024",
|
104 |
+
"name":"Command R (08-2024)",
|
105 |
+
"provider_name":"Cohere",
|
106 |
+
"cost":0.6,
|
107 |
+
"hf_id":null,
|
108 |
+
"size":null,
|
109 |
+
"type":"closed-source",
|
110 |
+
"license":null,
|
111 |
+
"creation_date":1724976000000,
|
112 |
"tasks":[
|
113 |
"translation_from",
|
114 |
"translation_to",
|
|
|
180 |
]
|
181 |
},
|
182 |
{
|
183 |
+
"id":"deepseek\/deepseek-r1",
|
184 |
+
"name":"R1",
|
185 |
+
"provider_name":"DeepSeek",
|
186 |
+
"cost":0.0,
|
187 |
+
"hf_id":"deepseek-ai\/DeepSeek-R1",
|
188 |
+
"size":684531386000.0,
|
189 |
+
"type":"open-source",
|
190 |
+
"license":"Mit",
|
191 |
+
"creation_date":1737331200000,
|
192 |
+
"tasks":[
|
193 |
+
"translation_from",
|
194 |
+
"translation_to",
|
195 |
+
"classification",
|
196 |
+
"mmlu",
|
197 |
+
"arc",
|
198 |
+
"truthfulqa",
|
199 |
+
"mgsm"
|
200 |
+
]
|
201 |
+
},
|
202 |
+
{
|
203 |
+
"id":"deepseek\/deepseek-r1-0528-qwen3-8b",
|
204 |
+
"name":"Deepseek R1 0528 Qwen3 8B",
|
205 |
+
"provider_name":"DeepSeek",
|
206 |
+
"cost":0.0,
|
207 |
+
"hf_id":"deepseek-ai\/DeepSeek-R1-0528-Qwen3-8B",
|
208 |
+
"size":8190735360.0,
|
209 |
"type":"open-source",
|
210 |
+
"license":"Mit",
|
211 |
+
"creation_date":1748476800000,
|
212 |
"tasks":[
|
213 |
"translation_from",
|
214 |
"translation_to",
|
|
|
279 |
"mgsm"
|
280 |
]
|
281 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
282 |
{
|
283 |
"id":"google\/gemma-3-12b-it",
|
284 |
"name":"Gemma 3 12B",
|
|
|
319 |
"mgsm"
|
320 |
]
|
321 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
322 |
{
|
323 |
"id":"meta-llama\/llama-3-70b-instruct",
|
324 |
"name":"Llama 3 70B Instruct",
|
|
|
439 |
"mgsm"
|
440 |
]
|
441 |
},
|
442 |
+
{
|
443 |
+
"id":"mistralai\/mistral-7b-instruct-v0.3",
|
444 |
+
"name":"Mistral 7B Instruct v0.3",
|
445 |
+
"provider_name":"Mistral",
|
446 |
+
"cost":0.05,
|
447 |
+
"hf_id":"mistralai\/Mistral-7B-Instruct-v0.3",
|
448 |
+
"size":7248023552.0,
|
449 |
+
"type":"open-source",
|
450 |
+
"license":"Apache 2.0",
|
451 |
+
"creation_date":1716336000000,
|
452 |
+
"tasks":[
|
453 |
+
"translation_from",
|
454 |
+
"translation_to",
|
455 |
+
"classification",
|
456 |
+
"mmlu",
|
457 |
+
"arc",
|
458 |
+
"truthfulqa",
|
459 |
+
"mgsm"
|
460 |
+
]
|
461 |
+
},
|
462 |
{
|
463 |
"id":"mistralai\/mistral-nemo",
|
464 |
"name":"Mistral Nemo",
|
|
|
520 |
]
|
521 |
},
|
522 |
{
|
523 |
+
"id":"moonshotai\/kimi-k2",
|
524 |
+
"name":"Kimi K2",
|
525 |
+
"provider_name":"MoonshotAI",
|
526 |
+
"cost":0.0,
|
527 |
+
"hf_id":"moonshotai\/Kimi-K2-Instruct",
|
528 |
+
"size":null,
|
529 |
"type":"open-source",
|
530 |
+
"license":"Other",
|
531 |
+
"creation_date":1752192000000,
|
532 |
"tasks":[
|
533 |
"translation_from",
|
534 |
"translation_to",
|
|
|
540 |
]
|
541 |
},
|
542 |
{
|
543 |
+
"id":"neversleep\/llama-3-lumimaid-70b",
|
544 |
+
"name":"Llama 3 Lumimaid 70B",
|
545 |
+
"provider_name":"NeverSleep",
|
546 |
+
"cost":6.0,
|
547 |
+
"hf_id":"NeverSleep\/Llama-3-Lumimaid-70B-v0.1",
|
548 |
+
"size":70553706496.0,
|
549 |
"type":"open-source",
|
550 |
+
"license":"Cc By Nc 4.0",
|
551 |
+
"creation_date":1714262400000,
|
552 |
"tasks":[
|
553 |
"translation_from",
|
554 |
"translation_to",
|
|
|
560 |
]
|
561 |
},
|
562 |
{
|
563 |
+
"id":"nvidia\/llama-3.1-nemotron-70b-instruct",
|
564 |
+
"name":"Llama 3.1 Nemotron 70B Instruct",
|
565 |
+
"provider_name":"NVIDIA",
|
566 |
+
"cost":0.3,
|
567 |
+
"hf_id":"nvidia\/Llama-3.1-Nemotron-70B-Instruct-HF",
|
568 |
+
"size":70553706496.0,
|
569 |
"type":"open-source",
|
570 |
+
"license":"Llama3.1",
|
571 |
+
"creation_date":1728691200000,
|
572 |
"tasks":[
|
573 |
"translation_from",
|
574 |
"translation_to",
|
|
|
739 |
"mgsm"
|
740 |
]
|
741 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
742 |
{
|
743 |
"id":"qwen\/qwen-2.5-coder-32b-instruct",
|
744 |
"name":"Qwen2.5 Coder 32B Instruct",
|
|
|
819 |
"mgsm"
|
820 |
]
|
821 |
},
|
822 |
+
{
|
823 |
+
"id":"scb10x\/llama3.1-typhoon2-70b-instruct",
|
824 |
+
"name":"Typhoon2 70B Instruct",
|
825 |
+
"provider_name":"Typhoon2 70B Instruct",
|
826 |
+
"cost":0.88,
|
827 |
+
"hf_id":"scb10x\/llama3.1-typhoon2-70b-instruct",
|
828 |
+
"size":70553706496.0,
|
829 |
+
"type":"open-source",
|
830 |
+
"license":"Llama3.1",
|
831 |
+
"creation_date":1734220800000,
|
832 |
+
"tasks":[
|
833 |
+
"translation_from",
|
834 |
+
"translation_to",
|
835 |
+
"classification",
|
836 |
+
"mmlu",
|
837 |
+
"arc",
|
838 |
+
"truthfulqa",
|
839 |
+
"mgsm"
|
840 |
+
]
|
841 |
+
},
|
842 |
{
|
843 |
"id":"tencent\/hunyuan-a13b-instruct",
|
844 |
"name":"Hunyuan A13B Instruct",
|
|
|
860 |
]
|
861 |
},
|
862 |
{
|
863 |
+
"id":"thedrummer\/anubis-pro-105b-v1",
|
864 |
+
"name":"Anubis Pro 105B V1",
|
865 |
+
"provider_name":"TheDrummer",
|
866 |
+
"cost":1.0,
|
867 |
+
"hf_id":"TheDrummer\/Anubis-Pro-105B-v1",
|
868 |
+
"size":104779882496.0,
|
869 |
"type":"open-source",
|
870 |
+
"license":"Other",
|
871 |
+
"creation_date":1738454400000,
|
872 |
"tasks":[
|
873 |
"translation_from",
|
874 |
"translation_to",
|
results.json
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:649509b8373b76e51a79809fdab77badff44e5536ca3bd8e3eb409f406b6ecda
|
3 |
+
size 13260774
|