Spaces:
Running
Running
Upload from GitHub Actions: Merge pull request #7 from datenlabor-bmz/jn-dev
Browse files
- .gitattributes +1 -0
- evals/data_flow_architecture.png +3 -0
- evals/models.py +92 -23
- languages.json +31 -31
- models.json +12 -12
.gitattributes
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
evals/data_flow_architecture.png filter=lfs diff=lfs merge=lfs -text
|
evals/data_flow_architecture.png
ADDED
|
Git LFS Details
|
evals/models.py
CHANGED
|
@@ -93,28 +93,91 @@ def get_model(permaslug):
|
|
| 93 |
|
| 94 |
@cache
|
| 95 |
def get_historical_popular_models(date: date):
|
| 96 |
-
|
| 97 |
-
|
| 98 |
-
|
| 99 |
-
|
| 100 |
-
|
| 101 |
-
|
| 102 |
-
|
| 103 |
-
|
| 104 |
-
|
| 105 |
-
|
| 106 |
-
|
| 107 |
-
|
| 108 |
-
|
| 109 |
-
|
| 110 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 111 |
def get_current_popular_models(date: date):
|
| 112 |
-
|
| 113 |
-
|
| 114 |
-
|
| 115 |
-
|
| 116 |
-
|
| 117 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 118 |
|
| 119 |
|
| 120 |
def get_translation_models():
|
|
@@ -249,8 +312,14 @@ def get_hf_metadata(row):
|
|
| 249 |
|
| 250 |
|
| 251 |
def get_cost(row):
|
| 252 |
-
|
| 253 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 254 |
|
| 255 |
|
| 256 |
@cache
|
|
|
|
| 93 |
|
| 94 |
def _aggregate_ranking_counts(raw):
    """Sum the usage counts per base model found in an OpenRouter rankings page.

    The page embeds its ranking data as an escaped JSON string, so the
    pairs appear as ``\\"count\\":<number>, ... \\"model_permaslug\\":\\"<slug>\\"``.

    Args:
        raw: Text of the rankings page.

    Returns:
        A dict mapping base model slug (variant suffix after ``:`` removed)
        to the summed count, or ``None`` when the page contains no
        count/permaslug pairs at all.

    Raises:
        ValueError: If a matched count is not a valid float (e.g. ``"1.2.3"``).
    """
    # Function-scope import, as in the original code; the file-level import
    # block is not visible from here.
    import re

    # Matches escaped-JSON pairs: \"count\":number ... \"model_permaslug\":\"model/name\"
    pattern = r'\\\"count\\\":([\d.]+).*?\\\"model_permaslug\\\":\\\"([^\\\"]+)\\\"'
    matches = re.findall(pattern, raw)
    if not matches:
        return None

    totals = {}
    for count_str, model_slug in matches:
        count = float(count_str)
        # Skip OpenRouter's own pseudo-models and the aggregated "Others" bucket.
        if model_slug.startswith("openrouter") or model_slug == "Others":
            continue
        # Variants such as "vendor/model:free" are counted under "vendor/model".
        base_model = model_slug.split(":")[0]
        totals[base_model] = totals.get(base_model, 0) + count
    return totals


def _fetch_popular_models(url, limit, label, data_label):
    """Fetch a rankings page and return its ``limit`` most used models.

    Args:
        url: Rankings page to download with the module's ``get``.
        limit: Maximum number of models to return.
        label: "historical" or "current"; only used in log messages.
        data_label: Wording used in the "no data found" log message.

    Returns:
        A list of ``{"slug": str, "count": int}`` dicts sorted by descending
        count, or ``[]`` when the page could not be fetched or parsed.
    """
    try:
        raw = get(url).text
        totals = _aggregate_ranking_counts(raw)
    except Exception as e:
        # Deliberate best-effort boundary: any fetch or parse failure yields [].
        # NOTE(review): the message announces a static fallback, but this
        # function only returns []; the fallback, if any, is the caller's job.
        print(f"⚠️ Error fetching OpenRouter {label} rankings: {e}")
        print("🔄 Falling back to static model list")
        return []

    if totals is None:
        print(f"⚠️ Could not find {data_label} ranking data in OpenRouter response")
        return []

    ranked = sorted(totals.items(), key=lambda item: item[1], reverse=True)
    result = [{"slug": slug, "count": int(total)} for slug, total in ranked[:limit]]

    print(f"✅ {label.capitalize()} OpenRouter models: {len(result)} models fetched")
    if result:
        print(f" Top 5: {[m['slug'] for m in result[:5]]}")
        print(f" Sample counts: {[m['count'] for m in result[:3]]}")
    return result


@cache
def get_historical_popular_models(date: date):
    """Return the top 20 models from the default OpenRouter rankings page.

    Args:
        date: Not used in the body; it only acts as the ``@cache`` key, so
            the page is fetched once per distinct date value.

    Returns:
        Up to 20 ``{"slug": str, "count": int}`` dicts, most used first;
        ``[]`` on any fetch or parse failure. The list object is cached, so
        callers should not mutate it.
    """
    return _fetch_popular_models(
        "https://openrouter.ai/rankings",
        limit=20,
        label="historical",
        data_label="model",
    )


@cache
def get_current_popular_models(date: date):
    """Return the top 10 models from the daily OpenRouter rankings page.

    Args:
        date: Not used in the body; it only acts as the ``@cache`` key, so
            the page is fetched once per distinct date value.

    Returns:
        Up to 10 ``{"slug": str, "count": int}`` dicts, most used first;
        ``[]`` on any fetch or parse failure. The list object is cached, so
        callers should not mutate it.
    """
    return _fetch_popular_models(
        "https://openrouter.ai/rankings?view=day",
        limit=10,
        label="current",
        data_label="daily",
    )
|
| 181 |
|
| 182 |
|
| 183 |
def get_translation_models():
|
|
|
|
| 312 |
|
| 313 |
|
| 314 |
def get_cost(row):
    """
    Return the completion price of a model scaled by one million, or None.

    row: a row from the OpenRouter models dataframe; the price is read from
    row["endpoint"]["pricing"]["completion"] (presumably a per-token price,
    which would make the result a price per million tokens).

    Returns the price multiplied by 1_000_000 and rounded to 2 decimals, or
    None when the pricing entry is missing, is None, or is not numeric.
    """
    try:
        per_unit = float(row["endpoint"]["pricing"]["completion"])
    except (TypeError, KeyError, ValueError):
        # TypeError: endpoint/pricing/value is None or not subscriptable;
        # KeyError: a level of the nested mapping is absent;
        # ValueError: the value is a string that is not a number.
        return None
    return round(per_unit * 1_000_000, 2)
|
| 323 |
|
| 324 |
|
| 325 |
@cache
|
languages.json
CHANGED
|
@@ -7,7 +7,7 @@
|
|
| 7 |
"family":"Indo-European",
|
| 8 |
"flores_path":"eng_Latn",
|
| 9 |
"fleurs_tag":"en_us",
|
| 10 |
-
"commonvoice_hours":
|
| 11 |
"commonvoice_locale":"en",
|
| 12 |
"in_benchmark":true
|
| 13 |
},
|
|
@@ -79,7 +79,7 @@
|
|
| 79 |
"family":"Indo-European",
|
| 80 |
"flores_path":"fra_Latn",
|
| 81 |
"fleurs_tag":"fr_fr",
|
| 82 |
-
"commonvoice_hours":
|
| 83 |
"commonvoice_locale":"fr",
|
| 84 |
"in_benchmark":true
|
| 85 |
},
|
|
@@ -103,7 +103,7 @@
|
|
| 103 |
"family":"Indo-European",
|
| 104 |
"flores_path":"por_Latn",
|
| 105 |
"fleurs_tag":"pt_br",
|
| 106 |
-
"commonvoice_hours":
|
| 107 |
"commonvoice_locale":"pt",
|
| 108 |
"in_benchmark":true
|
| 109 |
},
|
|
@@ -115,7 +115,7 @@
|
|
| 115 |
"family":"Indo-European",
|
| 116 |
"flores_path":"pan_Guru",
|
| 117 |
"fleurs_tag":"pa_in",
|
| 118 |
-
"commonvoice_hours":2.
|
| 119 |
"commonvoice_locale":"pa-IN",
|
| 120 |
"in_benchmark":true
|
| 121 |
},
|
|
@@ -163,7 +163,7 @@
|
|
| 163 |
"family":"Indo-European",
|
| 164 |
"flores_path":"deu_Latn",
|
| 165 |
"fleurs_tag":"de_de",
|
| 166 |
-
"commonvoice_hours":
|
| 167 |
"commonvoice_locale":"de",
|
| 168 |
"in_benchmark":true
|
| 169 |
},
|
|
@@ -379,7 +379,7 @@
|
|
| 379 |
"family":"Indo-European",
|
| 380 |
"flores_path":null,
|
| 381 |
"fleurs_tag":"ps_af",
|
| 382 |
-
"commonvoice_hours":
|
| 383 |
"commonvoice_locale":"ps",
|
| 384 |
"in_benchmark":false
|
| 385 |
},
|
|
@@ -619,7 +619,7 @@
|
|
| 619 |
"family":"Indo-European",
|
| 620 |
"flores_path":"nld_Latn",
|
| 621 |
"fleurs_tag":"nl_nl",
|
| 622 |
-
"commonvoice_hours":
|
| 623 |
"commonvoice_locale":"nl",
|
| 624 |
"in_benchmark":true
|
| 625 |
},
|
|
@@ -655,7 +655,7 @@
|
|
| 655 |
"family":"Atlantic-Congo",
|
| 656 |
"flores_path":"yor_Latn",
|
| 657 |
"fleurs_tag":"yo_ng",
|
| 658 |
-
"commonvoice_hours":6.
|
| 659 |
"commonvoice_locale":"yo",
|
| 660 |
"in_benchmark":true
|
| 661 |
},
|
|
@@ -1099,7 +1099,7 @@
|
|
| 1099 |
"family":"Indo-European",
|
| 1100 |
"flores_path":"ckb_Arab",
|
| 1101 |
"fleurs_tag":"ckb_iq",
|
| 1102 |
-
"commonvoice_hours":
|
| 1103 |
"commonvoice_locale":"ckb",
|
| 1104 |
"in_benchmark":true
|
| 1105 |
},
|
|
@@ -1183,7 +1183,7 @@
|
|
| 1183 |
"family":"Indo-European",
|
| 1184 |
"flores_path":"bel_Cyrl",
|
| 1185 |
"fleurs_tag":"be_by",
|
| 1186 |
-
"commonvoice_hours":
|
| 1187 |
"commonvoice_locale":"be",
|
| 1188 |
"in_benchmark":true
|
| 1189 |
},
|
|
@@ -1243,7 +1243,7 @@
|
|
| 1243 |
"family":"Indo-European",
|
| 1244 |
"flores_path":"afr_Latn",
|
| 1245 |
"fleurs_tag":"af_za",
|
| 1246 |
-
"commonvoice_hours":0.
|
| 1247 |
"commonvoice_locale":"af",
|
| 1248 |
"in_benchmark":true
|
| 1249 |
},
|
|
@@ -1291,7 +1291,7 @@
|
|
| 1291 |
"family":"Indo-European",
|
| 1292 |
"flores_path":"cat_Latn",
|
| 1293 |
"fleurs_tag":"ca_es",
|
| 1294 |
-
"commonvoice_hours":
|
| 1295 |
"commonvoice_locale":"ca",
|
| 1296 |
"in_benchmark":true
|
| 1297 |
},
|
|
@@ -1303,7 +1303,7 @@
|
|
| 1303 |
"family":"Afro-Asiatic",
|
| 1304 |
"flores_path":"heb_Hebr",
|
| 1305 |
"fleurs_tag":"he_il",
|
| 1306 |
-
"commonvoice_hours":1.
|
| 1307 |
"commonvoice_locale":"he",
|
| 1308 |
"in_benchmark":true
|
| 1309 |
},
|
|
@@ -1375,7 +1375,7 @@
|
|
| 1375 |
"family":"Turkic",
|
| 1376 |
"flores_path":"uig_Arab",
|
| 1377 |
"fleurs_tag":null,
|
| 1378 |
-
"commonvoice_hours":
|
| 1379 |
"commonvoice_locale":"ug",
|
| 1380 |
"in_benchmark":true
|
| 1381 |
},
|
|
@@ -1747,7 +1747,7 @@
|
|
| 1747 |
"family":"Indo-European",
|
| 1748 |
"flores_path":"nob_Latn",
|
| 1749 |
"fleurs_tag":"nb_no",
|
| 1750 |
-
"commonvoice_hours":0.
|
| 1751 |
"commonvoice_locale":"nb-NO",
|
| 1752 |
"in_benchmark":true
|
| 1753 |
},
|
|
@@ -2167,7 +2167,7 @@
|
|
| 2167 |
"family":"Indo-European",
|
| 2168 |
"flores_path":"glg_Latn",
|
| 2169 |
"fleurs_tag":"gl_es",
|
| 2170 |
-
"commonvoice_hours":
|
| 2171 |
"commonvoice_locale":"gl",
|
| 2172 |
"in_benchmark":true
|
| 2173 |
},
|
|
@@ -2323,7 +2323,7 @@
|
|
| 2323 |
"family":"Dravidian",
|
| 2324 |
"flores_path":null,
|
| 2325 |
"fleurs_tag":null,
|
| 2326 |
-
"commonvoice_hours":
|
| 2327 |
"commonvoice_locale":"brh",
|
| 2328 |
"in_benchmark":false
|
| 2329 |
},
|
|
@@ -2623,7 +2623,7 @@
|
|
| 2623 |
"family":"Indo-European",
|
| 2624 |
"flores_path":null,
|
| 2625 |
"fleurs_tag":null,
|
| 2626 |
-
"commonvoice_hours":0
|
| 2627 |
"commonvoice_locale":"haz",
|
| 2628 |
"in_benchmark":false
|
| 2629 |
},
|
|
@@ -2695,7 +2695,7 @@
|
|
| 2695 |
"family":"Indo-European",
|
| 2696 |
"flores_path":"oci_Latn",
|
| 2697 |
"fleurs_tag":"oc_fr",
|
| 2698 |
-
"commonvoice_hours":1.
|
| 2699 |
"commonvoice_locale":"oc",
|
| 2700 |
"in_benchmark":true
|
| 2701 |
},
|
|
@@ -3319,8 +3319,8 @@
|
|
| 3319 |
"family":"Indo-European",
|
| 3320 |
"flores_path":null,
|
| 3321 |
"fleurs_tag":null,
|
| 3322 |
-
"commonvoice_hours":
|
| 3323 |
-
"commonvoice_locale":
|
| 3324 |
"in_benchmark":false
|
| 3325 |
},
|
| 3326 |
{
|
|
@@ -3331,7 +3331,7 @@
|
|
| 3331 |
"family":"Indo-European",
|
| 3332 |
"flores_path":"gle_Latn",
|
| 3333 |
"fleurs_tag":"ga_ie",
|
| 3334 |
-
"commonvoice_hours":8.
|
| 3335 |
"commonvoice_locale":"ga-IE",
|
| 3336 |
"in_benchmark":true
|
| 3337 |
},
|
|
@@ -3487,7 +3487,7 @@
|
|
| 3487 |
"family":"Indo-European",
|
| 3488 |
"flores_path":"lvs_Latn",
|
| 3489 |
"fleurs_tag":"lv_lv",
|
| 3490 |
-
"commonvoice_hours":
|
| 3491 |
"commonvoice_locale":"lv",
|
| 3492 |
"in_benchmark":true
|
| 3493 |
},
|
|
@@ -3535,7 +3535,7 @@
|
|
| 3535 |
"family":null,
|
| 3536 |
"flores_path":"eus_Latn",
|
| 3537 |
"fleurs_tag":null,
|
| 3538 |
-
"commonvoice_hours":
|
| 3539 |
"commonvoice_locale":"eu",
|
| 3540 |
"in_benchmark":true
|
| 3541 |
},
|
|
@@ -3559,7 +3559,7 @@
|
|
| 3559 |
"family":"Abkhaz-Adyge",
|
| 3560 |
"flores_path":null,
|
| 3561 |
"fleurs_tag":null,
|
| 3562 |
-
"commonvoice_hours":
|
| 3563 |
"commonvoice_locale":"kbd",
|
| 3564 |
"in_benchmark":false
|
| 3565 |
},
|
|
@@ -3679,7 +3679,7 @@
|
|
| 3679 |
"family":"Indo-European",
|
| 3680 |
"flores_path":"ydd_Hebr",
|
| 3681 |
"fleurs_tag":null,
|
| 3682 |
-
"commonvoice_hours":0.
|
| 3683 |
"commonvoice_locale":"yi",
|
| 3684 |
"in_benchmark":true
|
| 3685 |
},
|
|
@@ -3991,8 +3991,8 @@
|
|
| 3991 |
"family":"Atlantic-Congo",
|
| 3992 |
"flores_path":null,
|
| 3993 |
"fleurs_tag":null,
|
| 3994 |
-
"commonvoice_hours":
|
| 3995 |
-
"commonvoice_locale":
|
| 3996 |
"in_benchmark":false
|
| 3997 |
},
|
| 3998 |
{
|
|
@@ -4351,7 +4351,7 @@
|
|
| 4351 |
"family":"Indo-European",
|
| 4352 |
"flores_path":null,
|
| 4353 |
"fleurs_tag":null,
|
| 4354 |
-
"commonvoice_hours":
|
| 4355 |
"commonvoice_locale":"br",
|
| 4356 |
"in_benchmark":false
|
| 4357 |
},
|
|
@@ -4651,7 +4651,7 @@
|
|
| 4651 |
"family":"Abkhaz-Adyge",
|
| 4652 |
"flores_path":null,
|
| 4653 |
"fleurs_tag":null,
|
| 4654 |
-
"commonvoice_hours":
|
| 4655 |
"commonvoice_locale":"ady",
|
| 4656 |
"in_benchmark":false
|
| 4657 |
},
|
|
@@ -7879,7 +7879,7 @@
|
|
| 7879 |
"family":"Artificial Language",
|
| 7880 |
"flores_path":"epo_Latn",
|
| 7881 |
"fleurs_tag":null,
|
| 7882 |
-
"commonvoice_hours":
|
| 7883 |
"commonvoice_locale":"eo",
|
| 7884 |
"in_benchmark":true
|
| 7885 |
},
|
|
|
|
| 7 |
"family":"Indo-European",
|
| 8 |
"flores_path":"eng_Latn",
|
| 9 |
"fleurs_tag":"en_us",
|
| 10 |
+
"commonvoice_hours":2678.0,
|
| 11 |
"commonvoice_locale":"en",
|
| 12 |
"in_benchmark":true
|
| 13 |
},
|
|
|
|
| 79 |
"family":"Indo-European",
|
| 80 |
"flores_path":"fra_Latn",
|
| 81 |
"fleurs_tag":"fr_fr",
|
| 82 |
+
"commonvoice_hours":1067.0,
|
| 83 |
"commonvoice_locale":"fr",
|
| 84 |
"in_benchmark":true
|
| 85 |
},
|
|
|
|
| 103 |
"family":"Indo-European",
|
| 104 |
"flores_path":"por_Latn",
|
| 105 |
"fleurs_tag":"pt_br",
|
| 106 |
+
"commonvoice_hours":181.0,
|
| 107 |
"commonvoice_locale":"pt",
|
| 108 |
"in_benchmark":true
|
| 109 |
},
|
|
|
|
| 115 |
"family":"Indo-European",
|
| 116 |
"flores_path":"pan_Guru",
|
| 117 |
"fleurs_tag":"pa_in",
|
| 118 |
+
"commonvoice_hours":2.5,
|
| 119 |
"commonvoice_locale":"pa-IN",
|
| 120 |
"in_benchmark":true
|
| 121 |
},
|
|
|
|
| 163 |
"family":"Indo-European",
|
| 164 |
"flores_path":"deu_Latn",
|
| 165 |
"fleurs_tag":"de_de",
|
| 166 |
+
"commonvoice_hours":1370.0,
|
| 167 |
"commonvoice_locale":"de",
|
| 168 |
"in_benchmark":true
|
| 169 |
},
|
|
|
|
| 379 |
"family":"Indo-European",
|
| 380 |
"flores_path":null,
|
| 381 |
"fleurs_tag":"ps_af",
|
| 382 |
+
"commonvoice_hours":82.0,
|
| 383 |
"commonvoice_locale":"ps",
|
| 384 |
"in_benchmark":false
|
| 385 |
},
|
|
|
|
| 619 |
"family":"Indo-European",
|
| 620 |
"flores_path":"nld_Latn",
|
| 621 |
"fleurs_tag":"nl_nl",
|
| 622 |
+
"commonvoice_hours":122.0,
|
| 623 |
"commonvoice_locale":"nl",
|
| 624 |
"in_benchmark":true
|
| 625 |
},
|
|
|
|
| 655 |
"family":"Atlantic-Congo",
|
| 656 |
"flores_path":"yor_Latn",
|
| 657 |
"fleurs_tag":"yo_ng",
|
| 658 |
+
"commonvoice_hours":6.4,
|
| 659 |
"commonvoice_locale":"yo",
|
| 660 |
"in_benchmark":true
|
| 661 |
},
|
|
|
|
| 1099 |
"family":"Indo-European",
|
| 1100 |
"flores_path":"ckb_Arab",
|
| 1101 |
"fleurs_tag":"ckb_iq",
|
| 1102 |
+
"commonvoice_hours":136.0,
|
| 1103 |
"commonvoice_locale":"ckb",
|
| 1104 |
"in_benchmark":true
|
| 1105 |
},
|
|
|
|
| 1183 |
"family":"Indo-European",
|
| 1184 |
"flores_path":"bel_Cyrl",
|
| 1185 |
"fleurs_tag":"be_by",
|
| 1186 |
+
"commonvoice_hours":1811.0,
|
| 1187 |
"commonvoice_locale":"be",
|
| 1188 |
"in_benchmark":true
|
| 1189 |
},
|
|
|
|
| 1243 |
"family":"Indo-European",
|
| 1244 |
"flores_path":"afr_Latn",
|
| 1245 |
"fleurs_tag":"af_za",
|
| 1246 |
+
"commonvoice_hours":0.6,
|
| 1247 |
"commonvoice_locale":"af",
|
| 1248 |
"in_benchmark":true
|
| 1249 |
},
|
|
|
|
| 1291 |
"family":"Indo-European",
|
| 1292 |
"flores_path":"cat_Latn",
|
| 1293 |
"fleurs_tag":"ca_es",
|
| 1294 |
+
"commonvoice_hours":2874.0,
|
| 1295 |
"commonvoice_locale":"ca",
|
| 1296 |
"in_benchmark":true
|
| 1297 |
},
|
|
|
|
| 1303 |
"family":"Afro-Asiatic",
|
| 1304 |
"flores_path":"heb_Hebr",
|
| 1305 |
"fleurs_tag":"he_il",
|
| 1306 |
+
"commonvoice_hours":1.6,
|
| 1307 |
"commonvoice_locale":"he",
|
| 1308 |
"in_benchmark":true
|
| 1309 |
},
|
|
|
|
| 1375 |
"family":"Turkic",
|
| 1376 |
"flores_path":"uig_Arab",
|
| 1377 |
"fleurs_tag":null,
|
| 1378 |
+
"commonvoice_hours":412.0,
|
| 1379 |
"commonvoice_locale":"ug",
|
| 1380 |
"in_benchmark":true
|
| 1381 |
},
|
|
|
|
| 1747 |
"family":"Indo-European",
|
| 1748 |
"flores_path":"nob_Latn",
|
| 1749 |
"fleurs_tag":"nb_no",
|
| 1750 |
+
"commonvoice_hours":0.6,
|
| 1751 |
"commonvoice_locale":"nb-NO",
|
| 1752 |
"in_benchmark":true
|
| 1753 |
},
|
|
|
|
| 2167 |
"family":"Indo-European",
|
| 2168 |
"flores_path":"glg_Latn",
|
| 2169 |
"fleurs_tag":"gl_es",
|
| 2170 |
+
"commonvoice_hours":121.0,
|
| 2171 |
"commonvoice_locale":"gl",
|
| 2172 |
"in_benchmark":true
|
| 2173 |
},
|
|
|
|
| 2323 |
"family":"Dravidian",
|
| 2324 |
"flores_path":null,
|
| 2325 |
"fleurs_tag":null,
|
| 2326 |
+
"commonvoice_hours":11.0,
|
| 2327 |
"commonvoice_locale":"brh",
|
| 2328 |
"in_benchmark":false
|
| 2329 |
},
|
|
|
|
| 2623 |
"family":"Indo-European",
|
| 2624 |
"flores_path":null,
|
| 2625 |
"fleurs_tag":null,
|
| 2626 |
+
"commonvoice_hours":11.0,
|
| 2627 |
"commonvoice_locale":"haz",
|
| 2628 |
"in_benchmark":false
|
| 2629 |
},
|
|
|
|
| 2695 |
"family":"Indo-European",
|
| 2696 |
"flores_path":"oci_Latn",
|
| 2697 |
"fleurs_tag":"oc_fr",
|
| 2698 |
+
"commonvoice_hours":1.9,
|
| 2699 |
"commonvoice_locale":"oc",
|
| 2700 |
"in_benchmark":true
|
| 2701 |
},
|
|
|
|
| 3319 |
"family":"Indo-European",
|
| 3320 |
"flores_path":null,
|
| 3321 |
"fleurs_tag":null,
|
| 3322 |
+
"commonvoice_hours":0.0,
|
| 3323 |
+
"commonvoice_locale":"mfe",
|
| 3324 |
"in_benchmark":false
|
| 3325 |
},
|
| 3326 |
{
|
|
|
|
| 3331 |
"family":"Indo-European",
|
| 3332 |
"flores_path":"gle_Latn",
|
| 3333 |
"fleurs_tag":"ga_ie",
|
| 3334 |
+
"commonvoice_hours":8.8,
|
| 3335 |
"commonvoice_locale":"ga-IE",
|
| 3336 |
"in_benchmark":true
|
| 3337 |
},
|
|
|
|
| 3487 |
"family":"Indo-European",
|
| 3488 |
"flores_path":"lvs_Latn",
|
| 3489 |
"fleurs_tag":"lv_lv",
|
| 3490 |
+
"commonvoice_hours":263.0,
|
| 3491 |
"commonvoice_locale":"lv",
|
| 3492 |
"in_benchmark":true
|
| 3493 |
},
|
|
|
|
| 3535 |
"family":null,
|
| 3536 |
"flores_path":"eus_Latn",
|
| 3537 |
"fleurs_tag":null,
|
| 3538 |
+
"commonvoice_hours":452.0,
|
| 3539 |
"commonvoice_locale":"eu",
|
| 3540 |
"in_benchmark":true
|
| 3541 |
},
|
|
|
|
| 3559 |
"family":"Abkhaz-Adyge",
|
| 3560 |
"flores_path":null,
|
| 3561 |
"fleurs_tag":null,
|
| 3562 |
+
"commonvoice_hours":92.0,
|
| 3563 |
"commonvoice_locale":"kbd",
|
| 3564 |
"in_benchmark":false
|
| 3565 |
},
|
|
|
|
| 3679 |
"family":"Indo-European",
|
| 3680 |
"flores_path":"ydd_Hebr",
|
| 3681 |
"fleurs_tag":null,
|
| 3682 |
+
"commonvoice_hours":0.8,
|
| 3683 |
"commonvoice_locale":"yi",
|
| 3684 |
"in_benchmark":true
|
| 3685 |
},
|
|
|
|
| 3991 |
"family":"Atlantic-Congo",
|
| 3992 |
"flores_path":null,
|
| 3993 |
"fleurs_tag":null,
|
| 3994 |
+
"commonvoice_hours":0.0,
|
| 3995 |
+
"commonvoice_locale":"gaa",
|
| 3996 |
"in_benchmark":false
|
| 3997 |
},
|
| 3998 |
{
|
|
|
|
| 4351 |
"family":"Indo-European",
|
| 4352 |
"flores_path":null,
|
| 4353 |
"fleurs_tag":null,
|
| 4354 |
+
"commonvoice_hours":30.0,
|
| 4355 |
"commonvoice_locale":"br",
|
| 4356 |
"in_benchmark":false
|
| 4357 |
},
|
|
|
|
| 4651 |
"family":"Abkhaz-Adyge",
|
| 4652 |
"flores_path":null,
|
| 4653 |
"fleurs_tag":null,
|
| 4654 |
+
"commonvoice_hours":31.0,
|
| 4655 |
"commonvoice_locale":"ady",
|
| 4656 |
"in_benchmark":false
|
| 4657 |
},
|
|
|
|
| 7879 |
"family":"Artificial Language",
|
| 7880 |
"flores_path":"epo_Latn",
|
| 7881 |
"fleurs_tag":null,
|
| 7882 |
+
"commonvoice_hours":1437.0,
|
| 7883 |
"commonvoice_locale":"eo",
|
| 7884 |
"in_benchmark":true
|
| 7885 |
},
|
models.json
CHANGED
|
@@ -28,7 +28,7 @@
|
|
| 28 |
"size":null,
|
| 29 |
"type":"closed-source",
|
| 30 |
"license":null,
|
| 31 |
-
"creation_date":1729555200000,
|
| 32 |
"tasks":[
|
| 33 |
"translation_from",
|
| 34 |
"translation_to",
|
|
@@ -48,7 +48,7 @@
|
|
| 48 |
"size":null,
|
| 49 |
"type":"closed-source",
|
| 50 |
"license":null,
|
| 51 |
-
"creation_date":1740355200000,
|
| 52 |
"tasks":[
|
| 53 |
"translation_from",
|
| 54 |
"translation_to",
|
|
@@ -68,7 +68,7 @@
|
|
| 68 |
"size":null,
|
| 69 |
"type":"closed-source",
|
| 70 |
"license":null,
|
| 71 |
-
"creation_date":1747872000000,
|
| 72 |
"tasks":[
|
| 73 |
"translation_from",
|
| 74 |
"translation_to",
|
|
@@ -83,7 +83,7 @@
|
|
| 83 |
"id":"deepseek\/deepseek-chat",
|
| 84 |
"name":"DeepSeek V3",
|
| 85 |
"provider_name":"DeepSeek",
|
| 86 |
-
"cost":0.
|
| 87 |
"hf_id":"deepseek-ai\/DeepSeek-V3",
|
| 88 |
"size":684531386000.0,
|
| 89 |
"type":"open-source",
|
|
@@ -128,7 +128,7 @@
|
|
| 128 |
"size":684531386000.0,
|
| 129 |
"type":"open-source",
|
| 130 |
"license":"Mit",
|
| 131 |
-
"creation_date":1737331200000,
|
| 132 |
"tasks":[
|
| 133 |
"translation_from",
|
| 134 |
"translation_to",
|
|
@@ -168,7 +168,7 @@
|
|
| 168 |
"size":null,
|
| 169 |
"type":"closed-source",
|
| 170 |
"license":null,
|
| 171 |
-
"creation_date":1738713600000,
|
| 172 |
"tasks":[
|
| 173 |
"translation_from",
|
| 174 |
"translation_to",
|
|
@@ -282,7 +282,7 @@
|
|
| 282 |
"size":null,
|
| 283 |
"type":"closed-source",
|
| 284 |
"license":null,
|
| 285 |
-
"creation_date":1750118400000,
|
| 286 |
"tasks":[
|
| 287 |
"translation_from",
|
| 288 |
"translation_to",
|
|
@@ -338,7 +338,7 @@
|
|
| 338 |
"size":null,
|
| 339 |
"type":"closed-source",
|
| 340 |
"license":null,
|
| 341 |
-
"creation_date":1715644800000,
|
| 342 |
"tasks":[
|
| 343 |
"translation_from",
|
| 344 |
"translation_to",
|
|
@@ -358,7 +358,7 @@
|
|
| 358 |
"size":null,
|
| 359 |
"type":"closed-source",
|
| 360 |
"license":null,
|
| 361 |
-
"creation_date":1727913600000,
|
| 362 |
"tasks":[
|
| 363 |
"translation_from",
|
| 364 |
"translation_to",
|
|
@@ -413,7 +413,7 @@
|
|
| 413 |
"size":null,
|
| 414 |
"type":"open-source",
|
| 415 |
"license":"Other",
|
| 416 |
-
"creation_date":1691625600000,
|
| 417 |
"tasks":[
|
| 418 |
"translation_from",
|
| 419 |
"translation_to",
|
|
@@ -512,7 +512,7 @@
|
|
| 512 |
"id":"meta-llama\/llama-4-maverick",
|
| 513 |
"name":"Llama 4 Maverick",
|
| 514 |
"provider_name":"Meta",
|
| 515 |
-
"cost":0.
|
| 516 |
"hf_id":"meta-llama\/Llama-4-Maverick-17B-128E-Instruct",
|
| 517 |
"size":401583781376.0,
|
| 518 |
"type":"open-source",
|
|
@@ -772,7 +772,7 @@
|
|
| 772 |
"id":"qwen\/qwen3-32b",
|
| 773 |
"name":"Qwen3 32B",
|
| 774 |
"provider_name":"Qwen",
|
| 775 |
-
"cost":0.
|
| 776 |
"hf_id":"Qwen\/Qwen3-32B",
|
| 777 |
"size":32762123264.0,
|
| 778 |
"type":"open-source",
|
|
|
|
| 28 |
"size":null,
|
| 29 |
"type":"closed-source",
|
| 30 |
"license":null,
|
| 31 |
+
"creation_date":1729555200000.0,
|
| 32 |
"tasks":[
|
| 33 |
"translation_from",
|
| 34 |
"translation_to",
|
|
|
|
| 48 |
"size":null,
|
| 49 |
"type":"closed-source",
|
| 50 |
"license":null,
|
| 51 |
+
"creation_date":1740355200000.0,
|
| 52 |
"tasks":[
|
| 53 |
"translation_from",
|
| 54 |
"translation_to",
|
|
|
|
| 68 |
"size":null,
|
| 69 |
"type":"closed-source",
|
| 70 |
"license":null,
|
| 71 |
+
"creation_date":1747872000000.0,
|
| 72 |
"tasks":[
|
| 73 |
"translation_from",
|
| 74 |
"translation_to",
|
|
|
|
| 83 |
"id":"deepseek\/deepseek-chat",
|
| 84 |
"name":"DeepSeek V3",
|
| 85 |
"provider_name":"DeepSeek",
|
| 86 |
+
"cost":0.27,
|
| 87 |
"hf_id":"deepseek-ai\/DeepSeek-V3",
|
| 88 |
"size":684531386000.0,
|
| 89 |
"type":"open-source",
|
|
|
|
| 128 |
"size":684531386000.0,
|
| 129 |
"type":"open-source",
|
| 130 |
"license":"Mit",
|
| 131 |
+
"creation_date":1737331200000.0,
|
| 132 |
"tasks":[
|
| 133 |
"translation_from",
|
| 134 |
"translation_to",
|
|
|
|
| 168 |
"size":null,
|
| 169 |
"type":"closed-source",
|
| 170 |
"license":null,
|
| 171 |
+
"creation_date":1738713600000.0,
|
| 172 |
"tasks":[
|
| 173 |
"translation_from",
|
| 174 |
"translation_to",
|
|
|
|
| 282 |
"size":null,
|
| 283 |
"type":"closed-source",
|
| 284 |
"license":null,
|
| 285 |
+
"creation_date":1750118400000.0,
|
| 286 |
"tasks":[
|
| 287 |
"translation_from",
|
| 288 |
"translation_to",
|
|
|
|
| 338 |
"size":null,
|
| 339 |
"type":"closed-source",
|
| 340 |
"license":null,
|
| 341 |
+
"creation_date":1715644800000.0,
|
| 342 |
"tasks":[
|
| 343 |
"translation_from",
|
| 344 |
"translation_to",
|
|
|
|
| 358 |
"size":null,
|
| 359 |
"type":"closed-source",
|
| 360 |
"license":null,
|
| 361 |
+
"creation_date":1727913600000.0,
|
| 362 |
"tasks":[
|
| 363 |
"translation_from",
|
| 364 |
"translation_to",
|
|
|
|
| 413 |
"size":null,
|
| 414 |
"type":"open-source",
|
| 415 |
"license":"Other",
|
| 416 |
+
"creation_date":1691625600000.0,
|
| 417 |
"tasks":[
|
| 418 |
"translation_from",
|
| 419 |
"translation_to",
|
|
|
|
| 512 |
"id":"meta-llama\/llama-4-maverick",
|
| 513 |
"name":"Llama 4 Maverick",
|
| 514 |
"provider_name":"Meta",
|
| 515 |
+
"cost":0.6,
|
| 516 |
"hf_id":"meta-llama\/Llama-4-Maverick-17B-128E-Instruct",
|
| 517 |
"size":401583781376.0,
|
| 518 |
"type":"open-source",
|
|
|
|
| 772 |
"id":"qwen\/qwen3-32b",
|
| 773 |
"name":"Qwen3 32B",
|
| 774 |
"provider_name":"Qwen",
|
| 775 |
+
"cost":0.03,
|
| 776 |
"hf_id":"Qwen\/Qwen3-32B",
|
| 777 |
"size":32762123264.0,
|
| 778 |
"type":"open-source",
|