davidpomerenke committed on
Commit
088f96f
·
verified ·
1 Parent(s): b39df3c

Upload from GitHub Actions: ran full evaluation locally

Browse files
Files changed (6) hide show
  1. .gitattributes +1 -0
  2. errors.log +3 -0
  3. evals/main.py +83 -43
  4. languages.json +3 -3
  5. models.json +509 -500
  6. results.json +2 -2
.gitattributes CHANGED
@@ -1,2 +1,3 @@
1
  evals/data_flow_architecture.png filter=lfs diff=lfs merge=lfs -text
2
  results.json filter=lfs diff=lfs merge=lfs -text
 
 
1
  evals/data_flow_architecture.png filter=lfs diff=lfs merge=lfs -text
2
  results.json filter=lfs diff=lfs merge=lfs -text
3
+ errors.log filter=lfs diff=lfs merge=lfs -text
errors.log ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bbd7bf12d062c48650b24bb1c138d565f8129cb9d4ecabeedc3d165edcd57cb
3
+ size 11143443
evals/main.py CHANGED
@@ -14,7 +14,7 @@ async def evaluate():
14
  single_model = os.environ.get("SINGLE_MODEL") # Optional: run only one specific model
15
  test_mode = os.environ.get("TEST", "").lower() in ("1", "true", "yes") # Optional: skip results loading/saving
16
 
17
- # Keep original DataFrames for saving metadata
18
  original_models_df = pd.DataFrame(models)
19
  original_languages_df = pd.DataFrame(languages)
20
 
@@ -59,8 +59,11 @@ async def evaluate():
59
 
60
  # Filter out already evaluated combinations
61
  combis = pd.DataFrame(combis, columns=["model", "bcp_47", "task"])
62
- combis = combis.merge(old_results, on=["model", "bcp_47", "task"], how="left")
63
- combis = combis[combis["metric"].isna()][["model", "bcp_47", "task"]]
 
 
 
64
 
65
  # Create all evaluation tasks
66
  all_tasks = []
@@ -70,64 +73,101 @@ async def evaluate():
70
 
71
  print(f"Running {len(all_tasks)} evaluation tasks...")
72
 
73
- # Run all tasks with simple asyncio.gather, but stop on first error
 
 
 
 
 
 
 
74
  try:
75
- results = await asyncio.gather(
76
- *[task_func(model, bcp_47, sentence_nr) for task_func, model, bcp_47, sentence_nr in all_tasks],
77
- return_exceptions=False # This will raise on first exception
78
- )
 
 
 
 
 
79
 
80
- # Process results - no exceptions should reach here
81
  valid_results = []
82
- for r in results:
83
- if isinstance(r, list):
 
 
 
 
 
 
84
  valid_results.extend(r)
85
- else:
86
  valid_results.append(r)
87
-
88
- print(f"Completed: {len(valid_results)} valid results")
89
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
90
  except Exception as e:
91
  print(f"EVALUATION STOPPED - API Error occurred:")
92
  print(f"Error type: {type(e).__name__}")
93
  print(f"Error message: {str(e)}")
94
  return pd.DataFrame()
95
 
96
- # Save results (skip in test mode)
97
- if valid_results:
98
- results_df = pd.DataFrame(valid_results)
99
-
100
- # Aggregate results
101
- results_df = (
102
- results_df.groupby(["model", "bcp_47", "task", "metric", "origin"])
103
- .agg({"score": "mean"})
104
- .reset_index()
105
- )
 
 
 
106
 
107
- if not test_mode:
108
- args = dict(orient="records", indent=2, force_ascii=False)
109
-
110
- # Merge with existing results
111
- if not old_results.empty:
112
- results_df = pd.concat([old_results, results_df])
113
- results_df = results_df.drop_duplicates(subset=["model", "bcp_47", "task", "metric", "origin"])
114
-
115
- results_df = results_df.sort_values(by=["model", "bcp_47", "task", "metric"])
116
- results_df.to_json("results.json", **args)
117
-
118
- # Save model and language info (always save complete metadata, not filtered)
119
- original_models_df.to_json("models.json", **args)
120
- original_languages_df.to_json("languages.json", **args)
121
- else:
122
- print("TEST MODE: Skipping results saving")
123
 
124
- elapsed = time.time() - start_time
125
- print(f"Evaluation completed in {str(timedelta(seconds=int(elapsed)))}")
126
 
127
- return results_df
 
 
 
 
 
 
 
 
 
128
 
129
  return pd.DataFrame()
130
 
131
 
 
132
  if __name__ == "__main__":
133
  results = asyncio.run(evaluate())
 
14
  single_model = os.environ.get("SINGLE_MODEL") # Optional: run only one specific model
15
  test_mode = os.environ.get("TEST", "").lower() in ("1", "true", "yes") # Optional: skip results loading/saving
16
 
17
+ # Keep original DataFrames for saving metadata - distinction added for single model test runs.
18
  original_models_df = pd.DataFrame(models)
19
  original_languages_df = pd.DataFrame(languages)
20
 
 
59
 
60
  # Filter out already evaluated combinations
61
  combis = pd.DataFrame(combis, columns=["model", "bcp_47", "task"])
62
+ if not old_results.empty:
63
+ completed = set(old_results[["model", "bcp_47", "task"]].apply(tuple, axis=1))
64
+ # Filtering combis against a set of completed tuples is faster than a merge (locally it made a noticeable difference when loading all data/tasks into memory)
65
+ mask = ~combis.apply(lambda row: (row["model"], row["bcp_47"], row["task"]) in completed, axis=1)
66
+ combis = combis[mask]
67
 
68
  # Create all evaluation tasks
69
  all_tasks = []
 
73
 
74
  print(f"Running {len(all_tasks)} evaluation tasks...")
75
 
76
+ # For single model runs, we stop immediately on first API error to inspect.
77
+ # For full evaluations, we continue despite errors to get maximum coverage.
78
+ stop_on_error = single_model is not None
79
+
80
+ # Process tasks in batches to avoid memory issues (for full evaluation locally that helped a lot)
81
+ batch_size = 1000
82
+ all_results = []
83
+
84
  try:
85
+ for i in range(0, len(all_tasks), batch_size):
86
+ batch = all_tasks[i:i + batch_size]
87
+ batch_results = await asyncio.gather(
88
+ *[task_func(model, bcp_47, sentence_nr) for task_func, model, bcp_47, sentence_nr in batch],
89
+ return_exceptions=not stop_on_error
90
+ )
91
+ all_results.extend(batch_results)
92
+
93
+ results = all_results
94
 
95
+ # Process results and log API errors separately to understand what the main issues are.
96
  valid_results = []
97
+ errors = []
98
+
99
+ for i, r in enumerate(results):
100
+ if isinstance(r, Exception):
101
+ if i < len(all_tasks):
102
+ task_info = all_tasks[i]
103
+ errors.append(f"{task_info[1]},{task_info[2]},{str(r)}")
104
+ elif isinstance(r, list):
105
  valid_results.extend(r)
106
+ elif r is not None:
107
  valid_results.append(r)
 
 
108
 
109
+ # log errors and store
110
+ if errors:
111
+ with open("errors.log", "w") as f:
112
+ f.write("model,task,error\n")
113
+ for error in errors:
114
+ f.write(error + "\n")
115
+
116
+ # Track model completion (TO BE DELETED - was for local run only)
117
+ if valid_results:
118
+ completed_models = set()
119
+ for result in valid_results:
120
+ if isinstance(result, dict) and "model" in result:
121
+ model = result["model"]
122
+ if model not in completed_models:
123
+ completed_models.add(model)
124
+ print(f"Completed: {model}")
125
+
126
+ print(f"Completed: {len(valid_results)} valid results, {len(errors)} errors")
127
+
128
+ # this is for local single model runs - for testing and development
129
  except Exception as e:
130
  print(f"EVALUATION STOPPED - API Error occurred:")
131
  print(f"Error type: {type(e).__name__}")
132
  print(f"Error message: {str(e)}")
133
  return pd.DataFrame()
134
 
135
+ # Save results (skipped in test mode as we do not want to overwrite existing results)
136
+ if valid_results:
137
+ results_df = pd.DataFrame(valid_results)
138
+
139
+ # Aggregate results
140
+ results_df = (
141
+ results_df.groupby(["model", "bcp_47", "task", "metric", "origin"])
142
+ .agg({"score": "mean"})
143
+ .reset_index()
144
+ )
145
+
146
+ if not test_mode:
147
+ args = dict(orient="records", indent=2, force_ascii=False)
148
 
149
+ # Merge with existing results
150
+ if not old_results.empty:
151
+ results_df = pd.concat([old_results, results_df])
152
+ results_df = results_df.drop_duplicates(subset=["model", "bcp_47", "task", "metric", "origin"])
 
 
 
 
 
 
 
 
 
 
 
 
153
 
154
+ results_df = results_df.sort_values(by=["model", "bcp_47", "task", "metric"])
155
+ results_df.to_json("results.json", **args)
156
 
157
+ # Save model and language info (always save complete metadata, not filtered)
158
+ original_models_df.to_json("models.json", **args)
159
+ original_languages_df.to_json("languages.json", **args)
160
+ else:
161
+ print("TEST MODE: Skipping results saving")
162
+
163
+ elapsed = time.time() - start_time
164
+ print(f"Evaluation completed in {str(timedelta(seconds=int(elapsed)))}")
165
+
166
+ return results_df
167
 
168
  return pd.DataFrame()
169
 
170
 
171
+
172
  if __name__ == "__main__":
173
  results = asyncio.run(evaluate())
languages.json CHANGED
@@ -979,7 +979,7 @@
979
  "family":"Turkic",
980
  "flores_path":"kaz_Cyrl",
981
  "fleurs_tag":"kk_kz",
982
- "commonvoice_hours":2.2,
983
  "commonvoice_locale":"kk",
984
  "in_benchmark":true
985
  },
@@ -2167,7 +2167,7 @@
2167
  "family":"Indo-European",
2168
  "flores_path":"glg_Latn",
2169
  "fleurs_tag":"gl_es",
2170
- "commonvoice_hours":162.0,
2171
  "commonvoice_locale":"gl",
2172
  "in_benchmark":true
2173
  },
@@ -3679,7 +3679,7 @@
3679
  "family":"Indo-European",
3680
  "flores_path":"ydd_Hebr",
3681
  "fleurs_tag":null,
3682
- "commonvoice_hours":1.7,
3683
  "commonvoice_locale":"yi",
3684
  "in_benchmark":true
3685
  },
 
979
  "family":"Turkic",
980
  "flores_path":"kaz_Cyrl",
981
  "fleurs_tag":"kk_kz",
982
+ "commonvoice_hours":2.3,
983
  "commonvoice_locale":"kk",
984
  "in_benchmark":true
985
  },
 
2167
  "family":"Indo-European",
2168
  "flores_path":"glg_Latn",
2169
  "fleurs_tag":"gl_es",
2170
+ "commonvoice_hours":163.0,
2171
  "commonvoice_locale":"gl",
2172
  "in_benchmark":true
2173
  },
 
3679
  "family":"Indo-European",
3680
  "flores_path":"ydd_Hebr",
3681
  "fleurs_tag":null,
3682
+ "commonvoice_hours":1.8,
3683
  "commonvoice_locale":"yi",
3684
  "in_benchmark":true
3685
  },
models.json CHANGED
@@ -1,15 +1,15 @@
1
  [
2
  {
3
- "id": "amazon/nova-micro-v1",
4
- "name": "Nova Micro 1.0",
5
- "provider_name": "Amazon",
6
- "cost": 0.14,
7
- "hf_id": null,
8
- "size": null,
9
- "type": "closed-source",
10
- "license": null,
11
- "creation_date": 1733356800000,
12
- "tasks": [
13
  "translation_from",
14
  "translation_to",
15
  "classification",
@@ -20,16 +20,16 @@
20
  ]
21
  },
22
  {
23
- "id": "anthracite-org/magnum-v4-72b",
24
- "name": "Magnum v4 72B",
25
- "provider_name": "Magnum v4 72B",
26
- "cost": 3.0,
27
- "hf_id": "anthracite-org/magnum-v4-72b",
28
- "size": 72706203648.0,
29
- "type": "open-source",
30
- "license": "Apache 2.0",
31
- "creation_date": 1726790400000,
32
- "tasks": [
33
  "translation_from",
34
  "translation_to",
35
  "classification",
@@ -40,16 +40,16 @@
40
  ]
41
  },
42
  {
43
- "id": "anthropic/claude-sonnet-4",
44
- "name": "Claude Sonnet 4",
45
- "provider_name": "Anthropic",
46
- "cost": 15.0,
47
- "hf_id": null,
48
- "size": null,
49
- "type": "closed-source",
50
- "license": null,
51
- "creation_date": 1747872000000,
52
- "tasks": [
53
  "translation_from",
54
  "translation_to",
55
  "classification",
@@ -60,16 +60,16 @@
60
  ]
61
  },
62
  {
63
- "id": "deepseek/deepseek-chat",
64
- "name": "DeepSeek V3",
65
- "provider_name": "DeepSeek",
66
- "cost": 0.72,
67
- "hf_id": "deepseek-ai/DeepSeek-V3",
68
- "size": 684531386000.0,
69
- "type": "open-source",
70
- "license": "",
71
- "creation_date": 1735084800000,
72
- "tasks": [
73
  "translation_from",
74
  "translation_to",
75
  "classification",
@@ -80,16 +80,16 @@
80
  ]
81
  },
82
  {
83
- "id": "deepseek/deepseek-chat-v3-0324",
84
- "name": "DeepSeek V3 0324",
85
- "provider_name": "DeepSeek",
86
- "cost": 0.0,
87
- "hf_id": "deepseek-ai/DeepSeek-V3-0324",
88
- "size": 684531386000.0,
89
- "type": "open-source",
90
- "license": "Mit",
91
- "creation_date": 1742774400000,
92
- "tasks": [
93
  "translation_from",
94
  "translation_to",
95
  "classification",
@@ -100,16 +100,16 @@
100
  ]
101
  },
102
  {
103
- "id": "deepseek/deepseek-r1-0528",
104
- "name": "R1 0528",
105
- "provider_name": "DeepSeek",
106
- "cost": 0.0,
107
- "hf_id": "deepseek-ai/DeepSeek-R1-0528",
108
- "size": 684531386000.0,
109
- "type": "open-source",
110
- "license": "Mit",
111
- "creation_date": 1748390400000,
112
- "tasks": [
113
  "translation_from",
114
  "translation_to",
115
  "classification",
@@ -120,16 +120,16 @@
120
  ]
121
  },
122
  {
123
- "id": "google/gemini-2.0-flash-lite-001",
124
- "name": "Gemini 2.0 Flash Lite",
125
- "provider_name": "Google",
126
- "cost": 0.3,
127
- "hf_id": null,
128
- "size": null,
129
- "type": "closed-source",
130
- "license": null,
131
- "creation_date": 1740441600000,
132
- "tasks": [
133
  "translation_from",
134
  "translation_to",
135
  "classification",
@@ -140,16 +140,16 @@
140
  ]
141
  },
142
  {
143
- "id": "google/gemini-2.5-flash",
144
- "name": "Gemini 2.5 Flash",
145
- "provider_name": "Google",
146
- "cost": 2.5,
147
- "hf_id": null,
148
- "size": null,
149
- "type": "closed-source",
150
- "license": null,
151
- "creation_date": 1750118400000,
152
- "tasks": [
153
  "translation_from",
154
  "translation_to",
155
  "classification",
@@ -160,16 +160,16 @@
160
  ]
161
  },
162
  {
163
- "id": "google/gemma-2-9b-it",
164
- "name": "Gemma 2 9B",
165
- "provider_name": "Google",
166
- "cost": 0.0,
167
- "hf_id": "google/gemma-2-9b-it",
168
- "size": 9241705984.0,
169
- "type": "open-source",
170
- "license": "Gemma",
171
- "creation_date": 1719187200000,
172
- "tasks": [
173
  "translation_from",
174
  "translation_to",
175
  "classification",
@@ -180,16 +180,16 @@
180
  ]
181
  },
182
  {
183
- "id": "google/gemma-3-27b-it",
184
- "name": "Gemma 3 27B",
185
- "provider_name": "Google",
186
- "cost": 0.0,
187
- "hf_id": "google/gemma-3-27b-it",
188
- "size": 27432406640.0,
189
- "type": "open-source",
190
- "license": "Gemma",
191
- "creation_date": 1740787200000,
192
- "tasks": [
193
  "translation_from",
194
  "translation_to",
195
  "classification",
@@ -200,16 +200,16 @@
200
  ]
201
  },
202
  {
203
- "id": "meta-llama/llama-3-70b-instruct",
204
- "name": "Llama 3 70B Instruct",
205
- "provider_name": "Meta",
206
- "cost": 0.4,
207
- "hf_id": "meta-llama/Meta-Llama-3-70B-Instruct",
208
- "size": 70553706496.0,
209
- "type": "open-source",
210
- "license": "Llama3",
211
- "creation_date": 1713312000000,
212
- "tasks": [
213
  "translation_from",
214
  "translation_to",
215
  "classification",
@@ -220,16 +220,16 @@
220
  ]
221
  },
222
  {
223
- "id": "meta-llama/llama-3.1-70b-instruct",
224
- "name": "Llama 3.1 70B Instruct",
225
- "provider_name": "Meta",
226
- "cost": 0.28,
227
- "hf_id": "meta-llama/Llama-3.1-70B-Instruct",
228
- "size": 70553706496.0,
229
- "type": "open-source",
230
- "license": "Llama3.1",
231
- "creation_date": 1721088000000,
232
- "tasks": [
233
  "translation_from",
234
  "translation_to",
235
  "classification",
@@ -240,16 +240,16 @@
240
  ]
241
  },
242
  {
243
- "id": "meta-llama/llama-3.2-3b-instruct",
244
- "name": "Llama 3.2 3B Instruct",
245
- "provider_name": "Meta",
246
- "cost": 0.0,
247
- "hf_id": "meta-llama/Llama-3.2-3B-Instruct",
248
- "size": 3212749824.0,
249
- "type": "open-source",
250
- "license": "Llama3.2",
251
- "creation_date": 1726617600000,
252
- "tasks": [
253
  "translation_from",
254
  "translation_to",
255
  "classification",
@@ -260,16 +260,16 @@
260
  ]
261
  },
262
  {
263
- "id": "meta-llama/llama-3.3-70b-instruct",
264
- "name": "Llama 3.3 70B Instruct",
265
- "provider_name": "Meta",
266
- "cost": 0.0,
267
- "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
268
- "size": 70553706496.0,
269
- "type": "open-source",
270
- "license": "Llama3.3",
271
- "creation_date": 1732579200000,
272
- "tasks": [
273
  "translation_from",
274
  "translation_to",
275
  "classification",
@@ -280,16 +280,16 @@
280
  ]
281
  },
282
  {
283
- "id": "meta-llama/llama-4-maverick",
284
- "name": "Llama 4 Maverick",
285
- "provider_name": "Meta",
286
- "cost": 0.6,
287
- "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
288
- "size": 401583781376.0,
289
- "type": "open-source",
290
- "license": "Other",
291
- "creation_date": 1743465600000,
292
- "tasks": [
293
  "translation_from",
294
  "translation_to",
295
  "classification",
@@ -300,16 +300,16 @@
300
  ]
301
  },
302
  {
303
- "id": "meta-llama/llama-guard-4-12b",
304
- "name": "Llama Guard 4 12B",
305
- "provider_name": "Meta",
306
- "cost": 0.18,
307
- "hf_id": "meta-llama/Llama-Guard-4-12B",
308
- "size": 12001097216.0,
309
- "type": "open-source",
310
- "license": "Other",
311
- "creation_date": 1745366400000,
312
- "tasks": [
313
  "translation_from",
314
  "translation_to",
315
  "classification",
@@ -320,16 +320,16 @@
320
  ]
321
  },
322
  {
323
- "id": "microsoft/phi-3-medium-128k-instruct",
324
- "name": "Phi-3 Medium 128K Instruct",
325
- "provider_name": "Microsoft",
326
- "cost": 1.0,
327
- "hf_id": "microsoft/Phi-3-medium-128k-instruct",
328
- "size": 13960238080.0,
329
- "type": "open-source",
330
- "license": "Mit",
331
- "creation_date": 1715040000000,
332
- "tasks": [
333
  "translation_from",
334
  "translation_to",
335
  "classification",
@@ -340,16 +340,16 @@
340
  ]
341
  },
342
  {
343
- "id": "microsoft/phi-3.5-mini-128k-instruct",
344
- "name": "Phi-3.5 Mini 128K Instruct",
345
- "provider_name": "Microsoft",
346
- "cost": 0.1,
347
- "hf_id": "microsoft/Phi-3.5-mini-instruct",
348
- "size": 3821079552.0,
349
- "type": "open-source",
350
- "license": "Mit",
351
- "creation_date": 1723766400000,
352
- "tasks": [
353
  "translation_from",
354
  "translation_to",
355
  "classification",
@@ -360,16 +360,16 @@
360
  ]
361
  },
362
  {
363
- "id": "microsoft/phi-4",
364
- "name": "Phi 4",
365
- "provider_name": "Microsoft",
366
- "cost": 0.14,
367
- "hf_id": "microsoft/phi-4",
368
- "size": 14659507200.0,
369
- "type": "open-source",
370
- "license": "Mit",
371
- "creation_date": 1733875200000,
372
- "tasks": [
373
  "translation_from",
374
  "translation_to",
375
  "classification",
@@ -380,16 +380,16 @@
380
  ]
381
  },
382
  {
383
- "id": "microsoft/phi-4-multimodal-instruct",
384
- "name": "Phi 4 Multimodal Instruct",
385
- "provider_name": "Microsoft",
386
- "cost": 0.1,
387
- "hf_id": "microsoft/Phi-4-multimodal-instruct",
388
- "size": 5574460384.0,
389
- "type": "open-source",
390
- "license": "Mit",
391
- "creation_date": 1740355200000,
392
- "tasks": [
393
  "translation_from",
394
  "translation_to",
395
  "classification",
@@ -400,16 +400,16 @@
400
  ]
401
  },
402
  {
403
- "id": "mistralai/magistral-medium-2506",
404
- "name": "Magistral Medium 2506",
405
- "provider_name": "Mistral",
406
- "cost": 5.0,
407
- "hf_id": null,
408
- "size": null,
409
- "type": "closed-source",
410
- "license": null,
411
- "creation_date": 1749340800000,
412
- "tasks": [
413
  "translation_from",
414
  "translation_to",
415
  "classification",
@@ -420,16 +420,16 @@
420
  ]
421
  },
422
  {
423
- "id": "mistralai/mistral-7b-instruct",
424
- "name": "Mistral 7B Instruct",
425
- "provider_name": "Mistral",
426
- "cost": 0.0,
427
- "hf_id": "mistralai/Mistral-7B-Instruct-v0.3",
428
- "size": 7248023552.0,
429
- "type": "open-source",
430
- "license": "Apache 2.0",
431
- "creation_date": 1716336000000,
432
- "tasks": [
433
  "translation_from",
434
  "translation_to",
435
  "classification",
@@ -440,16 +440,16 @@
440
  ]
441
  },
442
  {
443
- "id": "mistralai/mistral-nemo",
444
- "name": "Mistral Nemo",
445
- "provider_name": "Mistral",
446
- "cost": 0.0,
447
- "hf_id": "mistralai/Mistral-Nemo-Instruct-2407",
448
- "size": 12247782400.0,
449
- "type": "open-source",
450
- "license": "Apache 2.0",
451
- "creation_date": 1721174400000,
452
- "tasks": [
453
  "translation_from",
454
  "translation_to",
455
  "classification",
@@ -460,16 +460,16 @@
460
  ]
461
  },
462
  {
463
- "id": "mistralai/mistral-saba",
464
- "name": "Saba",
465
- "provider_name": "Mistral",
466
- "cost": 0.6,
467
- "hf_id": null,
468
- "size": null,
469
- "type": "closed-source",
470
- "license": null,
471
- "creation_date": 1739750400000,
472
- "tasks": [
473
  "translation_from",
474
  "translation_to",
475
  "classification",
@@ -480,16 +480,16 @@
480
  ]
481
  },
482
  {
483
- "id": "mistralai/mistral-small-3.1-24b-instruct",
484
- "name": "Mistral Small 3.1 24B",
485
- "provider_name": "Mistral",
486
- "cost": 0.0,
487
- "hf_id": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
488
- "size": 24011361280.0,
489
- "type": "open-source",
490
- "license": "Apache 2.0",
491
- "creation_date": 1741651200000,
492
- "tasks": [
493
  "translation_from",
494
  "translation_to",
495
  "classification",
@@ -500,16 +500,16 @@
500
  ]
501
  },
502
  {
503
- "id": "mistralai/mixtral-8x7b-instruct",
504
- "name": "Mixtral 8x7B Instruct",
505
- "provider_name": "Mistral",
506
- "cost": 0.24,
507
- "hf_id": "mistralai/Mixtral-8x7B-Instruct-v0.1",
508
- "size": 46702792704.0,
509
- "type": "open-source",
510
- "license": "Apache 2.0",
511
- "creation_date": 1702166400000,
512
- "tasks": [
513
  "translation_from",
514
  "translation_to",
515
  "classification",
@@ -520,16 +520,16 @@
520
  ]
521
  },
522
  {
523
- "id": "neversleep/llama-3-lumimaid-70b",
524
- "name": "Llama 3 Lumimaid 70B",
525
- "provider_name": "NeverSleep",
526
- "cost": 6.0,
527
- "hf_id": "NeverSleep/Llama-3-Lumimaid-70B-v0.1",
528
- "size": 70553706496.0,
529
- "type": "open-source",
530
- "license": "Cc By Nc 4.0",
531
- "creation_date": 1714262400000,
532
- "tasks": [
533
  "translation_from",
534
  "translation_to",
535
  "classification",
@@ -540,16 +540,16 @@
540
  ]
541
  },
542
  {
543
- "id": "nvidia/llama-3.1-nemotron-70b-instruct",
544
- "name": "Llama 3.1 Nemotron 70B Instruct",
545
- "provider_name": "NVIDIA",
546
- "cost": 0.3,
547
- "hf_id": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF",
548
- "size": 70553706496.0,
549
- "type": "open-source",
550
- "license": "Llama3.1",
551
- "creation_date": 1728691200000,
552
- "tasks": [
553
  "translation_from",
554
  "translation_to",
555
  "classification",
@@ -560,16 +560,16 @@
560
  ]
561
  },
562
  {
563
- "id": "openai/chatgpt-4o-latest",
564
- "name": "ChatGPT-4o",
565
- "provider_name": "OpenAI",
566
- "cost": 15.0,
567
- "hf_id": null,
568
- "size": null,
569
- "type": "closed-source",
570
- "license": null,
571
- "creation_date": 1723593600000,
572
- "tasks": [
573
  "translation_from",
574
  "translation_to",
575
  "classification",
@@ -580,16 +580,16 @@
580
  ]
581
  },
582
  {
583
- "id": "openai/gpt-3.5-turbo",
584
- "name": "GPT-3.5 Turbo",
585
- "provider_name": "OpenAI",
586
- "cost": 1.5,
587
- "hf_id": null,
588
- "size": null,
589
- "type": "closed-source",
590
- "license": null,
591
- "creation_date": 1685232000000,
592
- "tasks": [
593
  "translation_from",
594
  "translation_to",
595
  "classification",
@@ -600,16 +600,16 @@
600
  ]
601
  },
602
  {
603
- "id": "openai/gpt-3.5-turbo-0613",
604
- "name": "GPT-3.5 Turbo (older v0613)",
605
- "provider_name": "OpenAI",
606
- "cost": 2.0,
607
- "hf_id": null,
608
- "size": null,
609
- "type": "closed-source",
610
- "license": null,
611
- "creation_date": 1706140800000,
612
- "tasks": [
613
  "translation_from",
614
  "translation_to",
615
  "classification",
@@ -620,16 +620,16 @@
620
  ]
621
  },
622
  {
623
- "id": "openai/gpt-4.1",
624
- "name": "GPT-4.1",
625
- "provider_name": "OpenAI",
626
- "cost": 8.0,
627
- "hf_id": null,
628
- "size": null,
629
- "type": "closed-source",
630
- "license": null,
631
- "creation_date": 1744588800000,
632
- "tasks": [
633
  "translation_from",
634
  "translation_to",
635
  "classification",
@@ -640,16 +640,16 @@
640
  ]
641
  },
642
  {
643
- "id": "openai/gpt-4.1-mini",
644
- "name": "GPT-4.1 Mini",
645
- "provider_name": "OpenAI",
646
- "cost": 1.6,
647
- "hf_id": null,
648
- "size": null,
649
- "type": "closed-source",
650
- "license": null,
651
- "creation_date": 1744588800000,
652
- "tasks": [
653
  "translation_from",
654
  "translation_to",
655
  "classification",
@@ -660,16 +660,16 @@
660
  ]
661
  },
662
  {
663
- "id": "openai/gpt-4.1-nano",
664
- "name": "GPT-4.1 Nano",
665
- "provider_name": "OpenAI",
666
- "cost": 0.4,
667
- "hf_id": null,
668
- "size": null,
669
- "type": "closed-source",
670
- "license": null,
671
- "creation_date": 1744588800000,
672
- "tasks": [
673
  "translation_from",
674
  "translation_to",
675
  "classification",
@@ -680,16 +680,16 @@
680
  ]
681
  },
682
  {
683
- "id": "openai/gpt-4o-2024-11-20",
684
- "name": "GPT-4o (2024-11-20)",
685
- "provider_name": "OpenAI",
686
- "cost": 10.0,
687
- "hf_id": null,
688
- "size": null,
689
- "type": "closed-source",
690
- "license": null,
691
- "creation_date": 1732060800000,
692
- "tasks": [
693
  "translation_from",
694
  "translation_to",
695
  "classification",
@@ -700,16 +700,16 @@
700
  ]
701
  },
702
  {
703
- "id": "openai/gpt-4o-mini",
704
- "name": "GPT-4o-mini",
705
- "provider_name": "OpenAI",
706
- "cost": 0.6,
707
- "hf_id": null,
708
- "size": null,
709
- "type": "closed-source",
710
- "license": null,
711
- "creation_date": 1721260800000,
712
- "tasks": [
713
  "translation_from",
714
  "translation_to",
715
  "classification",
@@ -720,16 +720,16 @@
720
  ]
721
  },
722
  {
723
- "id": "openai/gpt-5",
724
- "name": "GPT-5",
725
- "provider_name": "OpenAI",
726
- "cost": 10.0,
727
- "hf_id": null,
728
- "size": null,
729
- "type": "closed-source",
730
- "license": null,
731
- "creation_date": 1754524800000,
732
- "tasks": [
733
  "translation_from",
734
  "translation_to",
735
  "classification",
@@ -740,16 +740,16 @@
740
  ]
741
  },
742
  {
743
- "id": "opengvlab/internvl3-14b",
744
- "name": "InternVL3 14B",
745
- "provider_name": "OpenGVLab",
746
- "cost": 0.4,
747
- "hf_id": "OpenGVLab/InternVL3-14B",
748
- "size": 15117256704.0,
749
- "type": "open-source",
750
- "license": "Apache 2.0",
751
- "creation_date": 1744243200000,
752
- "tasks": [
753
  "translation_from",
754
  "translation_to",
755
  "classification",
@@ -760,16 +760,16 @@
760
  ]
761
  },
762
  {
763
- "id": "qwen/qwen3-235b-a22b",
764
- "name": "Qwen3 235B A22B",
765
- "provider_name": "Qwen",
766
- "cost": 0.0,
767
- "hf_id": "Qwen/Qwen3-235B-A22B",
768
- "size": 235093634560.0,
769
- "type": "open-source",
770
- "license": "Apache 2.0",
771
- "creation_date": 1745712000000,
772
- "tasks": [
773
  "translation_from",
774
  "translation_to",
775
  "classification",
@@ -780,16 +780,16 @@
780
  ]
781
  },
782
  {
783
- "id": "qwen/qwen3-30b-a3b",
784
- "name": "Qwen3 30B A3B",
785
- "provider_name": "Qwen",
786
- "cost": 0.0,
787
- "hf_id": "Qwen/Qwen3-30B-A3B",
788
- "size": 30532122624.0,
789
- "type": "open-source",
790
- "license": "Apache 2.0",
791
- "creation_date": 1745712000000,
792
- "tasks": [
793
  "translation_from",
794
  "translation_to",
795
  "classification",
@@ -800,16 +800,16 @@
800
  ]
801
  },
802
  {
803
- "id": "qwen/qwen3-32b",
804
- "name": "Qwen3 32B",
805
- "provider_name": "Qwen",
806
- "cost": 0.07,
807
- "hf_id": "Qwen/Qwen3-32B",
808
- "size": 32762123264.0,
809
- "type": "open-source",
810
- "license": "Apache 2.0",
811
- "creation_date": 1745712000000,
812
- "tasks": [
813
  "translation_from",
814
  "translation_to",
815
  "classification",
@@ -820,16 +820,16 @@
820
  ]
821
  },
822
  {
823
- "id": "qwen/qwq-32b",
824
- "name": "QwQ 32B",
825
- "provider_name": "Qwen",
826
- "cost": 0.0,
827
- "hf_id": "Qwen/QwQ-32B",
828
- "size": 32763876352.0,
829
- "type": "open-source",
830
- "license": "Apache 2.0",
831
- "creation_date": 1741132800000,
832
- "tasks": [
833
  "translation_from",
834
  "translation_to",
835
  "classification",
@@ -840,16 +840,16 @@
840
  ]
841
  },
842
  {
843
- "id": "switchpoint/router",
844
- "name": "Switchpoint Router",
845
- "provider_name": "Switchpoint Router",
846
- "cost": 3.4,
847
- "hf_id": null,
848
- "size": null,
849
- "type": "closed-source",
850
- "license": null,
851
- "creation_date": 1752192000000,
852
- "tasks": [
853
  "translation_from",
854
  "translation_to",
855
  "classification",
@@ -860,16 +860,16 @@
860
  ]
861
  },
862
  {
863
- "id": "thedrummer/anubis-pro-105b-v1",
864
- "name": "Anubis Pro 105B V1",
865
- "provider_name": "TheDrummer",
866
- "cost": 1.0,
867
- "hf_id": "TheDrummer/Anubis-Pro-105B-v1",
868
- "size": 104779882496.0,
869
- "type": "open-source",
870
- "license": "Other",
871
- "creation_date": 1738454400000,
872
- "tasks": [
873
  "translation_from",
874
  "translation_to",
875
  "classification",
@@ -880,16 +880,16 @@
880
  ]
881
  },
882
  {
883
- "id": "thedrummer/skyfall-36b-v2",
884
- "name": "Skyfall 36B V2",
885
- "provider_name": "TheDrummer",
886
- "cost": 0.19,
887
- "hf_id": "TheDrummer/Skyfall-36B-v2",
888
- "size": 36910535680.0,
889
- "type": "open-source",
890
- "license": "Other",
891
- "creation_date": 1738540800000,
892
- "tasks": [
893
  "translation_from",
894
  "translation_to",
895
  "classification",
@@ -900,16 +900,16 @@
900
  ]
901
  },
902
  {
903
- "id": "tngtech/deepseek-r1t-chimera",
904
- "name": "DeepSeek R1T Chimera",
905
- "provider_name": "TNG",
906
- "cost": 0.0,
907
- "hf_id": "tngtech/DeepSeek-R1T-Chimera",
908
- "size": 684531386000.0,
909
- "type": "open-source",
910
- "license": "Mit",
911
- "creation_date": 1745625600000,
912
- "tasks": [
913
  "translation_from",
914
  "translation_to",
915
  "classification",
@@ -920,16 +920,16 @@
920
  ]
921
  },
922
  {
923
- "id": "tngtech/deepseek-r1t2-chimera",
924
- "name": "DeepSeek R1T2 Chimera",
925
- "provider_name": "TNG",
926
- "cost": 0.0,
927
- "hf_id": "tngtech/DeepSeek-TNG-R1T2-Chimera",
928
- "size": 684531386000.0,
929
- "type": "open-source",
930
- "license": "Mit",
931
- "creation_date": 1751414400000,
932
- "tasks": [
933
  "translation_from",
934
  "translation_to",
935
  "classification",
@@ -940,16 +940,16 @@
940
  ]
941
  },
942
  {
943
- "id": "x-ai/grok-2-1212",
944
- "name": "Grok 2 1212",
945
- "provider_name": "xAI",
946
- "cost": 10.0,
947
- "hf_id": null,
948
- "size": null,
949
- "type": "closed-source",
950
- "license": null,
951
- "creation_date": 1734220800000,
952
- "tasks": [
953
  "translation_from",
954
  "translation_to",
955
  "classification",
@@ -960,29 +960,38 @@
960
  ]
961
  },
962
  {
963
- "id": "google/translate-v2",
964
- "name": "Google Translate",
965
- "provider_name": "Google",
966
- "cost": 20.0,
967
- "hf_id": null,
968
- "size": null,
969
- "type": "closed-source",
970
- "license": null,
971
- "creation_date": null,
972
- "tasks": [
973
  "translation_from",
974
- "translation_to"
 
 
 
 
 
975
  ]
976
  },
977
  {
978
- "id": "moonshotai/kimi-k2",
979
- "name": "Kimi K2",
980
- "provider_name": "Moonshot AI",
981
- "size": null,
982
- "type": "closed-source",
983
- "cost": 0.6,
984
- "hf_id": null,
985
- "creation_date": null,
986
- "license": null
 
 
 
 
987
  }
988
  ]
 
1
  [
2
  {
3
+ "id":"ai21\/jamba-large-1.7",
4
+ "name":"Jamba Large 1.7",
5
+ "provider_name":"AI21",
6
+ "cost":8.0,
7
+ "hf_id":"ai21labs\/AI21-Jamba-Large-1.7",
8
+ "size":398555145696.0,
9
+ "type":"open-source",
10
+ "license":"Other",
11
+ "creation_date":1751414400000,
12
+ "tasks":[
13
  "translation_from",
14
  "translation_to",
15
  "classification",
 
20
  ]
21
  },
22
  {
23
+ "id":"amazon\/nova-micro-v1",
24
+ "name":"Nova Micro 1.0",
25
+ "provider_name":"Amazon",
26
+ "cost":0.14,
27
+ "hf_id":null,
28
+ "size":null,
29
+ "type":"closed-source",
30
+ "license":null,
31
+ "creation_date":1733356800000,
32
+ "tasks":[
33
  "translation_from",
34
  "translation_to",
35
  "classification",
 
40
  ]
41
  },
42
  {
43
+ "id":"anthracite-org\/magnum-v4-72b",
44
+ "name":"Magnum v4 72B",
45
+ "provider_name":"Magnum v4 72B",
46
+ "cost":5.0,
47
+ "hf_id":"anthracite-org\/magnum-v4-72b",
48
+ "size":72706203648.0,
49
+ "type":"open-source",
50
+ "license":"Apache 2.0",
51
+ "creation_date":1726790400000,
52
+ "tasks":[
53
  "translation_from",
54
  "translation_to",
55
  "classification",
 
60
  ]
61
  },
62
  {
63
+ "id":"anthropic\/claude-3.7-sonnet",
64
+ "name":"Claude 3.7 Sonnet",
65
+ "provider_name":"Anthropic",
66
+ "cost":15.0,
67
+ "hf_id":null,
68
+ "size":null,
69
+ "type":"closed-source",
70
+ "license":null,
71
+ "creation_date":1740355200000,
72
+ "tasks":[
73
  "translation_from",
74
  "translation_to",
75
  "classification",
 
80
  ]
81
  },
82
  {
83
+ "id":"anthropic\/claude-sonnet-4",
84
+ "name":"Claude Sonnet 4",
85
+ "provider_name":"Anthropic",
86
+ "cost":15.0,
87
+ "hf_id":null,
88
+ "size":null,
89
+ "type":"closed-source",
90
+ "license":null,
91
+ "creation_date":1747872000000,
92
+ "tasks":[
93
  "translation_from",
94
  "translation_to",
95
  "classification",
 
100
  ]
101
  },
102
  {
103
+ "id":"arcee-ai\/virtuoso-large",
104
+ "name":"Virtuoso Large",
105
+ "provider_name":"Arcee AI",
106
+ "cost":1.2,
107
+ "hf_id":"arcee-ai\/Virtuoso-Large",
108
+ "size":72706203648.0,
109
+ "type":"open-source",
110
+ "license":"Other",
111
+ "creation_date":1749427200000,
112
+ "tasks":[
113
  "translation_from",
114
  "translation_to",
115
  "classification",
 
120
  ]
121
  },
122
  {
123
+ "id":"arliai\/qwq-32b-arliai-rpr-v1",
124
+ "name":"QwQ 32B RpR v1",
125
+ "provider_name":"ArliAI",
126
+ "cost":0.0,
127
+ "hf_id":"ArliAI\/QwQ-32B-ArliAI-RpR-v1",
128
+ "size":32763876352.0,
129
+ "type":"open-source",
130
+ "license":"Apache 2.0",
131
+ "creation_date":1743984000000,
132
+ "tasks":[
133
  "translation_from",
134
  "translation_to",
135
  "classification",
 
140
  ]
141
  },
142
  {
143
+ "id":"baidu\/ernie-4.5-300b-a47b",
144
+ "name":"ERNIE 4.5 300B A47B ",
145
+ "provider_name":"Baidu",
146
+ "cost":1.1,
147
+ "hf_id":"baidu\/ERNIE-4.5-300B-A47B-PT",
148
+ "size":300474051776.0,
149
+ "type":"open-source",
150
+ "license":"Apache 2.0",
151
+ "creation_date":1751068800000,
152
+ "tasks":[
153
  "translation_from",
154
  "translation_to",
155
  "classification",
 
160
  ]
161
  },
162
  {
163
+ "id":"deepseek\/deepseek-chat",
164
+ "name":"DeepSeek V3",
165
+ "provider_name":"DeepSeek",
166
+ "cost":0.8,
167
+ "hf_id":"deepseek-ai\/DeepSeek-V3",
168
+ "size":684531386000.0,
169
+ "type":"open-source",
170
+ "license":"",
171
+ "creation_date":1735084800000,
172
+ "tasks":[
173
  "translation_from",
174
  "translation_to",
175
  "classification",
 
180
  ]
181
  },
182
  {
183
+ "id":"deepseek\/deepseek-chat-v3-0324",
184
+ "name":"DeepSeek V3 0324",
185
+ "provider_name":"DeepSeek",
186
+ "cost":0.0,
187
+ "hf_id":"deepseek-ai\/DeepSeek-V3-0324",
188
+ "size":684531386000.0,
189
+ "type":"open-source",
190
+ "license":"Mit",
191
+ "creation_date":1742774400000,
192
+ "tasks":[
193
  "translation_from",
194
  "translation_to",
195
  "classification",
 
200
  ]
201
  },
202
  {
203
+ "id":"deepseek\/deepseek-chat-v3.1",
204
+ "name":"DeepSeek V3.1",
205
+ "provider_name":"DeepSeek",
206
+ "cost":0.0,
207
+ "hf_id":"deepseek-ai\/DeepSeek-V3.1",
208
+ "size":684531386000.0,
209
+ "type":"open-source",
210
+ "license":"Mit",
211
+ "creation_date":1755734400000,
212
+ "tasks":[
213
  "translation_from",
214
  "translation_to",
215
  "classification",
 
220
  ]
221
  },
222
  {
223
+ "id":"eleutherai\/llemma_7b",
224
+ "name":"Llemma 7b",
225
+ "provider_name":"EleutherAI",
226
+ "cost":1.2,
227
+ "hf_id":"EleutherAI\/llemma_7b",
228
+ "size":null,
229
+ "type":"open-source",
230
+ "license":"Llama2",
231
+ "creation_date":1694476800000,
232
+ "tasks":[
233
  "translation_from",
234
  "translation_to",
235
  "classification",
 
240
  ]
241
  },
242
  {
243
+ "id":"google\/gemini-2.0-flash-001",
244
+ "name":"Gemini 2.0 Flash",
245
+ "provider_name":"Google",
246
+ "cost":0.4,
247
+ "hf_id":null,
248
+ "size":null,
249
+ "type":"closed-source",
250
+ "license":null,
251
+ "creation_date":1738713600000,
252
+ "tasks":[
253
  "translation_from",
254
  "translation_to",
255
  "classification",
 
260
  ]
261
  },
262
  {
263
+ "id":"google\/gemini-2.0-flash-lite-001",
264
+ "name":"Gemini 2.0 Flash Lite",
265
+ "provider_name":"Google",
266
+ "cost":0.3,
267
+ "hf_id":null,
268
+ "size":null,
269
+ "type":"closed-source",
270
+ "license":null,
271
+ "creation_date":1740441600000,
272
+ "tasks":[
273
  "translation_from",
274
  "translation_to",
275
  "classification",
 
280
  ]
281
  },
282
  {
283
+ "id":"google\/gemini-2.5-flash",
284
+ "name":"Gemini 2.5 Flash",
285
+ "provider_name":"Google",
286
+ "cost":2.5,
287
+ "hf_id":null,
288
+ "size":null,
289
+ "type":"closed-source",
290
+ "license":null,
291
+ "creation_date":1750118400000,
292
+ "tasks":[
293
  "translation_from",
294
  "translation_to",
295
  "classification",
 
300
  ]
301
  },
302
  {
303
+ "id":"google\/gemma-2-9b-it",
304
+ "name":"Gemma 2 9B",
305
+ "provider_name":"Google",
306
+ "cost":0.0,
307
+ "hf_id":"google\/gemma-2-9b-it",
308
+ "size":9241705984.0,
309
+ "type":"open-source",
310
+ "license":"Gemma",
311
+ "creation_date":1719187200000,
312
+ "tasks":[
313
  "translation_from",
314
  "translation_to",
315
  "classification",
 
320
  ]
321
  },
322
  {
323
+ "id":"google\/gemma-3-12b-it",
324
+ "name":"Gemma 3 12B",
325
+ "provider_name":"Google",
326
+ "cost":0.0,
327
+ "hf_id":"google\/gemma-3-12b-it",
328
+ "size":12187325040.0,
329
+ "type":"open-source",
330
+ "license":"Gemma",
331
+ "creation_date":1740787200000,
332
+ "tasks":[
333
  "translation_from",
334
  "translation_to",
335
  "classification",
 
340
  ]
341
  },
342
  {
343
+ "id":"google\/gemma-3-27b-it",
344
+ "name":"Gemma 3 27B",
345
+ "provider_name":"Google",
346
+ "cost":0.0,
347
+ "hf_id":"google\/gemma-3-27b-it",
348
+ "size":27432406640.0,
349
+ "type":"open-source",
350
+ "license":"Gemma",
351
+ "creation_date":1740787200000,
352
+ "tasks":[
353
  "translation_from",
354
  "translation_to",
355
  "classification",
 
360
  ]
361
  },
362
  {
363
+ "id":"google\/gemma-3-4b-it",
364
+ "name":"Gemma 3 4B",
365
+ "provider_name":"Google",
366
+ "cost":0.0,
367
+ "hf_id":"google\/gemma-3-4b-it",
368
+ "size":4300079472.0,
369
+ "type":"open-source",
370
+ "license":"Gemma",
371
+ "creation_date":1740009600000,
372
+ "tasks":[
373
  "translation_from",
374
  "translation_to",
375
  "classification",
 
380
  ]
381
  },
382
  {
383
+ "id":"liquid\/lfm-7b",
384
+ "name":"LFM 7B",
385
+ "provider_name":"Liquid",
386
+ "cost":0.01,
387
+ "hf_id":null,
388
+ "size":null,
389
+ "type":"closed-source",
390
+ "license":null,
391
+ "creation_date":1737763200000,
392
+ "tasks":[
393
  "translation_from",
394
  "translation_to",
395
  "classification",
 
400
  ]
401
  },
402
  {
403
+ "id":"meta-llama\/llama-3-70b-instruct",
404
+ "name":"Llama 3 70B Instruct",
405
+ "provider_name":"Meta",
406
+ "cost":0.4,
407
+ "hf_id":"meta-llama\/Meta-Llama-3-70B-Instruct",
408
+ "size":70553706496.0,
409
+ "type":"open-source",
410
+ "license":"Llama3",
411
+ "creation_date":1713312000000,
412
+ "tasks":[
413
  "translation_from",
414
  "translation_to",
415
  "classification",
 
420
  ]
421
  },
422
  {
423
+ "id":"meta-llama\/llama-3.1-70b-instruct",
424
+ "name":"Llama 3.1 70B Instruct",
425
+ "provider_name":"Meta",
426
+ "cost":0.28,
427
+ "hf_id":"meta-llama\/Llama-3.1-70B-Instruct",
428
+ "size":70553706496.0,
429
+ "type":"open-source",
430
+ "license":"Llama3.1",
431
+ "creation_date":1721088000000,
432
+ "tasks":[
433
  "translation_from",
434
  "translation_to",
435
  "classification",
 
440
  ]
441
  },
442
  {
443
+ "id":"meta-llama\/llama-3.3-70b-instruct",
444
+ "name":"Llama 3.3 70B Instruct",
445
+ "provider_name":"Meta",
446
+ "cost":0.0,
447
+ "hf_id":"meta-llama\/Llama-3.3-70B-Instruct",
448
+ "size":70553706496.0,
449
+ "type":"open-source",
450
+ "license":"Llama3.3",
451
+ "creation_date":1732579200000,
452
+ "tasks":[
453
  "translation_from",
454
  "translation_to",
455
  "classification",
 
460
  ]
461
  },
462
  {
463
+ "id":"meta-llama\/llama-4-maverick",
464
+ "name":"Llama 4 Maverick",
465
+ "provider_name":"Meta",
466
+ "cost":0.0,
467
+ "hf_id":"meta-llama\/Llama-4-Maverick-17B-128E-Instruct",
468
+ "size":401583781376.0,
469
+ "type":"open-source",
470
+ "license":"Other",
471
+ "creation_date":1743465600000,
472
+ "tasks":[
473
  "translation_from",
474
  "translation_to",
475
  "classification",
 
480
  ]
481
  },
482
  {
483
+ "id":"microsoft\/phi-4",
484
+ "name":"Phi 4",
485
+ "provider_name":"Microsoft",
486
+ "cost":0.14,
487
+ "hf_id":"microsoft\/phi-4",
488
+ "size":14659507200.0,
489
+ "type":"open-source",
490
+ "license":"Mit",
491
+ "creation_date":1733875200000,
492
+ "tasks":[
493
  "translation_from",
494
  "translation_to",
495
  "classification",
 
500
  ]
501
  },
502
  {
503
+ "id":"microsoft\/phi-4-multimodal-instruct",
504
+ "name":"Phi 4 Multimodal Instruct",
505
+ "provider_name":"Microsoft",
506
+ "cost":0.1,
507
+ "hf_id":"microsoft\/Phi-4-multimodal-instruct",
508
+ "size":5574460384.0,
509
+ "type":"open-source",
510
+ "license":"Mit",
511
+ "creation_date":1740355200000,
512
+ "tasks":[
513
  "translation_from",
514
  "translation_to",
515
  "classification",
 
520
  ]
521
  },
522
  {
523
+ "id":"mistralai\/mistral-nemo",
524
+ "name":"Mistral Nemo",
525
+ "provider_name":"Mistral",
526
+ "cost":0.0,
527
+ "hf_id":"mistralai\/Mistral-Nemo-Instruct-2407",
528
+ "size":12247782400.0,
529
+ "type":"open-source",
530
+ "license":"Apache 2.0",
531
+ "creation_date":1721174400000,
532
+ "tasks":[
533
  "translation_from",
534
  "translation_to",
535
  "classification",
 
540
  ]
541
  },
542
  {
543
+ "id":"mistralai\/mistral-saba",
544
+ "name":"Saba",
545
+ "provider_name":"Mistral",
546
+ "cost":0.6,
547
+ "hf_id":null,
548
+ "size":null,
549
+ "type":"closed-source",
550
+ "license":null,
551
+ "creation_date":1739750400000,
552
+ "tasks":[
553
  "translation_from",
554
  "translation_to",
555
  "classification",
 
560
  ]
561
  },
562
  {
563
+ "id":"mistralai\/mistral-small-3.1-24b-instruct",
564
+ "name":"Mistral Small 3.1 24B",
565
+ "provider_name":"Mistral",
566
+ "cost":0.0,
567
+ "hf_id":"mistralai\/Mistral-Small-3.1-24B-Instruct-2503",
568
+ "size":24011361280.0,
569
+ "type":"open-source",
570
+ "license":"Apache 2.0",
571
+ "creation_date":1741651200000,
572
+ "tasks":[
573
  "translation_from",
574
  "translation_to",
575
  "classification",
 
580
  ]
581
  },
582
  {
583
+ "id":"mistralai\/mixtral-8x7b-instruct",
584
+ "name":"Mixtral 8x7B Instruct",
585
+ "provider_name":"Mistral",
586
+ "cost":0.24,
587
+ "hf_id":"mistralai\/Mixtral-8x7B-Instruct-v0.1",
588
+ "size":46702792704.0,
589
+ "type":"open-source",
590
+ "license":"Apache 2.0",
591
+ "creation_date":1702166400000,
592
+ "tasks":[
593
  "translation_from",
594
  "translation_to",
595
  "classification",
 
600
  ]
601
  },
602
  {
603
+ "id":"moonshotai\/kimi-k2",
604
+ "name":"Kimi K2",
605
+ "provider_name":"MoonshotAI",
606
+ "cost":0.0,
607
+ "hf_id":"moonshotai\/Kimi-K2-Instruct",
608
+ "size":null,
609
+ "type":"open-source",
610
+ "license":"Other",
611
+ "creation_date":1752192000000,
612
+ "tasks":[
613
  "translation_from",
614
  "translation_to",
615
  "classification",
 
620
  ]
621
  },
622
  {
623
+ "id":"nousresearch\/deephermes-3-llama-3-8b-preview",
624
+ "name":"DeepHermes 3 Llama 3 8B Preview",
625
+ "provider_name":"Nous",
626
+ "cost":0.0,
627
+ "hf_id":"NousResearch\/DeepHermes-3-Llama-3-8B-Preview",
628
+ "size":8030261248.0,
629
+ "type":"open-source",
630
+ "license":"Llama3",
631
+ "creation_date":1739318400000,
632
+ "tasks":[
633
  "translation_from",
634
  "translation_to",
635
  "classification",
 
640
  ]
641
  },
642
  {
643
+ "id":"openai\/gpt-4.1",
644
+ "name":"GPT-4.1",
645
+ "provider_name":"OpenAI",
646
+ "cost":8.0,
647
+ "hf_id":null,
648
+ "size":null,
649
+ "type":"closed-source",
650
+ "license":null,
651
+ "creation_date":1744588800000,
652
+ "tasks":[
653
  "translation_from",
654
  "translation_to",
655
  "classification",
 
660
  ]
661
  },
662
  {
663
+ "id":"openai\/gpt-4.1-mini",
664
+ "name":"GPT-4.1 Mini",
665
+ "provider_name":"OpenAI",
666
+ "cost":1.6,
667
+ "hf_id":null,
668
+ "size":null,
669
+ "type":"closed-source",
670
+ "license":null,
671
+ "creation_date":1744588800000,
672
+ "tasks":[
673
  "translation_from",
674
  "translation_to",
675
  "classification",
 
680
  ]
681
  },
682
  {
683
+ "id":"openai\/gpt-4.1-nano",
684
+ "name":"GPT-4.1 Nano",
685
+ "provider_name":"OpenAI",
686
+ "cost":0.4,
687
+ "hf_id":null,
688
+ "size":null,
689
+ "type":"closed-source",
690
+ "license":null,
691
+ "creation_date":1744588800000,
692
+ "tasks":[
693
  "translation_from",
694
  "translation_to",
695
  "classification",
 
700
  ]
701
  },
702
  {
703
+ "id":"openai\/gpt-4o-2024-11-20",
704
+ "name":"GPT-4o (2024-11-20)",
705
+ "provider_name":"OpenAI",
706
+ "cost":10.0,
707
+ "hf_id":null,
708
+ "size":null,
709
+ "type":"closed-source",
710
+ "license":null,
711
+ "creation_date":1732060800000,
712
+ "tasks":[
713
  "translation_from",
714
  "translation_to",
715
  "classification",
 
720
  ]
721
  },
722
  {
723
+ "id":"openai\/gpt-4o-mini",
724
+ "name":"GPT-4o-mini",
725
+ "provider_name":"OpenAI",
726
+ "cost":0.6,
727
+ "hf_id":null,
728
+ "size":null,
729
+ "type":"closed-source",
730
+ "license":null,
731
+ "creation_date":1721260800000,
732
+ "tasks":[
733
  "translation_from",
734
  "translation_to",
735
  "classification",
 
740
  ]
741
  },
742
  {
743
+ "id":"openai\/gpt-5",
744
+ "name":"GPT-5",
745
+ "provider_name":"OpenAI",
746
+ "cost":10.0,
747
+ "hf_id":null,
748
+ "size":null,
749
+ "type":"closed-source",
750
+ "license":null,
751
+ "creation_date":1754524800000,
752
+ "tasks":[
753
  "translation_from",
754
  "translation_to",
755
  "classification",
 
760
  ]
761
  },
762
  {
763
+ "id":"openai\/gpt-5-nano",
764
+ "name":"GPT-5 Nano",
765
+ "provider_name":"OpenAI",
766
+ "cost":0.4,
767
+ "hf_id":null,
768
+ "size":null,
769
+ "type":"closed-source",
770
+ "license":null,
771
+ "creation_date":1754524800000,
772
+ "tasks":[
773
  "translation_from",
774
  "translation_to",
775
  "classification",
 
780
  ]
781
  },
782
  {
783
+ "id":"openai\/gpt-oss-120b",
784
+ "name":"gpt-oss-120b",
785
+ "provider_name":"OpenAI",
786
+ "cost":0.0,
787
+ "hf_id":"openai\/gpt-oss-120b",
788
+ "size":120412337472.0,
789
+ "type":"open-source",
790
+ "license":"Apache 2.0",
791
+ "creation_date":1754265600000,
792
+ "tasks":[
793
  "translation_from",
794
  "translation_to",
795
  "classification",
 
800
  ]
801
  },
802
  {
803
+ "id":"qwen\/qwen-2.5-72b-instruct",
804
+ "name":"Qwen2.5 72B Instruct",
805
+ "provider_name":"Qwen2.5 72B Instruct (free)",
806
+ "cost":0.0,
807
+ "hf_id":"Qwen\/Qwen2.5-72B-Instruct",
808
+ "size":72706203648.0,
809
+ "type":"open-source",
810
+ "license":"Other",
811
+ "creation_date":1726444800000,
812
+ "tasks":[
813
  "translation_from",
814
  "translation_to",
815
  "classification",
 
820
  ]
821
  },
822
  {
823
+ "id":"qwen\/qwen-2.5-coder-32b-instruct",
824
+ "name":"Qwen2.5 Coder 32B Instruct",
825
+ "provider_name":"Qwen2.5 Coder 32B Instruct (free)",
826
+ "cost":0.0,
827
+ "hf_id":"Qwen\/Qwen2.5-Coder-32B-Instruct",
828
+ "size":32763876352.0,
829
+ "type":"open-source",
830
+ "license":"Apache 2.0",
831
+ "creation_date":1730851200000,
832
+ "tasks":[
833
  "translation_from",
834
  "translation_to",
835
  "classification",
 
840
  ]
841
  },
842
  {
843
+ "id":"qwen\/qwen3-235b-a22b",
844
+ "name":"Qwen3 235B A22B",
845
+ "provider_name":"Qwen",
846
+ "cost":0.0,
847
+ "hf_id":"Qwen\/Qwen3-235B-A22B",
848
+ "size":235093634560.0,
849
+ "type":"open-source",
850
+ "license":"Apache 2.0",
851
+ "creation_date":1745712000000,
852
+ "tasks":[
853
  "translation_from",
854
  "translation_to",
855
  "classification",
 
860
  ]
861
  },
862
  {
863
+ "id":"qwen\/qwen3-30b-a3b",
864
+ "name":"Qwen3 30B A3B",
865
+ "provider_name":"Qwen",
866
+ "cost":0.0,
867
+ "hf_id":"Qwen\/Qwen3-30B-A3B",
868
+ "size":30532122624.0,
869
+ "type":"open-source",
870
+ "license":"Apache 2.0",
871
+ "creation_date":1745712000000,
872
+ "tasks":[
873
  "translation_from",
874
  "translation_to",
875
  "classification",
 
880
  ]
881
  },
882
  {
883
+ "id":"qwen\/qwen3-32b",
884
+ "name":"Qwen3 32B",
885
+ "provider_name":"Qwen",
886
+ "cost":0.07,
887
+ "hf_id":"Qwen\/Qwen3-32B",
888
+ "size":32762123264.0,
889
+ "type":"open-source",
890
+ "license":"Apache 2.0",
891
+ "creation_date":1745712000000,
892
+ "tasks":[
893
  "translation_from",
894
  "translation_to",
895
  "classification",
 
900
  ]
901
  },
902
  {
903
+ "id":"tencent\/hunyuan-a13b-instruct",
904
+ "name":"Hunyuan A13B Instruct",
905
+ "provider_name":"Tencent",
906
+ "cost":0.0,
907
+ "hf_id":"tencent\/Hunyuan-A13B-Instruct",
908
+ "size":80393183232.0,
909
+ "type":"open-source",
910
+ "license":"Other",
911
+ "creation_date":1750809600000,
912
+ "tasks":[
913
  "translation_from",
914
  "translation_to",
915
  "classification",
 
920
  ]
921
  },
922
  {
923
+ "id":"undi95\/remm-slerp-l2-13b",
924
+ "name":"ReMM SLERP 13B",
925
+ "provider_name":"ReMM SLERP 13B",
926
+ "cost":0.65,
927
+ "hf_id":"Undi95\/ReMM-SLERP-L2-13B",
928
+ "size":null,
929
+ "type":"open-source",
930
+ "license":"Cc By Nc 4.0",
931
+ "creation_date":1693785600000,
932
+ "tasks":[
933
  "translation_from",
934
  "translation_to",
935
  "classification",
 
940
  ]
941
  },
942
  {
943
+ "id":"x-ai\/grok-4",
944
+ "name":"Grok 4",
945
+ "provider_name":"xAI",
946
+ "cost":15.0,
947
+ "hf_id":null,
948
+ "size":null,
949
+ "type":"closed-source",
950
+ "license":null,
951
+ "creation_date":1752019200000,
952
+ "tasks":[
953
  "translation_from",
954
  "translation_to",
955
  "classification",
 
960
  ]
961
  },
962
  {
963
+ "id":"z-ai\/glm-4.5v",
964
+ "name":"GLM 4.5V",
965
+ "provider_name":"Z.AI",
966
+ "cost":1.8,
967
+ "hf_id":"zai-org\/GLM-4.5V",
968
+ "size":107710933120.0,
969
+ "type":"open-source",
970
+ "license":"Mit",
971
+ "creation_date":1754784000000,
972
+ "tasks":[
973
  "translation_from",
974
+ "translation_to",
975
+ "classification",
976
+ "mmlu",
977
+ "arc",
978
+ "truthfulqa",
979
+ "mgsm"
980
  ]
981
  },
982
  {
983
+ "id":"google\/translate-v2",
984
+ "name":"Google Translate",
985
+ "provider_name":"Google",
986
+ "cost":20.0,
987
+ "hf_id":null,
988
+ "size":null,
989
+ "type":"closed-source",
990
+ "license":null,
991
+ "creation_date":null,
992
+ "tasks":[
993
+ "translation_from",
994
+ "translation_to"
995
+ ]
996
  }
997
  ]
results.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1a3f388fd054fc570366705f1b8d6cb65bd6353164482d3d2c71ccec742d6158
3
- size 57534940
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce3638aedf7fd3bd28f92814be7c10a5a8f748c5cc601ab6041be798710dff54
3
+ size 11677172