CrispStrobe commited on
Commit
7cc1131
·
1 Parent(s): af78198

feat: verbose HF validation, OCR benchmarks, and corrected model mappings

Browse files
data/benchmarks.json CHANGED
@@ -73036,5 +73036,133 @@
73036
  "mteb_retrieval": "manual",
73037
  "lb_coding": "manual"
73038
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
73039
  }
73040
  ]
 
73036
  "mteb_retrieval": "manual",
73037
  "lb_coding": "manual"
73038
  }
73039
+ },
73040
+ {
73041
+ "hf_id": "datalab-to/chandra-ocr-2",
73042
+ "name": "chandra-ocr-2",
73043
+ "ocr_avg": 85.9,
73044
+ "sources": {
73045
+ "ocr_avg": "manual"
73046
+ }
73047
+ },
73048
+ {
73049
+ "hf_id": "rednote-hilab/dots.mocr",
73050
+ "name": "dots.mocr",
73051
+ "ocr_avg": 83.9,
73052
+ "sources": {
73053
+ "ocr_avg": "manual"
73054
+ }
73055
+ },
73056
+ {
73057
+ "hf_id": "lightonai/LightOnOCR-2-1B",
73058
+ "name": "LightOnOCR-2-1B",
73059
+ "ocr_avg": 83.2,
73060
+ "sources": {
73061
+ "ocr_avg": "manual"
73062
+ }
73063
+ },
73064
+ {
73065
+ "hf_id": "datalab-to/chandra",
73066
+ "name": "chandra",
73067
+ "ocr_avg": 83.1,
73068
+ "sources": {
73069
+ "ocr_avg": "manual"
73070
+ }
73071
+ },
73072
+ {
73073
+ "hf_id": "infly/Infinity-Parser-7B",
73074
+ "name": "Infinity-Parser-7B",
73075
+ "ocr_avg": 82.5,
73076
+ "sources": {
73077
+ "ocr_avg": "manual"
73078
+ }
73079
+ },
73080
+ {
73081
+ "hf_id": "allenai/olmOCR-2-7B-1025-FP8",
73082
+ "name": "olmOCR-2-7B-1025-FP8",
73083
+ "ocr_avg": 82.4,
73084
+ "sources": {
73085
+ "ocr_avg": "manual"
73086
+ }
73087
+ },
73088
+ {
73089
+ "hf_id": "PaddlePaddle/PaddleOCR-VL",
73090
+ "name": "PaddleOCR-VL",
73091
+ "ocr_avg": 80,
73092
+ "sources": {
73093
+ "ocr_avg": "manual"
73094
+ }
73095
+ },
73096
+ {
73097
+ "hf_id": "baidu/Qianfan-OCR",
73098
+ "name": "Qianfan-OCR",
73099
+ "ocr_avg": 79.8,
73100
+ "sources": {
73101
+ "ocr_avg": "manual"
73102
+ }
73103
+ },
73104
+ {
73105
+ "hf_id": "rednote-hilab/dots.ocr",
73106
+ "name": "dots.ocr",
73107
+ "ocr_avg": 79.1,
73108
+ "sources": {
73109
+ "ocr_avg": "manual"
73110
+ }
73111
+ },
73112
+ {
73113
+ "hf_id": "deepseek-ai/DeepSeek-OCR-2",
73114
+ "name": "DeepSeek-OCR-2",
73115
+ "ocr_avg": 76.3,
73116
+ "sources": {
73117
+ "ocr_avg": "manual"
73118
+ }
73119
+ },
73120
+ {
73121
+ "hf_id": "lightonai/LightOnOCR-1B-1025",
73122
+ "name": "LightOnOCR-1B-1025",
73123
+ "ocr_avg": 76.1,
73124
+ "sources": {
73125
+ "ocr_avg": "manual"
73126
+ }
73127
+ },
73128
+ {
73129
+ "hf_id": "deepseek-ai/DeepSeek-OCR",
73130
+ "name": "DeepSeek-OCR",
73131
+ "ocr_avg": 75.7,
73132
+ "sources": {
73133
+ "ocr_avg": "manual"
73134
+ }
73135
+ },
73136
+ {
73137
+ "hf_id": "opendatalab/MinerU2.5-2509-1.2B",
73138
+ "name": "MinerU2.5-2509-1.2B",
73139
+ "ocr_avg": 75.2,
73140
+ "sources": {
73141
+ "ocr_avg": "manual"
73142
+ }
73143
+ },
73144
+ {
73145
+ "hf_id": "zai-org/GLM-OCR",
73146
+ "name": "GLM-OCR",
73147
+ "ocr_avg": 75.2,
73148
+ "sources": {
73149
+ "ocr_avg": "manual"
73150
+ }
73151
+ },
73152
+ {
73153
+ "hf_id": "FireRedTeam/FireRed-OCR",
73154
+ "name": "FireRed-OCR",
73155
+ "ocr_avg": 70.2,
73156
+ "sources": {
73157
+ "ocr_avg": "manual"
73158
+ }
73159
+ },
73160
+ {
73161
+ "hf_id": "nanonets/Nanonets-OCR2-3B",
73162
+ "name": "Nanonets-OCR2-3B",
73163
+ "ocr_avg": 69.5,
73164
+ "sources": {
73165
+ "ocr_avg": "manual"
73166
+ }
73167
  }
73168
  ]
data/providers.json CHANGED
@@ -1088,6 +1088,16 @@
1088
  "gdpr_compliant": true,
1089
  "eu_endpoints": true,
1090
  "models": [
 
 
 
 
 
 
 
 
 
 
1091
  {
1092
  "name": "novita/meta-llama/llama-3.2-1b-instruct",
1093
  "type": "chat",
@@ -1099,16 +1109,6 @@
1099
  "hf_private": false,
1100
  "hf_id": "meta-llama/Llama-3.2-1B-Instruct"
1101
  },
1102
- {
1103
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
1104
- "type": "chat",
1105
- "input_price_per_1m": 0.02,
1106
- "output_price_per_1m": 0.05,
1107
- "currency": "USD",
1108
- "context_window": 131072,
1109
- "size_b": 8,
1110
- "hf_private": false
1111
- },
1112
  {
1113
  "name": "openai/gpt-5-nano",
1114
  "type": "vision",
@@ -1148,31 +1148,32 @@
1148
  "hf_id": "meta-llama/Meta-Llama-3-8B-Instruct"
1149
  },
1150
  {
1151
- "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1152
  "type": "chat",
1153
  "input_price_per_1m": 0.05,
1154
- "output_price_per_1m": 0.05,
1155
  "currency": "USD",
1156
- "context_window": 8192,
1157
- "size_b": 8,
1158
- "hf_private": false
 
 
1159
  },
1160
  {
1161
- "name": "novita/meta-llama/llama-3.1-8b-instruct",
1162
- "type": "chat",
1163
  "input_price_per_1m": 0.05,
1164
- "output_price_per_1m": 0.05,
1165
  "currency": "USD",
1166
- "context_window": 16384,
1167
- "size_b": 8,
1168
  "capabilities": [
1169
- "tools"
 
1170
  ],
1171
- "hf_private": false,
1172
- "hf_id": "meta-llama/Meta-Llama-3.1-8B-Instruct"
1173
  },
1174
  {
1175
- "name": "novita/sao10k/l3-8b-lunaris",
1176
  "type": "chat",
1177
  "input_price_per_1m": 0.05,
1178
  "output_price_per_1m": 0.05,
@@ -1182,40 +1183,39 @@
1182
  "hf_private": false
1183
  },
1184
  {
1185
- "name": "azure/gpt-5-nano",
1186
  "type": "chat",
1187
  "input_price_per_1m": 0.05,
1188
- "output_price_per_1m": 0.4,
1189
  "currency": "USD",
1190
- "capabilities": [
1191
- "reasoning"
1192
- ],
1193
- "context_window": 200000,
1194
- "hf_private": true
1195
  },
1196
  {
1197
- "name": "openai-responses/gpt-5-nano",
1198
- "type": "vision",
1199
  "input_price_per_1m": 0.05,
1200
- "output_price_per_1m": 0.4,
1201
  "currency": "USD",
 
 
1202
  "capabilities": [
1203
- "vision",
1204
- "reasoning"
1205
  ],
1206
- "context_window": 400000,
1207
- "hf_private": true
1208
  },
1209
  {
1210
- "name": "alibaba/qwen-turbo",
1211
  "type": "chat",
1212
  "input_price_per_1m": 0.05,
1213
- "output_price_per_1m": 0.2,
1214
  "currency": "USD",
1215
- "context_window": 1000000,
1216
  "capabilities": [
1217
- "tools"
1218
  ],
 
1219
  "hf_private": true
1220
  },
1221
  {
@@ -1262,54 +1262,31 @@
1262
  "hf_private": false
1263
  },
1264
  {
1265
- "name": "groq/openai/gpt-oss-20b",
1266
  "type": "chat",
1267
  "input_price_per_1m": 0.1,
1268
- "output_price_per_1m": 0.5,
1269
  "currency": "USD",
1270
- "context_window": 131072,
1271
- "size_b": 20,
1272
  "capabilities": [
1273
  "tools",
1274
  "reasoning"
1275
  ],
1276
- "hf_id": "openai/gpt-oss-20b",
1277
  "hf_private": false
1278
  },
1279
  {
1280
- "name": "openai/gpt-4.1-nano",
1281
- "type": "vision",
1282
- "input_price_per_1m": 0.1,
1283
- "output_price_per_1m": 0.4,
1284
- "currency": "USD",
1285
- "capabilities": [
1286
- "vision"
1287
- ],
1288
- "context_window": 1047576,
1289
- "hf_private": true
1290
- },
1291
- {
1292
- "name": "azure/gpt-4.1-nano",
1293
- "type": "vision",
1294
- "input_price_per_1m": 0.1,
1295
- "output_price_per_1m": 0.4,
1296
- "currency": "USD",
1297
- "capabilities": [
1298
- "vision"
1299
- ],
1300
- "context_window": 1047576,
1301
- "hf_private": true
1302
- },
1303
- {
1304
- "name": "azure/openai-responses/gpt-4.1-nano",
1305
  "type": "vision",
1306
  "input_price_per_1m": 0.1,
1307
  "output_price_per_1m": 0.4,
1308
  "currency": "USD",
1309
  "capabilities": [
1310
- "vision"
 
1311
  ],
1312
- "context_window": 1047576,
1313
  "hf_private": true
1314
  },
1315
  {
@@ -1338,16 +1315,7 @@
1338
  "hf_private": true
1339
  },
1340
  {
1341
- "name": "mistral/mistral-small-2503",
1342
- "type": "chat",
1343
- "input_price_per_1m": 0.1,
1344
- "output_price_per_1m": 0.3,
1345
- "currency": "USD",
1346
- "context_window": 32768,
1347
- "hf_private": true
1348
- },
1349
- {
1350
- "name": "mistral/devstral-small-latest",
1351
  "type": "chat",
1352
  "input_price_per_1m": 0.1,
1353
  "output_price_per_1m": 0.3,
@@ -1361,7 +1329,7 @@
1361
  "hf_private": false
1362
  },
1363
  {
1364
- "name": "mistral/devstral-small-2507",
1365
  "type": "chat",
1366
  "input_price_per_1m": 0.1,
1367
  "output_price_per_1m": 0.3,
@@ -1374,6 +1342,15 @@
1374
  "size_b": 24,
1375
  "hf_private": false
1376
  },
 
 
 
 
 
 
 
 
 
1377
  {
1378
  "name": "openai-responses/gpt-4.1-nano",
1379
  "type": "vision",
@@ -1387,16 +1364,15 @@
1387
  "hf_private": true
1388
  },
1389
  {
1390
- "name": "vertex/gemini-2.5-flash-lite",
1391
  "type": "vision",
1392
  "input_price_per_1m": 0.1,
1393
  "output_price_per_1m": 0.4,
1394
  "currency": "USD",
1395
  "capabilities": [
1396
- "vision",
1397
- "reasoning"
1398
  ],
1399
- "context_window": 1048576,
1400
  "hf_private": true
1401
  },
1402
  {
@@ -1410,20 +1386,44 @@
1410
  "hf_private": false
1411
  },
1412
  {
1413
- "name": "deepinfra/Qwen/Qwen3-32B",
1414
  "type": "chat",
1415
  "input_price_per_1m": 0.1,
1416
- "output_price_per_1m": 0.3,
1417
  "currency": "USD",
1418
- "context_window": 40000,
1419
- "size_b": 32,
1420
  "capabilities": [
1421
  "tools",
1422
  "reasoning"
1423
  ],
1424
- "hf_id": "Qwen/Qwen3-32B",
1425
  "hf_private": false
1426
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1427
  {
1428
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
1429
  "type": "chat",
@@ -1476,46 +1476,69 @@
1476
  "hf_private": false
1477
  },
1478
  {
1479
- "name": "groq/openai/gpt-oss-120b",
1480
  "type": "chat",
1481
  "input_price_per_1m": 0.15,
1482
- "output_price_per_1m": 0.75,
1483
  "currency": "USD",
1484
- "context_window": 131072,
1485
- "size_b": 120,
1486
  "capabilities": [
1487
- "tools",
1488
  "reasoning"
1489
  ],
 
 
1490
  "hf_id": "openai/gpt-oss-120b",
1491
  "hf_private": false
1492
  },
1493
  {
1494
- "name": "openai/gpt-4o-mini",
 
 
 
 
 
 
 
 
 
 
1495
  "type": "vision",
1496
  "input_price_per_1m": 0.15,
1497
  "output_price_per_1m": 0.6,
1498
  "currency": "USD",
1499
  "capabilities": [
1500
- "vision"
 
1501
  ],
1502
- "context_window": 128000,
1503
  "hf_private": true
1504
  },
1505
  {
1506
- "name": "nebius/openai/gpt-oss-120b",
1507
- "type": "chat",
1508
  "input_price_per_1m": 0.15,
1509
  "output_price_per_1m": 0.6,
1510
  "currency": "USD",
1511
  "capabilities": [
 
1512
  "reasoning"
1513
  ],
1514
- "context_window": 131000,
1515
- "size_b": 120,
1516
- "hf_id": "openai/gpt-oss-120b",
1517
  "hf_private": false
1518
  },
 
 
 
 
 
 
 
 
 
 
 
 
1519
  {
1520
  "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1521
  "type": "chat",
@@ -1533,43 +1556,20 @@
1533
  "hf_private": false
1534
  },
1535
  {
1536
- "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1537
  "type": "chat",
1538
  "input_price_per_1m": 0.15,
1539
- "output_price_per_1m": 0.85,
1540
- "currency": "USD",
1541
- "context_window": 262144,
1542
- "size_b": 235,
1543
- "hf_private": false
1544
- },
1545
- {
1546
- "name": "mistral/mistral-small-2603",
1547
- "type": "vision",
1548
- "input_price_per_1m": 0.15,
1549
- "output_price_per_1m": 0.6,
1550
  "currency": "USD",
 
 
1551
  "capabilities": [
1552
- "vision",
1553
  "reasoning"
1554
  ],
1555
- "context_window": 256000,
1556
- "size_b": 119,
1557
- "hf_id": "mistralai/Mistral-Small-4-119B-2603",
1558
  "hf_private": false
1559
  },
1560
- {
1561
- "name": "mistral/mistral-small-latest",
1562
- "type": "vision",
1563
- "input_price_per_1m": 0.15,
1564
- "output_price_per_1m": 0.6,
1565
- "currency": "USD",
1566
- "capabilities": [
1567
- "vision",
1568
- "reasoning"
1569
- ],
1570
- "context_window": 256000,
1571
- "hf_private": true
1572
- },
1573
  {
1574
  "name": "novita/mistralai/mistral-nemo",
1575
  "type": "chat",
@@ -1595,69 +1595,73 @@
1595
  "hf_private": false
1596
  },
1597
  {
1598
- "name": "openai/gpt-5.4-nano",
1599
- "type": "vision",
1600
  "input_price_per_1m": 0.2,
1601
- "output_price_per_1m": 1.25,
1602
  "currency": "USD",
 
1603
  "capabilities": [
1604
- "vision",
1605
  "reasoning"
1606
  ],
1607
- "context_window": 400000,
1608
- "hf_private": true
 
1609
  },
1610
  {
1611
- "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1612
  "type": "chat",
1613
  "input_price_per_1m": 0.2,
1614
- "output_price_per_1m": 0.85,
1615
  "currency": "USD",
1616
- "context_window": 1048576,
1617
- "size_b": 17,
1618
  "capabilities": [
1619
- "vision",
1620
- "tools"
1621
  ],
 
1622
  "hf_private": false
1623
  },
1624
  {
1625
- "name": "novita/qwen/qwen3-235b-a22b-fp8",
1626
- "type": "chat",
1627
  "input_price_per_1m": 0.2,
1628
  "output_price_per_1m": 0.8,
1629
  "currency": "USD",
1630
- "context_window": 128000,
1631
- "size_b": 235,
1632
  "capabilities": [
1633
- "tools",
1634
- "reasoning"
1635
  ],
1636
- "hf_id": "Qwen/Qwen3-235B-A22B",
 
 
1637
  "hf_private": false
1638
  },
1639
  {
1640
- "name": "xai/grok-4-1-fast-non-reasoning",
1641
- "type": "vision",
1642
  "input_price_per_1m": 0.2,
1643
  "output_price_per_1m": 0.5,
1644
  "currency": "USD",
 
1645
  "capabilities": [
1646
- "vision"
 
 
1647
  ],
1648
- "context_window": 2000000,
1649
  "hf_private": true
1650
  },
1651
  {
1652
- "name": "xai/grok-code-fast-1",
1653
  "type": "vision",
1654
  "input_price_per_1m": 0.2,
1655
- "output_price_per_1m": 1.5,
1656
  "currency": "USD",
1657
  "capabilities": [
1658
  "vision"
1659
  ],
1660
- "context_window": 256000,
1661
  "hf_private": true
1662
  },
1663
  {
@@ -1673,7 +1677,7 @@
1673
  "hf_private": true
1674
  },
1675
  {
1676
- "name": "xai/grok-4-fast",
1677
  "type": "chat",
1678
  "input_price_per_1m": 0.2,
1679
  "output_price_per_1m": 0.5,
@@ -1687,21 +1691,32 @@
1687
  "hf_private": true
1688
  },
1689
  {
1690
- "name": "xai/grok-4-fast-non-reasoning",
1691
- "type": "chat",
1692
  "input_price_per_1m": 0.2,
1693
- "output_price_per_1m": 0.5,
 
 
 
 
 
 
 
 
 
 
 
 
1694
  "currency": "USD",
1695
- "context_window": 2000000,
1696
  "capabilities": [
1697
  "vision",
1698
- "tools",
1699
  "reasoning"
1700
  ],
 
1701
  "hf_private": true
1702
  },
1703
  {
1704
- "name": "openai-responses/gpt-5.4-nano",
1705
  "type": "vision",
1706
  "input_price_per_1m": 0.2,
1707
  "output_price_per_1m": 1.25,
@@ -1724,12 +1739,12 @@
1724
  "hf_private": false
1725
  },
1726
  {
1727
- "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1728
  "type": "chat",
1729
  "input_price_per_1m": 0.2,
1730
- "output_price_per_1m": 0.6,
1731
  "currency": "USD",
1732
- "context_window": 40000,
1733
  "size_b": 235,
1734
  "capabilities": [
1735
  "tools",
@@ -1739,46 +1754,17 @@
1739
  "hf_private": false
1740
  },
1741
  {
1742
- "name": "deepinfra/zai-org/GLM-4.5-Air",
1743
  "type": "chat",
1744
  "input_price_per_1m": 0.2,
1745
- "output_price_per_1m": 1.1,
1746
- "currency": "USD",
1747
- "context_window": 131072,
1748
- "capabilities": [
1749
- "tools",
1750
- "reasoning"
1751
- ],
1752
- "hf_id": "zai-org/GLM-4.5-Air",
1753
- "size_b": 110.5,
1754
- "hf_private": false
1755
- },
1756
- {
1757
- "name": "alibaba/qwen3-30b-a3b-instruct-2507",
1758
- "type": "vision",
1759
- "input_price_per_1m": 0.2,
1760
- "output_price_per_1m": 0.8,
1761
- "currency": "USD",
1762
- "capabilities": [
1763
- "vision"
1764
- ],
1765
- "context_window": 131072,
1766
- "size_b": 30,
1767
- "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507",
1768
- "hf_private": false
1769
- },
1770
- {
1771
- "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1772
- "type": "chat",
1773
- "input_price_per_1m": 0.23,
1774
- "output_price_per_1m": 0.4,
1775
  "currency": "USD",
1776
- "context_window": 131072,
1777
- "size_b": 72,
1778
  "capabilities": [
1779
- "vision"
 
1780
  ],
1781
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
1782
  "hf_private": false
1783
  },
1784
  {
@@ -1820,15 +1806,29 @@
1820
  "hf_private": false
1821
  },
1822
  {
1823
- "name": "azure/gpt-5-mini",
1824
  "type": "chat",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1825
  "input_price_per_1m": 0.25,
1826
- "output_price_per_1m": 2,
1827
  "currency": "USD",
1828
  "capabilities": [
1829
- "reasoning"
1830
  ],
1831
- "context_window": 200000,
1832
  "hf_private": true
1833
  },
1834
  {
@@ -1867,15 +1867,15 @@
1867
  "hf_private": true
1868
  },
1869
  {
1870
- "name": "vertex/gemini-3.1-flash-lite-preview",
1871
- "type": "vision",
1872
  "input_price_per_1m": 0.25,
1873
- "output_price_per_1m": 1.5,
1874
  "currency": "USD",
1875
  "capabilities": [
1876
- "vision"
1877
  ],
1878
- "context_window": 1048576,
1879
  "hf_private": true
1880
  },
1881
  {
@@ -1892,15 +1892,6 @@
1892
  "size_b": 685.4,
1893
  "hf_private": false
1894
  },
1895
- {
1896
- "name": "deepseek/deepseek-reasoner",
1897
- "type": "chat",
1898
- "input_price_per_1m": 0.28,
1899
- "output_price_per_1m": 0.42,
1900
- "currency": "USD",
1901
- "context_window": 128000,
1902
- "hf_private": true
1903
- },
1904
  {
1905
  "name": "deepseek/deepseek-chat",
1906
  "type": "chat",
@@ -1916,6 +1907,15 @@
1916
  "size_source": "manual",
1917
  "hf_private": false
1918
  },
 
 
 
 
 
 
 
 
 
1919
  {
1920
  "name": "nebius/deepseek-ai/DeepSeek-V3.2",
1921
  "type": "chat",
@@ -1945,50 +1945,67 @@
1945
  "hf_private": false
1946
  },
1947
  {
1948
- "name": "novita/minimax-m2.7",
1949
- "type": "vision",
1950
  "input_price_per_1m": 0.3,
1951
- "output_price_per_1m": 1.2,
1952
  "currency": "USD",
 
1953
  "capabilities": [
1954
- "vision",
1955
  "reasoning"
1956
  ],
1957
- "context_window": 200000,
1958
- "hf_private": false,
1959
- "size_b": 230,
1960
- "size_source": "manual",
1961
- "hf_id": "MiniMaxAI/MiniMax-M2.7"
1962
  },
1963
  {
1964
- "name": "novita/deepseek/deepseek-r1-distill-qwen-32b",
1965
  "type": "chat",
1966
  "input_price_per_1m": 0.3,
1967
- "output_price_per_1m": 0.3,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1968
  "currency": "USD",
1969
- "context_window": 12800,
1970
- "size_b": 32,
1971
  "capabilities": [
 
1972
  "reasoning"
1973
  ],
1974
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
1975
- "hf_private": false
1976
  },
1977
  {
1978
- "name": "novita/MiniMax-M2.7",
1979
  "type": "vision",
1980
  "input_price_per_1m": 0.3,
1981
- "output_price_per_1m": 1.2,
1982
  "currency": "USD",
1983
  "capabilities": [
1984
  "vision",
1985
  "reasoning"
1986
  ],
1987
- "context_window": 200000,
1988
- "hf_private": false,
1989
- "size_b": 230,
1990
- "size_source": "manual",
1991
- "hf_id": "MiniMaxAI/MiniMax-M2.7"
1992
  },
1993
  {
1994
  "name": "minimaxi/MiniMax-M2.7",
@@ -2049,17 +2066,7 @@
2049
  "hf_private": true
2050
  },
2051
  {
2052
- "name": "parasail/parasail-gemma3-27b-it",
2053
- "type": "chat",
2054
- "input_price_per_1m": 0.3,
2055
- "output_price_per_1m": 0.5,
2056
- "currency": "USD",
2057
- "context_window": 128000,
2058
- "size_b": 27,
2059
- "hf_private": false
2060
- },
2061
- {
2062
- "name": "google/gemini-2.5-flash",
2063
  "type": "vision",
2064
  "input_price_per_1m": 0.3,
2065
  "output_price_per_1m": 2.5,
@@ -2072,16 +2079,7 @@
2072
  "hf_private": true
2073
  },
2074
  {
2075
- "name": "mistral/codestral-latest",
2076
- "type": "chat",
2077
- "input_price_per_1m": 0.3,
2078
- "output_price_per_1m": 0.9,
2079
- "currency": "USD",
2080
- "context_window": 131072,
2081
- "hf_private": true
2082
- },
2083
- {
2084
- "name": "vertex/gemini-2.5-flash",
2085
  "type": "vision",
2086
  "input_price_per_1m": 0.3,
2087
  "output_price_per_1m": 2.5,
@@ -2094,16 +2092,12 @@
2094
  "hf_private": true
2095
  },
2096
  {
2097
- "name": "vertex/gemini-2.5-flash-image",
2098
- "type": "vision",
2099
  "input_price_per_1m": 0.3,
2100
- "output_price_per_1m": 2.5,
2101
  "currency": "USD",
2102
- "capabilities": [
2103
- "vision",
2104
- "reasoning"
2105
- ],
2106
- "context_window": 1048576,
2107
  "hf_private": true
2108
  },
2109
  {
@@ -2117,44 +2111,50 @@
2117
  "hf_private": false
2118
  },
2119
  {
2120
- "name": "coding/gemini-2.5-flash",
2121
  "type": "vision",
2122
  "input_price_per_1m": 0.3,
2123
- "output_price_per_1m": 2.5,
2124
  "currency": "USD",
2125
  "capabilities": [
2126
  "vision",
2127
  "reasoning"
2128
  ],
2129
- "context_window": 1048576,
2130
- "hf_private": true
 
 
 
2131
  },
2132
  {
2133
- "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
2134
- "type": "chat",
2135
  "input_price_per_1m": 0.3,
2136
- "output_price_per_1m": 1,
2137
  "currency": "USD",
2138
- "context_window": 163840,
2139
  "capabilities": [
2140
- "tools",
2141
  "reasoning"
2142
  ],
2143
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2144
- "size_b": 671,
2145
- "hf_private": false
 
 
2146
  },
2147
  {
2148
- "name": "alibaba/qwen3-coder-flash",
2149
- "type": "vision",
2150
  "input_price_per_1m": 0.3,
2151
- "output_price_per_1m": 1.5,
2152
  "currency": "USD",
 
 
2153
  "capabilities": [
2154
- "vision"
2155
  ],
2156
- "context_window": 1048576,
2157
- "hf_private": true
2158
  },
2159
  {
2160
  "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct",
@@ -2194,18 +2194,6 @@
2194
  "hf_private": false,
2195
  "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
2196
  },
2197
- {
2198
- "name": "openai/gpt-4.1-mini",
2199
- "type": "vision",
2200
- "input_price_per_1m": 0.4,
2201
- "output_price_per_1m": 1.6,
2202
- "currency": "USD",
2203
- "capabilities": [
2204
- "vision"
2205
- ],
2206
- "context_window": 1047576,
2207
- "hf_private": true
2208
- },
2209
  {
2210
  "name": "nebius/zai-org/GLM-4.7",
2211
  "type": "chat",
@@ -2235,51 +2223,47 @@
2235
  "hf_private": false
2236
  },
2237
  {
2238
- "name": "novita/deepseek/deepseek-v3-turbo",
2239
  "type": "chat",
2240
  "input_price_per_1m": 0.4,
2241
- "output_price_per_1m": 1.3,
2242
  "currency": "USD",
2243
- "context_window": 128000,
2244
- "hf_private": true
 
 
 
 
 
2245
  },
2246
  {
2247
- "name": "novita/deepseek/deepseek-v3-0324",
2248
  "type": "chat",
2249
  "input_price_per_1m": 0.4,
2250
- "output_price_per_1m": 1.3,
2251
  "currency": "USD",
2252
- "context_window": 128000,
2253
  "capabilities": [
2254
- "tools",
2255
- "reasoning"
2256
  ],
2257
- "size_b": 685,
2258
- "hf_id": "deepseek-ai/DeepSeek-V3-0324",
2259
- "hf_private": false
2260
  },
2261
  {
2262
- "name": "azure/gpt-4.1-mini",
2263
- "type": "vision",
2264
  "input_price_per_1m": 0.4,
2265
- "output_price_per_1m": 1.6,
2266
  "currency": "USD",
2267
- "capabilities": [
2268
- "vision"
2269
- ],
2270
- "context_window": 1047576,
2271
  "hf_private": true
2272
  },
2273
  {
2274
- "name": "azure/openai-responses/gpt-4.1-mini",
2275
- "type": "vision",
2276
  "input_price_per_1m": 0.4,
2277
- "output_price_per_1m": 1.6,
2278
  "currency": "USD",
2279
- "capabilities": [
2280
- "vision"
2281
- ],
2282
- "context_window": 1047576,
2283
  "hf_private": true
2284
  },
2285
  {
@@ -2295,25 +2279,19 @@
2295
  "hf_private": true
2296
  },
2297
  {
2298
- "name": "mistral/devstral-latest",
2299
- "type": "chat",
2300
- "input_price_per_1m": 0.4,
2301
- "output_price_per_1m": 2,
2302
- "currency": "USD",
2303
- "context_window": 256000,
2304
- "hf_private": true
2305
- },
2306
- {
2307
- "name": "mistral/mistral-medium-latest",
2308
- "type": "chat",
2309
  "input_price_per_1m": 0.4,
2310
- "output_price_per_1m": 2,
2311
  "currency": "USD",
2312
- "context_window": 131072,
 
 
 
2313
  "hf_private": true
2314
  },
2315
  {
2316
- "name": "openai-responses/gpt-4.1-mini",
2317
  "type": "vision",
2318
  "input_price_per_1m": 0.4,
2319
  "output_price_per_1m": 1.6,
@@ -2325,44 +2303,52 @@
2325
  "hf_private": true
2326
  },
2327
  {
2328
- "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2329
  "type": "chat",
2330
  "input_price_per_1m": 0.4,
2331
- "output_price_per_1m": 1.6,
2332
  "currency": "USD",
2333
- "context_window": 262144,
2334
- "size_b": 480,
 
 
 
 
 
 
 
 
2335
  "capabilities": [
2336
- "tools"
 
2337
  ],
2338
- "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
 
2339
  "hf_private": false
2340
  },
2341
  {
2342
- "name": "alibaba/qwen-plus",
2343
- "type": "chat",
2344
  "input_price_per_1m": 0.4,
2345
- "output_price_per_1m": 1.2,
2346
  "currency": "USD",
2347
- "context_window": 131072,
2348
  "capabilities": [
2349
- "tools"
2350
  ],
 
2351
  "hf_private": true
2352
  },
2353
  {
2354
- "name": "nebius/moonshotai/Kimi-K2-Instruct",
2355
- "type": "chat",
2356
- "input_price_per_1m": 0.5,
2357
- "output_price_per_1m": 2.4,
2358
  "currency": "USD",
2359
- "context_window": 131000,
2360
  "capabilities": [
2361
- "tools"
2362
  ],
2363
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2364
- "size_b": 1026.5,
2365
- "hf_private": false
2366
  },
2367
  {
2368
  "name": "nebius/moonshotai/kimi-k2.5",
@@ -2395,7 +2381,21 @@
2395
  "hf_private": false
2396
  },
2397
  {
2398
- "name": "google/gemini-3.1-flash-image-preview",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2399
  "type": "vision",
2400
  "input_price_per_1m": 0.5,
2401
  "output_price_per_1m": 2,
@@ -2408,7 +2408,7 @@
2408
  "hf_private": true
2409
  },
2410
  {
2411
- "name": "google/gemini-3-flash-preview",
2412
  "type": "vision",
2413
  "input_price_per_1m": 0.5,
2414
  "output_price_per_1m": 3,
@@ -2421,19 +2421,20 @@
2421
  "hf_private": true
2422
  },
2423
  {
2424
- "name": "mistral/mistral-large-latest",
2425
- "type": "chat",
2426
  "input_price_per_1m": 0.5,
2427
- "output_price_per_1m": 1.5,
2428
  "currency": "USD",
2429
- "context_window": 131072,
2430
  "capabilities": [
2431
- "tools"
 
2432
  ],
 
2433
  "hf_private": true
2434
  },
2435
  {
2436
- "name": "vertex/gemini-3-flash-preview",
2437
  "type": "vision",
2438
  "input_price_per_1m": 0.5,
2439
  "output_price_per_1m": 3,
@@ -2446,16 +2447,15 @@
2446
  "hf_private": true
2447
  },
2448
  {
2449
- "name": "vertex/gemini-3.1-flash-image-preview",
2450
- "type": "vision",
2451
  "input_price_per_1m": 0.5,
2452
- "output_price_per_1m": 2,
2453
  "currency": "USD",
 
2454
  "capabilities": [
2455
- "vision",
2456
- "reasoning"
2457
  ],
2458
- "context_window": 131072,
2459
  "hf_private": true
2460
  },
2461
  {
@@ -2529,7 +2529,7 @@
2529
  "hf_private": false
2530
  },
2531
  {
2532
- "name": "novita/zai-org/glm-4.5",
2533
  "type": "chat",
2534
  "input_price_per_1m": 0.6,
2535
  "output_price_per_1m": 2.2,
@@ -2544,22 +2544,22 @@
2544
  "hf_private": false
2545
  },
2546
  {
2547
- "name": "novita/zai-org/glm-4.6",
2548
- "type": "chat",
2549
  "input_price_per_1m": 0.6,
2550
- "output_price_per_1m": 2.2,
2551
  "currency": "USD",
2552
- "context_window": 204800,
2553
  "capabilities": [
2554
- "tools",
2555
  "reasoning"
2556
  ],
2557
- "hf_id": "zai-org/GLM-4.6",
2558
- "size_b": 356.8,
 
2559
  "hf_private": false
2560
  },
2561
  {
2562
- "name": "minimaxi/MiniMax-M2.7-highspeed",
2563
  "type": "vision",
2564
  "input_price_per_1m": 0.6,
2565
  "output_price_per_1m": 2.4,
@@ -2569,12 +2569,12 @@
2569
  "reasoning"
2570
  ],
2571
  "context_window": 200000,
2572
- "hf_private": false,
2573
- "size_b": 230,
2574
- "size_source": "manual"
2575
  },
2576
  {
2577
- "name": "minimaxi/MiniMax-M2.5-highspeed",
2578
  "type": "vision",
2579
  "input_price_per_1m": 0.6,
2580
  "output_price_per_1m": 2.4,
@@ -2584,9 +2584,9 @@
2584
  "reasoning"
2585
  ],
2586
  "context_window": 200000,
2587
- "hf_id": "MiniMaxAI/MiniMax-M2.5",
2588
- "size_b": 228.7,
2589
- "hf_private": false
2590
  },
2591
  {
2592
  "name": "moonshot/kimi-k2-0711-preview",
@@ -2661,7 +2661,22 @@
2661
  "hf_private": false
2662
  },
2663
  {
2664
- "name": "deepinfra/zai-org/GLM-4.5",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2665
  "type": "chat",
2666
  "input_price_per_1m": 0.6,
2667
  "output_price_per_1m": 2.2,
@@ -2717,21 +2732,6 @@
2717
  "size_b": 358.3,
2718
  "hf_private": false
2719
  },
2720
- {
2721
- "name": "alibaba/qwen3.5",
2722
- "type": "vision",
2723
- "input_price_per_1m": 0.6,
2724
- "output_price_per_1m": 3.6,
2725
- "currency": "USD",
2726
- "capabilities": [
2727
- "vision",
2728
- "reasoning"
2729
- ],
2730
- "context_window": 256000,
2731
- "size_b": 9,
2732
- "hf_id": "Qwen/Qwen3.5-9B",
2733
- "hf_private": false
2734
- },
2735
  {
2736
  "name": "novita/microsoft/wizardlm-2-8x22b",
2737
  "type": "chat",
@@ -2757,19 +2757,16 @@
2757
  "hf_private": true
2758
  },
2759
  {
2760
- "name": "novita/deepseek/deepseek-r1-turbo",
2761
- "type": "chat",
2762
  "input_price_per_1m": 0.7,
2763
- "output_price_per_1m": 2.5,
2764
  "currency": "USD",
2765
- "context_window": 64000,
2766
  "capabilities": [
2767
- "tools",
2768
- "reasoning"
2769
  ],
2770
- "hf_id": "deepseek-ai/DeepSeek-R1",
2771
- "size_b": 671,
2772
- "size_source": "manual",
2773
  "hf_private": false
2774
  },
2775
  {
@@ -2783,20 +2780,23 @@
2783
  "hf_private": false
2784
  },
2785
  {
2786
- "name": "parasail/parasail-qwen25-vl-72b-instruct",
2787
- "type": "vision",
2788
  "input_price_per_1m": 0.7,
2789
- "output_price_per_1m": 0.7,
2790
  "currency": "USD",
 
2791
  "capabilities": [
2792
- "vision"
 
2793
  ],
2794
- "context_window": 32768,
2795
- "size_b": 72,
 
2796
  "hf_private": false
2797
  },
2798
  {
2799
- "name": "openai/gpt-5.4-mini",
2800
  "type": "vision",
2801
  "input_price_per_1m": 0.75,
2802
  "output_price_per_1m": 4.5,
@@ -2809,7 +2809,7 @@
2809
  "hf_private": true
2810
  },
2811
  {
2812
- "name": "openai-responses/gpt-5.4-mini",
2813
  "type": "vision",
2814
  "input_price_per_1m": 0.75,
2815
  "output_price_per_1m": 4.5,
@@ -2837,17 +2837,13 @@
2837
  "hf_private": false
2838
  },
2839
  {
2840
- "name": "novita/qwen/qwen2.5-vl-72b-instruct",
2841
  "type": "chat",
2842
  "input_price_per_1m": 0.8,
2843
  "output_price_per_1m": 0.8,
2844
  "currency": "USD",
2845
- "context_window": 96000,
2846
- "size_b": 72,
2847
- "capabilities": [
2848
- "vision"
2849
- ],
2850
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
2851
  "hf_private": false
2852
  },
2853
  {
@@ -2865,44 +2861,48 @@
2865
  "hf_private": false
2866
  },
2867
  {
2868
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct",
2869
  "type": "chat",
2870
  "input_price_per_1m": 0.8,
2871
  "output_price_per_1m": 0.8,
2872
  "currency": "USD",
2873
- "context_window": 130815,
2874
- "size_b": 405,
 
 
 
 
2875
  "hf_private": false
2876
  },
2877
  {
2878
- "name": "deepinfra/deepseek-ai/DeepSeek-V3",
2879
  "type": "chat",
2880
  "input_price_per_1m": 0.85,
2881
- "output_price_per_1m": 0.9,
2882
  "currency": "USD",
2883
- "context_window": 128000,
2884
  "capabilities": [
2885
  "tools",
2886
  "reasoning"
2887
  ],
2888
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2889
  "size_b": 671,
 
2890
  "hf_private": false
2891
  },
2892
  {
2893
- "name": "deepinfra/deepseek-ai/DeepSeek-R1",
2894
  "type": "chat",
2895
  "input_price_per_1m": 0.85,
2896
- "output_price_per_1m": 2.5,
2897
  "currency": "USD",
2898
- "context_window": 64000,
2899
  "capabilities": [
2900
  "tools",
2901
  "reasoning"
2902
  ],
2903
- "hf_id": "deepseek-ai/DeepSeek-R1",
2904
  "size_b": 671,
2905
- "size_source": "manual",
2906
  "hf_private": false
2907
  },
2908
  {
@@ -2965,32 +2965,40 @@
2965
  "hf_private": true
2966
  },
2967
  {
2968
- "name": "groq/moonshotai/kimi-k2-instruct",
2969
- "type": "chat",
 
 
 
 
 
 
 
 
 
 
 
 
2970
  "input_price_per_1m": 1,
2971
- "output_price_per_1m": 3,
2972
  "currency": "USD",
2973
- "context_window": 131072,
2974
  "capabilities": [
2975
- "tools"
2976
  ],
2977
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2978
- "size_b": 1026.5,
2979
- "hf_private": false
2980
  },
2981
  {
2982
- "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
2983
  "type": "chat",
2984
  "input_price_per_1m": 1,
2985
- "output_price_per_1m": 3,
2986
  "currency": "USD",
2987
- "context_window": 256000,
2988
  "capabilities": [
2989
- "tools"
2990
  ],
2991
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2992
- "size_b": 1026.5,
2993
- "hf_private": false
2994
  },
2995
  {
2996
  "name": "openai/o3",
@@ -3020,40 +3028,47 @@
3020
  "hf_private": false
3021
  },
3022
  {
3023
- "name": "perplexity/sonar",
3024
- "type": "chat",
3025
  "input_price_per_1m": 1,
3026
- "output_price_per_1m": 1,
3027
  "currency": "USD",
3028
- "context_window": 131072,
3029
  "capabilities": [
3030
- "vision"
 
3031
  ],
3032
- "hf_private": true
 
 
 
3033
  },
3034
  {
3035
- "name": "anthropic/claude-haiku-4-5",
3036
- "type": "vision",
3037
  "input_price_per_1m": 1,
3038
- "output_price_per_1m": 5,
3039
  "currency": "USD",
 
3040
  "capabilities": [
3041
- "vision"
3042
  ],
3043
- "context_window": 200000,
3044
- "hf_private": true
 
3045
  },
3046
  {
3047
- "name": "vertex/claude-haiku-4-5",
3048
- "type": "vision",
3049
  "input_price_per_1m": 1,
3050
- "output_price_per_1m": 5,
3051
  "currency": "USD",
 
3052
  "capabilities": [
3053
- "vision"
3054
  ],
3055
- "context_window": 200000,
3056
- "hf_private": true
 
3057
  },
3058
  {
3059
  "name": "bedrock/claude-haiku-4-5",
@@ -3068,22 +3083,7 @@
3068
  "hf_private": true
3069
  },
3070
  {
3071
- "name": "zai/GLM-5",
3072
- "type": "vision",
3073
- "input_price_per_1m": 1,
3074
- "output_price_per_1m": 3.2,
3075
- "currency": "USD",
3076
- "capabilities": [
3077
- "vision",
3078
- "reasoning"
3079
- ],
3080
- "context_window": 200000,
3081
- "hf_id": "zai-org/GLM-5",
3082
- "size_b": 753.9,
3083
- "hf_private": false
3084
- },
3085
- {
3086
- "name": "alibaba/qwen3-coder-plus",
3087
  "type": "vision",
3088
  "input_price_per_1m": 1,
3089
  "output_price_per_1m": 5,
@@ -3091,11 +3091,11 @@
3091
  "capabilities": [
3092
  "vision"
3093
  ],
3094
- "context_window": 1048576,
3095
  "hf_private": true
3096
  },
3097
  {
3098
- "name": "openai/o3-mini",
3099
  "type": "chat",
3100
  "input_price_per_1m": 1.1,
3101
  "output_price_per_1m": 4.4,
@@ -3107,7 +3107,7 @@
3107
  "hf_private": true
3108
  },
3109
  {
3110
- "name": "azure/o4-mini",
3111
  "type": "chat",
3112
  "input_price_per_1m": 1.1,
3113
  "output_price_per_1m": 4.4,
@@ -3119,7 +3119,7 @@
3119
  "hf_private": true
3120
  },
3121
  {
3122
- "name": "openai-responses/o3-mini",
3123
  "type": "chat",
3124
  "input_price_per_1m": 1.1,
3125
  "output_price_per_1m": 4.4,
@@ -3131,7 +3131,7 @@
3131
  "hf_private": true
3132
  },
3133
  {
3134
- "name": "openai-responses/o4-mini",
3135
  "type": "chat",
3136
  "input_price_per_1m": 1.1,
3137
  "output_price_per_1m": 4.4,
@@ -3142,16 +3142,6 @@
3142
  "context_window": 200000,
3143
  "hf_private": true
3144
  },
3145
- {
3146
- "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
3147
- "type": "chat",
3148
- "input_price_per_1m": 1.2,
3149
- "output_price_per_1m": 1.2,
3150
- "currency": "USD",
3151
- "context_window": 32768,
3152
- "size_b": 72,
3153
- "hf_private": false
3154
- },
3155
  {
3156
  "name": "moonshot/kimi-k2-turbo-preview",
3157
  "type": "chat",
@@ -3167,20 +3157,17 @@
3167
  "hf_private": false
3168
  },
3169
  {
3170
- "name": "openai/gpt-5.1-chat",
3171
- "type": "vision",
3172
- "input_price_per_1m": 1.25,
3173
- "output_price_per_1m": 10,
3174
  "currency": "USD",
3175
- "capabilities": [
3176
- "vision",
3177
- "reasoning"
3178
- ],
3179
- "context_window": 128000,
3180
- "hf_private": true
3181
  },
3182
  {
3183
- "name": "openai/gpt-5.1",
3184
  "type": "vision",
3185
  "input_price_per_1m": 1.25,
3186
  "output_price_per_1m": 10,
@@ -3189,11 +3176,11 @@
3189
  "vision",
3190
  "reasoning"
3191
  ],
3192
- "context_window": 400000,
3193
  "hf_private": true
3194
  },
3195
  {
3196
- "name": "openai/gpt-5-chat",
3197
  "type": "vision",
3198
  "input_price_per_1m": 1.25,
3199
  "output_price_per_1m": 10,
@@ -3202,35 +3189,37 @@
3202
  "vision",
3203
  "reasoning"
3204
  ],
3205
- "context_window": 128000,
3206
  "hf_private": true
3207
  },
3208
  {
3209
- "name": "azure/gpt-5.1",
3210
- "type": "chat",
3211
  "input_price_per_1m": 1.25,
3212
  "output_price_per_1m": 10,
3213
  "currency": "USD",
3214
  "capabilities": [
 
3215
  "reasoning"
3216
  ],
3217
- "context_window": 200000,
3218
  "hf_private": true
3219
  },
3220
  {
3221
- "name": "azure/gpt-5",
3222
- "type": "chat",
3223
  "input_price_per_1m": 1.25,
3224
  "output_price_per_1m": 10,
3225
  "currency": "USD",
3226
  "capabilities": [
 
3227
  "reasoning"
3228
  ],
3229
- "context_window": 200000,
3230
  "hf_private": true
3231
  },
3232
  {
3233
- "name": "google/gemini-2.5-pro",
3234
  "type": "vision",
3235
  "input_price_per_1m": 1.25,
3236
  "output_price_per_1m": 10,
@@ -3239,11 +3228,11 @@
3239
  "vision",
3240
  "reasoning"
3241
  ],
3242
- "context_window": 1048576,
3243
  "hf_private": true
3244
  },
3245
  {
3246
- "name": "openai-responses/gpt-5.1",
3247
  "type": "vision",
3248
  "input_price_per_1m": 1.25,
3249
  "output_price_per_1m": 10,
@@ -3256,7 +3245,7 @@
3256
  "hf_private": true
3257
  },
3258
  {
3259
- "name": "openai-responses/gpt-5.1-codex",
3260
  "type": "vision",
3261
  "input_price_per_1m": 1.25,
3262
  "output_price_per_1m": 10,
@@ -3269,7 +3258,7 @@
3269
  "hf_private": true
3270
  },
3271
  {
3272
- "name": "openai-responses/gpt-5-codex",
3273
  "type": "vision",
3274
  "input_price_per_1m": 1.25,
3275
  "output_price_per_1m": 10,
@@ -3282,7 +3271,7 @@
3282
  "hf_private": true
3283
  },
3284
  {
3285
- "name": "openai-responses/gpt-5",
3286
  "type": "vision",
3287
  "input_price_per_1m": 1.25,
3288
  "output_price_per_1m": 10,
@@ -3291,11 +3280,11 @@
3291
  "vision",
3292
  "reasoning"
3293
  ],
3294
- "context_window": 400000,
3295
  "hf_private": true
3296
  },
3297
  {
3298
- "name": "vertex/gemini-2.5-pro",
3299
  "type": "vision",
3300
  "input_price_per_1m": 1.25,
3301
  "output_price_per_1m": 10,
@@ -3304,7 +3293,7 @@
3304
  "vision",
3305
  "reasoning"
3306
  ],
3307
- "context_window": 1048576,
3308
  "hf_private": true
3309
  },
3310
  {
@@ -3323,20 +3312,31 @@
3323
  "hf_private": false
3324
  },
3325
  {
3326
- "name": "coding/gemini-2.5-pro",
3327
- "type": "vision",
3328
  "input_price_per_1m": 1.25,
3329
  "output_price_per_1m": 10,
3330
  "currency": "USD",
3331
  "capabilities": [
3332
- "vision",
3333
  "reasoning"
3334
  ],
3335
- "context_window": 1048576,
3336
  "hf_private": true
3337
  },
3338
  {
3339
- "name": "novita/sao10k/l31-70b-euryale-v2.2",
 
 
 
 
 
 
 
 
 
 
 
 
3340
  "type": "chat",
3341
  "input_price_per_1m": 1.48,
3342
  "output_price_per_1m": 1.48,
@@ -3346,7 +3346,7 @@
3346
  "hf_private": false
3347
  },
3348
  {
3349
- "name": "novita/sao10k/l3-70b-euryale-v2.1",
3350
  "type": "chat",
3351
  "input_price_per_1m": 1.48,
3352
  "output_price_per_1m": 1.48,
@@ -3368,7 +3368,7 @@
3368
  "hf_private": true
3369
  },
3370
  {
3371
- "name": "openai/gpt-5.2",
3372
  "type": "vision",
3373
  "input_price_per_1m": 1.75,
3374
  "output_price_per_1m": 14,
@@ -3381,7 +3381,7 @@
3381
  "hf_private": true
3382
  },
3383
  {
3384
- "name": "openai/gpt-5.3-chat",
3385
  "type": "vision",
3386
  "input_price_per_1m": 1.75,
3387
  "output_price_per_1m": 14,
@@ -3390,11 +3390,11 @@
3390
  "vision",
3391
  "reasoning"
3392
  ],
3393
- "context_window": 128000,
3394
  "hf_private": true
3395
  },
3396
  {
3397
- "name": "openai/gpt-5.2-chat",
3398
  "type": "vision",
3399
  "input_price_per_1m": 1.75,
3400
  "output_price_per_1m": 14,
@@ -3403,23 +3403,24 @@
3403
  "vision",
3404
  "reasoning"
3405
  ],
3406
- "context_window": 128000,
3407
  "hf_private": true
3408
  },
3409
  {
3410
- "name": "azure/gpt-5.2",
3411
- "type": "chat",
3412
  "input_price_per_1m": 1.75,
3413
  "output_price_per_1m": 14,
3414
  "currency": "USD",
3415
  "capabilities": [
 
3416
  "reasoning"
3417
  ],
3418
- "context_window": 200000,
3419
  "hf_private": true
3420
  },
3421
  {
3422
- "name": "azure/openai-responses/gpt-5.2-codex",
3423
  "type": "vision",
3424
  "input_price_per_1m": 1.75,
3425
  "output_price_per_1m": 14,
@@ -3428,11 +3429,11 @@
3428
  "vision",
3429
  "reasoning"
3430
  ],
3431
- "context_window": 400000,
3432
  "hf_private": true
3433
  },
3434
  {
3435
- "name": "azure/gpt-5.3-codex",
3436
  "type": "vision",
3437
  "input_price_per_1m": 1.75,
3438
  "output_price_per_1m": 14,
@@ -3441,11 +3442,11 @@
3441
  "vision",
3442
  "reasoning"
3443
  ],
3444
- "context_window": 400000,
3445
  "hf_private": true
3446
  },
3447
  {
3448
- "name": "openai-responses/gpt-5.2-codex",
3449
  "type": "vision",
3450
  "input_price_per_1m": 1.75,
3451
  "output_price_per_1m": 14,
@@ -3458,20 +3459,19 @@
3458
  "hf_private": true
3459
  },
3460
  {
3461
- "name": "openai-responses/gpt-5.3-codex",
3462
- "type": "vision",
3463
  "input_price_per_1m": 1.75,
3464
  "output_price_per_1m": 14,
3465
  "currency": "USD",
3466
  "capabilities": [
3467
- "vision",
3468
  "reasoning"
3469
  ],
3470
- "context_window": 400000,
3471
  "hf_private": true
3472
  },
3473
  {
3474
- "name": "openai-responses/gpt-5.3-chat",
3475
  "type": "vision",
3476
  "input_price_per_1m": 1.75,
3477
  "output_price_per_1m": 14,
@@ -3480,11 +3480,11 @@
3480
  "vision",
3481
  "reasoning"
3482
  ],
3483
- "context_window": 128000,
3484
  "hf_private": true
3485
  },
3486
  {
3487
- "name": "openai-responses/gpt-5.2",
3488
  "type": "vision",
3489
  "input_price_per_1m": 1.75,
3490
  "output_price_per_1m": 14,
@@ -3497,74 +3497,64 @@
3497
  "hf_private": true
3498
  },
3499
  {
3500
- "name": "openai/gpt-4.1",
3501
- "type": "vision",
3502
- "input_price_per_1m": 2,
3503
- "output_price_per_1m": 8,
3504
- "currency": "USD",
3505
- "capabilities": [
3506
- "vision"
3507
- ],
3508
- "context_window": 1047576,
3509
- "hf_private": true
3510
- },
3511
- {
3512
- "name": "openai/o4-mini-deep-research",
3513
- "type": "vision",
3514
  "input_price_per_1m": 2,
3515
- "output_price_per_1m": 8,
3516
  "currency": "USD",
3517
- "capabilities": [
3518
- "vision",
3519
- "reasoning"
3520
- ],
3521
- "context_window": 100000,
3522
  "hf_private": true
3523
  },
3524
  {
3525
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3526
- "type": "chat",
3527
  "input_price_per_1m": 2,
3528
- "output_price_per_1m": 6,
3529
  "currency": "USD",
3530
- "context_window": 128000,
 
 
 
 
3531
  "hf_private": true
3532
  },
3533
  {
3534
- "name": "perplexity/sonar-reasoning-pro",
3535
- "type": "chat",
3536
  "input_price_per_1m": 2,
3537
- "output_price_per_1m": 8,
3538
  "currency": "USD",
3539
- "context_window": 131072,
3540
  "capabilities": [
3541
  "vision",
3542
  "reasoning"
3543
  ],
 
3544
  "hf_private": true
3545
  },
3546
  {
3547
- "name": "azure/gpt-4.1",
3548
  "type": "vision",
3549
  "input_price_per_1m": 2,
3550
- "output_price_per_1m": 8,
3551
  "currency": "USD",
3552
  "capabilities": [
3553
- "vision"
 
3554
  ],
3555
- "context_window": 1047576,
3556
  "hf_private": true
3557
  },
3558
  {
3559
- "name": "azure/openai-responses/gpt-4.1",
3560
- "type": "vision",
3561
  "input_price_per_1m": 2,
3562
  "output_price_per_1m": 8,
3563
  "currency": "USD",
 
3564
  "capabilities": [
3565
- "vision"
 
3566
  ],
3567
- "context_window": 1047576,
3568
  "hf_private": true
3569
  },
3570
  {
@@ -3590,7 +3580,7 @@
3590
  "hf_private": true
3591
  },
3592
  {
3593
- "name": "google/gemini-3-pro-preview",
3594
  "type": "vision",
3595
  "input_price_per_1m": 2,
3596
  "output_price_per_1m": 12,
@@ -3603,7 +3593,7 @@
3603
  "hf_private": true
3604
  },
3605
  {
3606
- "name": "google/gemini-3.1-pro-preview",
3607
  "type": "vision",
3608
  "input_price_per_1m": 2,
3609
  "output_price_per_1m": 12,
@@ -3637,58 +3627,56 @@
3637
  "hf_private": true
3638
  },
3639
  {
3640
- "name": "vertex/gemini-3.1-pro-preview",
3641
  "type": "vision",
3642
  "input_price_per_1m": 2,
3643
- "output_price_per_1m": 12,
3644
  "currency": "USD",
3645
  "capabilities": [
3646
- "vision",
3647
- "reasoning"
3648
  ],
3649
- "context_window": 1048576,
3650
  "hf_private": true
3651
  },
3652
  {
3653
- "name": "vertex/gemini-3-pro-preview",
3654
  "type": "vision",
3655
  "input_price_per_1m": 2,
3656
- "output_price_per_1m": 12,
3657
  "currency": "USD",
3658
  "capabilities": [
3659
  "vision",
3660
  "reasoning"
3661
  ],
3662
- "context_window": 1048576,
3663
  "hf_private": true
3664
  },
3665
  {
3666
- "name": "vertex/gemini-3-pro-image-preview",
3667
  "type": "vision",
3668
  "input_price_per_1m": 2,
3669
- "output_price_per_1m": 12,
3670
  "currency": "USD",
3671
  "capabilities": [
3672
- "vision",
3673
- "reasoning"
3674
  ],
3675
- "context_window": 1048576,
3676
  "hf_private": true
3677
  },
3678
  {
3679
- "name": "openai/gpt-4o-2024-11-20",
3680
  "type": "vision",
3681
- "input_price_per_1m": 2.5,
3682
- "output_price_per_1m": 10,
3683
  "currency": "USD",
3684
  "capabilities": [
3685
  "vision"
3686
  ],
3687
- "context_window": 128000,
3688
  "hf_private": true
3689
  },
3690
  {
3691
- "name": "openai/gpt-5.4",
3692
  "type": "vision",
3693
  "input_price_per_1m": 2.5,
3694
  "output_price_per_1m": 15,
@@ -3701,19 +3689,7 @@
3701
  "hf_private": true
3702
  },
3703
  {
3704
- "name": "openai/gpt-4o-2024-08-06",
3705
- "type": "vision",
3706
- "input_price_per_1m": 2.5,
3707
- "output_price_per_1m": 10,
3708
- "currency": "USD",
3709
- "capabilities": [
3710
- "vision"
3711
- ],
3712
- "context_window": 128000,
3713
- "hf_private": true
3714
- },
3715
- {
3716
- "name": "openai/gpt-4o-2024-05-13",
3717
  "type": "vision",
3718
  "input_price_per_1m": 2.5,
3719
  "output_price_per_1m": 10,
@@ -3737,7 +3713,7 @@
3737
  "hf_private": true
3738
  },
3739
  {
3740
- "name": "azure/openai-responses/gpt-5.4",
3741
  "type": "vision",
3742
  "input_price_per_1m": 2.5,
3743
  "output_price_per_1m": 15,
@@ -3750,44 +3726,44 @@
3750
  "hf_private": true
3751
  },
3752
  {
3753
- "name": "openai-responses/gpt-5.4",
3754
  "type": "vision",
3755
  "input_price_per_1m": 2.5,
3756
- "output_price_per_1m": 15,
3757
  "currency": "USD",
3758
  "capabilities": [
3759
- "vision",
3760
- "reasoning"
3761
  ],
3762
- "context_window": 1050000,
3763
  "hf_private": true
3764
  },
3765
  {
3766
- "name": "perplexity/sonar-pro",
3767
- "type": "chat",
3768
- "input_price_per_1m": 3,
3769
- "output_price_per_1m": 15,
3770
  "currency": "USD",
3771
- "context_window": 204800,
3772
  "capabilities": [
3773
  "vision"
3774
  ],
 
3775
  "hf_private": true
3776
  },
3777
  {
3778
- "name": "xai/grok-4",
3779
  "type": "vision",
3780
- "input_price_per_1m": 3,
3781
  "output_price_per_1m": 15,
3782
  "currency": "USD",
3783
  "capabilities": [
3784
- "vision"
 
3785
  ],
3786
- "context_window": 256000,
3787
  "hf_private": true
3788
  },
3789
  {
3790
- "name": "anthropic/claude-sonnet-4",
3791
  "type": "vision",
3792
  "input_price_per_1m": 3,
3793
  "output_price_per_1m": 15,
@@ -3796,11 +3772,11 @@
3796
  "vision",
3797
  "reasoning"
3798
  ],
3799
- "context_window": 1000000,
3800
  "hf_private": true
3801
  },
3802
  {
3803
- "name": "anthropic/claude-sonnet-4-6",
3804
  "type": "vision",
3805
  "input_price_per_1m": 3,
3806
  "output_price_per_1m": 15,
@@ -3809,11 +3785,11 @@
3809
  "vision",
3810
  "reasoning"
3811
  ],
3812
- "context_window": 1000000,
3813
  "hf_private": true
3814
  },
3815
  {
3816
- "name": "anthropic/claude-sonnet-4-5",
3817
  "type": "vision",
3818
  "input_price_per_1m": 3,
3819
  "output_price_per_1m": 15,
@@ -3822,7 +3798,7 @@
3822
  "vision",
3823
  "reasoning"
3824
  ],
3825
- "context_window": 1000000,
3826
  "hf_private": true
3827
  },
3828
  {
@@ -3838,33 +3814,31 @@
3838
  "hf_private": true
3839
  },
3840
  {
3841
- "name": "vertex/claude-sonnet-4",
3842
- "type": "vision",
3843
  "input_price_per_1m": 3,
3844
  "output_price_per_1m": 15,
3845
  "currency": "USD",
 
3846
  "capabilities": [
3847
- "vision",
3848
- "reasoning"
3849
  ],
3850
- "context_window": 200000,
3851
  "hf_private": true
3852
  },
3853
  {
3854
- "name": "vertex/claude-3-7-sonnet",
3855
  "type": "vision",
3856
  "input_price_per_1m": 3,
3857
  "output_price_per_1m": 15,
3858
  "currency": "USD",
3859
  "capabilities": [
3860
- "vision",
3861
- "reasoning"
3862
  ],
3863
- "context_window": 200000,
3864
  "hf_private": true
3865
  },
3866
  {
3867
- "name": "vertex/claude-sonnet-4-5",
3868
  "type": "vision",
3869
  "input_price_per_1m": 3,
3870
  "output_price_per_1m": 15,
@@ -3893,7 +3867,7 @@
3893
  "hf_private": false
3894
  },
3895
  {
3896
- "name": "bedrock/claude-sonnet-4-6",
3897
  "type": "vision",
3898
  "input_price_per_1m": 3,
3899
  "output_price_per_1m": 15,
@@ -3902,11 +3876,11 @@
3902
  "vision",
3903
  "reasoning"
3904
  ],
3905
- "context_window": 1000000,
3906
  "hf_private": true
3907
  },
3908
  {
3909
- "name": "bedrock/claude-3-7-sonnet",
3910
  "type": "vision",
3911
  "input_price_per_1m": 3,
3912
  "output_price_per_1m": 15,
@@ -3932,7 +3906,7 @@
3932
  "hf_private": true
3933
  },
3934
  {
3935
- "name": "bedrock/claude-sonnet-4",
3936
  "type": "vision",
3937
  "input_price_per_1m": 3,
3938
  "output_price_per_1m": 15,
@@ -3941,11 +3915,11 @@
3941
  "vision",
3942
  "reasoning"
3943
  ],
3944
- "context_window": 200000,
3945
  "hf_private": true
3946
  },
3947
  {
3948
- "name": "coding/claude-sonnet-4-20250514",
3949
  "type": "vision",
3950
  "input_price_per_1m": 3,
3951
  "output_price_per_1m": 15,
@@ -3954,7 +3928,33 @@
3954
  "vision",
3955
  "reasoning"
3956
  ],
3957
- "context_window": 200000,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3958
  "hf_private": true
3959
  },
3960
  {
@@ -3974,57 +3974,57 @@
3974
  "hf_private": false
3975
  },
3976
  {
3977
- "name": "openai/chatgpt-4o",
3978
  "type": "vision",
3979
  "input_price_per_1m": 5,
3980
- "output_price_per_1m": 15,
3981
  "currency": "USD",
3982
  "capabilities": [
3983
- "vision"
 
3984
  ],
3985
- "context_window": 128000,
3986
  "hf_private": true
3987
  },
3988
  {
3989
- "name": "xai/grok-3",
3990
- "type": "chat",
3991
  "input_price_per_1m": 5,
3992
  "output_price_per_1m": 25,
3993
  "currency": "USD",
3994
- "context_window": 131072,
3995
  "capabilities": [
3996
- "tools"
 
3997
  ],
 
3998
  "hf_private": true
3999
  },
4000
  {
4001
- "name": "anthropic/claude-opus-4-5",
4002
- "type": "vision",
4003
  "input_price_per_1m": 5,
4004
  "output_price_per_1m": 25,
4005
  "currency": "USD",
 
4006
  "capabilities": [
4007
- "vision",
4008
- "reasoning"
4009
  ],
4010
- "context_window": 200000,
4011
  "hf_private": true
4012
  },
4013
  {
4014
- "name": "anthropic/claude-opus-4-6",
4015
  "type": "vision",
4016
  "input_price_per_1m": 5,
4017
- "output_price_per_1m": 25,
4018
  "currency": "USD",
4019
  "capabilities": [
4020
- "vision",
4021
- "reasoning"
4022
  ],
4023
- "context_window": 1000000,
4024
  "hf_private": true
4025
  },
4026
  {
4027
- "name": "vertex/claude-opus-4-5",
4028
  "type": "vision",
4029
  "input_price_per_1m": 5,
4030
  "output_price_per_1m": 25,
@@ -4037,7 +4037,7 @@
4037
  "hf_private": true
4038
  },
4039
  {
4040
- "name": "vertex/claude-opus-4-6",
4041
  "type": "vision",
4042
  "input_price_per_1m": 5,
4043
  "output_price_per_1m": 25,
@@ -4050,7 +4050,7 @@
4050
  "hf_private": true
4051
  },
4052
  {
4053
- "name": "bedrock/claude-opus-4-6",
4054
  "type": "vision",
4055
  "input_price_per_1m": 5,
4056
  "output_price_per_1m": 25,
@@ -4063,7 +4063,7 @@
4063
  "hf_private": true
4064
  },
4065
  {
4066
- "name": "bedrock/claude-opus-4-5",
4067
  "type": "vision",
4068
  "input_price_per_1m": 5,
4069
  "output_price_per_1m": 25,
@@ -4089,10 +4089,10 @@
4089
  "hf_private": true
4090
  },
4091
  {
4092
- "name": "openai/o1",
4093
  "type": "vision",
4094
  "input_price_per_1m": 15,
4095
- "output_price_per_1m": 60,
4096
  "currency": "USD",
4097
  "capabilities": [
4098
  "vision",
@@ -4102,7 +4102,7 @@
4102
  "hf_private": true
4103
  },
4104
  {
4105
- "name": "anthropic/claude-opus-4",
4106
  "type": "vision",
4107
  "input_price_per_1m": 15,
4108
  "output_price_per_1m": 75,
@@ -4115,7 +4115,7 @@
4115
  "hf_private": true
4116
  },
4117
  {
4118
- "name": "anthropic/claude-opus-4-1",
4119
  "type": "vision",
4120
  "input_price_per_1m": 15,
4121
  "output_price_per_1m": 75,
@@ -4141,10 +4141,10 @@
4141
  "hf_private": true
4142
  },
4143
  {
4144
- "name": "vertex/claude-opus-4",
4145
  "type": "vision",
4146
  "input_price_per_1m": 15,
4147
- "output_price_per_1m": 75,
4148
  "currency": "USD",
4149
  "capabilities": [
4150
  "vision",
@@ -4154,7 +4154,7 @@
4154
  "hf_private": true
4155
  },
4156
  {
4157
- "name": "vertex/claude-opus-4-1",
4158
  "type": "vision",
4159
  "input_price_per_1m": 15,
4160
  "output_price_per_1m": 75,
@@ -4167,7 +4167,7 @@
4167
  "hf_private": true
4168
  },
4169
  {
4170
- "name": "bedrock/claude-opus-4",
4171
  "type": "vision",
4172
  "input_price_per_1m": 15,
4173
  "output_price_per_1m": 75,
@@ -4180,7 +4180,7 @@
4180
  "hf_private": true
4181
  },
4182
  {
4183
- "name": "coding/claude-opus-4-20250514",
4184
  "type": "vision",
4185
  "input_price_per_1m": 15,
4186
  "output_price_per_1m": 75,
@@ -4206,7 +4206,7 @@
4206
  "hf_private": true
4207
  },
4208
  {
4209
- "name": "openai/gpt-5.4-pro",
4210
  "type": "vision",
4211
  "input_price_per_1m": 30,
4212
  "output_price_per_1m": 180,
@@ -4219,7 +4219,7 @@
4219
  "hf_private": true
4220
  },
4221
  {
4222
- "name": "azure/openai-responses/gpt-5.4-pro",
4223
  "type": "vision",
4224
  "input_price_per_1m": 30,
4225
  "output_price_per_1m": 180,
@@ -4232,7 +4232,7 @@
4232
  "hf_private": true
4233
  },
4234
  {
4235
- "name": "openai-responses/gpt-5.4-pro",
4236
  "type": "vision",
4237
  "input_price_per_1m": 30,
4238
  "output_price_per_1m": 180,
 
1088
  "gdpr_compliant": true,
1089
  "eu_endpoints": true,
1090
  "models": [
1091
+ {
1092
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
1093
+ "type": "chat",
1094
+ "input_price_per_1m": 0.02,
1095
+ "output_price_per_1m": 0.05,
1096
+ "currency": "USD",
1097
+ "context_window": 131072,
1098
+ "size_b": 8,
1099
+ "hf_private": false
1100
+ },
1101
  {
1102
  "name": "novita/meta-llama/llama-3.2-1b-instruct",
1103
  "type": "chat",
 
1109
  "hf_private": false,
1110
  "hf_id": "meta-llama/Llama-3.2-1B-Instruct"
1111
  },
 
 
 
 
 
 
 
 
 
 
1112
  {
1113
  "name": "openai/gpt-5-nano",
1114
  "type": "vision",
 
1148
  "hf_id": "meta-llama/Meta-Llama-3-8B-Instruct"
1149
  },
1150
  {
1151
+ "name": "alibaba/qwen-turbo",
1152
  "type": "chat",
1153
  "input_price_per_1m": 0.05,
1154
+ "output_price_per_1m": 0.2,
1155
  "currency": "USD",
1156
+ "context_window": 1000000,
1157
+ "capabilities": [
1158
+ "tools"
1159
+ ],
1160
+ "hf_private": true
1161
  },
1162
  {
1163
+ "name": "openai-responses/gpt-5-nano",
1164
+ "type": "vision",
1165
  "input_price_per_1m": 0.05,
1166
+ "output_price_per_1m": 0.4,
1167
  "currency": "USD",
 
 
1168
  "capabilities": [
1169
+ "vision",
1170
+ "reasoning"
1171
  ],
1172
+ "context_window": 400000,
1173
+ "hf_private": true
1174
  },
1175
  {
1176
+ "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1177
  "type": "chat",
1178
  "input_price_per_1m": 0.05,
1179
  "output_price_per_1m": 0.05,
 
1183
  "hf_private": false
1184
  },
1185
  {
1186
+ "name": "novita/sao10k/l3-8b-lunaris",
1187
  "type": "chat",
1188
  "input_price_per_1m": 0.05,
1189
+ "output_price_per_1m": 0.05,
1190
  "currency": "USD",
1191
+ "context_window": 8192,
1192
+ "size_b": 8,
1193
+ "hf_private": false
 
 
1194
  },
1195
  {
1196
+ "name": "novita/meta-llama/llama-3.1-8b-instruct",
1197
+ "type": "chat",
1198
  "input_price_per_1m": 0.05,
1199
+ "output_price_per_1m": 0.05,
1200
  "currency": "USD",
1201
+ "context_window": 16384,
1202
+ "size_b": 8,
1203
  "capabilities": [
1204
+ "tools"
 
1205
  ],
1206
+ "hf_private": false,
1207
+ "hf_id": "meta-llama/Meta-Llama-3.1-8B-Instruct"
1208
  },
1209
  {
1210
+ "name": "azure/gpt-5-nano",
1211
  "type": "chat",
1212
  "input_price_per_1m": 0.05,
1213
+ "output_price_per_1m": 0.4,
1214
  "currency": "USD",
 
1215
  "capabilities": [
1216
+ "reasoning"
1217
  ],
1218
+ "context_window": 200000,
1219
  "hf_private": true
1220
  },
1221
  {
 
1262
  "hf_private": false
1263
  },
1264
  {
1265
+ "name": "deepinfra/Qwen/Qwen3-32B",
1266
  "type": "chat",
1267
  "input_price_per_1m": 0.1,
1268
+ "output_price_per_1m": 0.3,
1269
  "currency": "USD",
1270
+ "context_window": 40000,
1271
+ "size_b": 32,
1272
  "capabilities": [
1273
  "tools",
1274
  "reasoning"
1275
  ],
1276
+ "hf_id": "Qwen/Qwen3-32B",
1277
  "hf_private": false
1278
  },
1279
  {
1280
+ "name": "vertex/gemini-2.5-flash-lite",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1281
  "type": "vision",
1282
  "input_price_per_1m": 0.1,
1283
  "output_price_per_1m": 0.4,
1284
  "currency": "USD",
1285
  "capabilities": [
1286
+ "vision",
1287
+ "reasoning"
1288
  ],
1289
+ "context_window": 1048576,
1290
  "hf_private": true
1291
  },
1292
  {
 
1315
  "hf_private": true
1316
  },
1317
  {
1318
+ "name": "mistral/devstral-small-2507",
 
 
 
 
 
 
 
 
 
1319
  "type": "chat",
1320
  "input_price_per_1m": 0.1,
1321
  "output_price_per_1m": 0.3,
 
1329
  "hf_private": false
1330
  },
1331
  {
1332
+ "name": "mistral/devstral-small-latest",
1333
  "type": "chat",
1334
  "input_price_per_1m": 0.1,
1335
  "output_price_per_1m": 0.3,
 
1342
  "size_b": 24,
1343
  "hf_private": false
1344
  },
1345
+ {
1346
+ "name": "mistral/mistral-small-2503",
1347
+ "type": "chat",
1348
+ "input_price_per_1m": 0.1,
1349
+ "output_price_per_1m": 0.3,
1350
+ "currency": "USD",
1351
+ "context_window": 32768,
1352
+ "hf_private": true
1353
+ },
1354
  {
1355
  "name": "openai-responses/gpt-4.1-nano",
1356
  "type": "vision",
 
1364
  "hf_private": true
1365
  },
1366
  {
1367
+ "name": "openai/gpt-4.1-nano",
1368
  "type": "vision",
1369
  "input_price_per_1m": 0.1,
1370
  "output_price_per_1m": 0.4,
1371
  "currency": "USD",
1372
  "capabilities": [
1373
+ "vision"
 
1374
  ],
1375
+ "context_window": 1047576,
1376
  "hf_private": true
1377
  },
1378
  {
 
1386
  "hf_private": false
1387
  },
1388
  {
1389
+ "name": "groq/openai/gpt-oss-20b",
1390
  "type": "chat",
1391
  "input_price_per_1m": 0.1,
1392
+ "output_price_per_1m": 0.5,
1393
  "currency": "USD",
1394
+ "context_window": 131072,
1395
+ "size_b": 20,
1396
  "capabilities": [
1397
  "tools",
1398
  "reasoning"
1399
  ],
1400
+ "hf_id": "openai/gpt-oss-20b",
1401
  "hf_private": false
1402
  },
1403
+ {
1404
+ "name": "azure/openai-responses/gpt-4.1-nano",
1405
+ "type": "vision",
1406
+ "input_price_per_1m": 0.1,
1407
+ "output_price_per_1m": 0.4,
1408
+ "currency": "USD",
1409
+ "capabilities": [
1410
+ "vision"
1411
+ ],
1412
+ "context_window": 1047576,
1413
+ "hf_private": true
1414
+ },
1415
+ {
1416
+ "name": "azure/gpt-4.1-nano",
1417
+ "type": "vision",
1418
+ "input_price_per_1m": 0.1,
1419
+ "output_price_per_1m": 0.4,
1420
+ "currency": "USD",
1421
+ "capabilities": [
1422
+ "vision"
1423
+ ],
1424
+ "context_window": 1047576,
1425
+ "hf_private": true
1426
+ },
1427
  {
1428
  "name": "deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo",
1429
  "type": "chat",
 
1476
  "hf_private": false
1477
  },
1478
  {
1479
+ "name": "nebius/openai/gpt-oss-120b",
1480
  "type": "chat",
1481
  "input_price_per_1m": 0.15,
1482
+ "output_price_per_1m": 0.6,
1483
  "currency": "USD",
 
 
1484
  "capabilities": [
 
1485
  "reasoning"
1486
  ],
1487
+ "context_window": 131000,
1488
+ "size_b": 120,
1489
  "hf_id": "openai/gpt-oss-120b",
1490
  "hf_private": false
1491
  },
1492
  {
1493
+ "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1494
+ "type": "chat",
1495
+ "input_price_per_1m": 0.15,
1496
+ "output_price_per_1m": 0.85,
1497
+ "currency": "USD",
1498
+ "context_window": 262144,
1499
+ "size_b": 235,
1500
+ "hf_private": false
1501
+ },
1502
+ {
1503
+ "name": "mistral/mistral-small-latest",
1504
  "type": "vision",
1505
  "input_price_per_1m": 0.15,
1506
  "output_price_per_1m": 0.6,
1507
  "currency": "USD",
1508
  "capabilities": [
1509
+ "vision",
1510
+ "reasoning"
1511
  ],
1512
+ "context_window": 256000,
1513
  "hf_private": true
1514
  },
1515
  {
1516
+ "name": "mistral/mistral-small-2603",
1517
+ "type": "vision",
1518
  "input_price_per_1m": 0.15,
1519
  "output_price_per_1m": 0.6,
1520
  "currency": "USD",
1521
  "capabilities": [
1522
+ "vision",
1523
  "reasoning"
1524
  ],
1525
+ "context_window": 256000,
1526
+ "size_b": 119,
1527
+ "hf_id": "mistralai/Mistral-Small-4-119B-2603",
1528
  "hf_private": false
1529
  },
1530
+ {
1531
+ "name": "openai/gpt-4o-mini",
1532
+ "type": "vision",
1533
+ "input_price_per_1m": 0.15,
1534
+ "output_price_per_1m": 0.6,
1535
+ "currency": "USD",
1536
+ "capabilities": [
1537
+ "vision"
1538
+ ],
1539
+ "context_window": 128000,
1540
+ "hf_private": true
1541
+ },
1542
  {
1543
  "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
1544
  "type": "chat",
 
1556
  "hf_private": false
1557
  },
1558
  {
1559
+ "name": "groq/openai/gpt-oss-120b",
1560
  "type": "chat",
1561
  "input_price_per_1m": 0.15,
1562
+ "output_price_per_1m": 0.75,
 
 
 
 
 
 
 
 
 
 
1563
  "currency": "USD",
1564
+ "context_window": 131072,
1565
+ "size_b": 120,
1566
  "capabilities": [
1567
+ "tools",
1568
  "reasoning"
1569
  ],
1570
+ "hf_id": "openai/gpt-oss-120b",
 
 
1571
  "hf_private": false
1572
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
1573
  {
1574
  "name": "novita/mistralai/mistral-nemo",
1575
  "type": "chat",
 
1595
  "hf_private": false
1596
  },
1597
  {
1598
+ "name": "deepinfra/zai-org/GLM-4.5-Air",
1599
+ "type": "chat",
1600
  "input_price_per_1m": 0.2,
1601
+ "output_price_per_1m": 1.1,
1602
  "currency": "USD",
1603
+ "context_window": 131072,
1604
  "capabilities": [
1605
+ "tools",
1606
  "reasoning"
1607
  ],
1608
+ "hf_id": "zai-org/GLM-4.5-Air",
1609
+ "size_b": 110.5,
1610
+ "hf_private": false
1611
  },
1612
  {
1613
+ "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1614
  "type": "chat",
1615
  "input_price_per_1m": 0.2,
1616
+ "output_price_per_1m": 0.6,
1617
  "currency": "USD",
1618
+ "context_window": 40000,
1619
+ "size_b": 235,
1620
  "capabilities": [
1621
+ "tools",
1622
+ "reasoning"
1623
  ],
1624
+ "hf_id": "Qwen/Qwen3-235B-A22B",
1625
  "hf_private": false
1626
  },
1627
  {
1628
+ "name": "alibaba/qwen3-30b-a3b-instruct-2507",
1629
+ "type": "vision",
1630
  "input_price_per_1m": 0.2,
1631
  "output_price_per_1m": 0.8,
1632
  "currency": "USD",
 
 
1633
  "capabilities": [
1634
+ "vision"
 
1635
  ],
1636
+ "context_window": 131072,
1637
+ "size_b": 30,
1638
+ "hf_id": "Qwen/Qwen3-30B-A3B-Instruct-2507",
1639
  "hf_private": false
1640
  },
1641
  {
1642
+ "name": "xai/grok-4-fast",
1643
+ "type": "chat",
1644
  "input_price_per_1m": 0.2,
1645
  "output_price_per_1m": 0.5,
1646
  "currency": "USD",
1647
+ "context_window": 2000000,
1648
  "capabilities": [
1649
+ "vision",
1650
+ "tools",
1651
+ "reasoning"
1652
  ],
 
1653
  "hf_private": true
1654
  },
1655
  {
1656
+ "name": "xai/grok-4-1-fast-non-reasoning",
1657
  "type": "vision",
1658
  "input_price_per_1m": 0.2,
1659
+ "output_price_per_1m": 0.5,
1660
  "currency": "USD",
1661
  "capabilities": [
1662
  "vision"
1663
  ],
1664
+ "context_window": 2000000,
1665
  "hf_private": true
1666
  },
1667
  {
 
1677
  "hf_private": true
1678
  },
1679
  {
1680
+ "name": "xai/grok-4-fast-non-reasoning",
1681
  "type": "chat",
1682
  "input_price_per_1m": 0.2,
1683
  "output_price_per_1m": 0.5,
 
1691
  "hf_private": true
1692
  },
1693
  {
1694
+ "name": "xai/grok-code-fast-1",
1695
+ "type": "vision",
1696
  "input_price_per_1m": 0.2,
1697
+ "output_price_per_1m": 1.5,
1698
+ "currency": "USD",
1699
+ "capabilities": [
1700
+ "vision"
1701
+ ],
1702
+ "context_window": 256000,
1703
+ "hf_private": true
1704
+ },
1705
+ {
1706
+ "name": "openai-responses/gpt-5.4-nano",
1707
+ "type": "vision",
1708
+ "input_price_per_1m": 0.2,
1709
+ "output_price_per_1m": 1.25,
1710
  "currency": "USD",
 
1711
  "capabilities": [
1712
  "vision",
 
1713
  "reasoning"
1714
  ],
1715
+ "context_window": 400000,
1716
  "hf_private": true
1717
  },
1718
  {
1719
+ "name": "openai/gpt-5.4-nano",
1720
  "type": "vision",
1721
  "input_price_per_1m": 0.2,
1722
  "output_price_per_1m": 1.25,
 
1739
  "hf_private": false
1740
  },
1741
  {
1742
+ "name": "novita/qwen/qwen3-235b-a22b-fp8",
1743
  "type": "chat",
1744
  "input_price_per_1m": 0.2,
1745
+ "output_price_per_1m": 0.8,
1746
  "currency": "USD",
1747
+ "context_window": 128000,
1748
  "size_b": 235,
1749
  "capabilities": [
1750
  "tools",
 
1754
  "hf_private": false
1755
  },
1756
  {
1757
+ "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1758
  "type": "chat",
1759
  "input_price_per_1m": 0.2,
1760
+ "output_price_per_1m": 0.85,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1761
  "currency": "USD",
1762
+ "context_window": 1048576,
1763
+ "size_b": 17,
1764
  "capabilities": [
1765
+ "vision",
1766
+ "tools"
1767
  ],
 
1768
  "hf_private": false
1769
  },
1770
  {
 
1806
  "hf_private": false
1807
  },
1808
  {
1809
+ "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1810
  "type": "chat",
1811
+ "input_price_per_1m": 0.23,
1812
+ "output_price_per_1m": 0.4,
1813
+ "currency": "USD",
1814
+ "context_window": 131072,
1815
+ "size_b": 72,
1816
+ "capabilities": [
1817
+ "vision"
1818
+ ],
1819
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
1820
+ "hf_private": false
1821
+ },
1822
+ {
1823
+ "name": "vertex/gemini-3.1-flash-lite-preview",
1824
+ "type": "vision",
1825
  "input_price_per_1m": 0.25,
1826
+ "output_price_per_1m": 1.5,
1827
  "currency": "USD",
1828
  "capabilities": [
1829
+ "vision"
1830
  ],
1831
+ "context_window": 1048576,
1832
  "hf_private": true
1833
  },
1834
  {
 
1867
  "hf_private": true
1868
  },
1869
  {
1870
+ "name": "azure/gpt-5-mini",
1871
+ "type": "chat",
1872
  "input_price_per_1m": 0.25,
1873
+ "output_price_per_1m": 2,
1874
  "currency": "USD",
1875
  "capabilities": [
1876
+ "reasoning"
1877
  ],
1878
+ "context_window": 200000,
1879
  "hf_private": true
1880
  },
1881
  {
 
1892
  "size_b": 685.4,
1893
  "hf_private": false
1894
  },
 
 
 
 
 
 
 
 
 
1895
  {
1896
  "name": "deepseek/deepseek-chat",
1897
  "type": "chat",
 
1907
  "size_source": "manual",
1908
  "hf_private": false
1909
  },
1910
+ {
1911
+ "name": "deepseek/deepseek-reasoner",
1912
+ "type": "chat",
1913
+ "input_price_per_1m": 0.28,
1914
+ "output_price_per_1m": 0.42,
1915
+ "currency": "USD",
1916
+ "context_window": 128000,
1917
+ "hf_private": true
1918
+ },
1919
  {
1920
  "name": "nebius/deepseek-ai/DeepSeek-V3.2",
1921
  "type": "chat",
 
1945
  "hf_private": false
1946
  },
1947
  {
1948
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
1949
+ "type": "chat",
1950
  "input_price_per_1m": 0.3,
1951
+ "output_price_per_1m": 1,
1952
  "currency": "USD",
1953
+ "context_window": 163840,
1954
  "capabilities": [
1955
+ "tools",
1956
  "reasoning"
1957
  ],
1958
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
1959
+ "size_b": 671,
1960
+ "hf_private": false
 
 
1961
  },
1962
  {
1963
+ "name": "parasail/parasail-gemma3-27b-it",
1964
  "type": "chat",
1965
  "input_price_per_1m": 0.3,
1966
+ "output_price_per_1m": 0.5,
1967
+ "currency": "USD",
1968
+ "context_window": 128000,
1969
+ "size_b": 27,
1970
+ "hf_private": false
1971
+ },
1972
+ {
1973
+ "name": "alibaba/qwen3-coder-flash",
1974
+ "type": "vision",
1975
+ "input_price_per_1m": 0.3,
1976
+ "output_price_per_1m": 1.5,
1977
+ "currency": "USD",
1978
+ "capabilities": [
1979
+ "vision"
1980
+ ],
1981
+ "context_window": 1048576,
1982
+ "hf_private": true
1983
+ },
1984
+ {
1985
+ "name": "vertex/gemini-2.5-flash",
1986
+ "type": "vision",
1987
+ "input_price_per_1m": 0.3,
1988
+ "output_price_per_1m": 2.5,
1989
  "currency": "USD",
 
 
1990
  "capabilities": [
1991
+ "vision",
1992
  "reasoning"
1993
  ],
1994
+ "context_window": 1048576,
1995
+ "hf_private": true
1996
  },
1997
  {
1998
+ "name": "vertex/gemini-2.5-flash-image",
1999
  "type": "vision",
2000
  "input_price_per_1m": 0.3,
2001
+ "output_price_per_1m": 2.5,
2002
  "currency": "USD",
2003
  "capabilities": [
2004
  "vision",
2005
  "reasoning"
2006
  ],
2007
+ "context_window": 1048576,
2008
+ "hf_private": true
 
 
 
2009
  },
2010
  {
2011
  "name": "minimaxi/MiniMax-M2.7",
 
2066
  "hf_private": true
2067
  },
2068
  {
2069
+ "name": "coding/gemini-2.5-flash",
 
 
 
 
 
 
 
 
 
 
2070
  "type": "vision",
2071
  "input_price_per_1m": 0.3,
2072
  "output_price_per_1m": 2.5,
 
2079
  "hf_private": true
2080
  },
2081
  {
2082
+ "name": "google/gemini-2.5-flash",
 
 
 
 
 
 
 
 
 
2083
  "type": "vision",
2084
  "input_price_per_1m": 0.3,
2085
  "output_price_per_1m": 2.5,
 
2092
  "hf_private": true
2093
  },
2094
  {
2095
+ "name": "mistral/codestral-latest",
2096
+ "type": "chat",
2097
  "input_price_per_1m": 0.3,
2098
+ "output_price_per_1m": 0.9,
2099
  "currency": "USD",
2100
+ "context_window": 131072,
 
 
 
 
2101
  "hf_private": true
2102
  },
2103
  {
 
2111
  "hf_private": false
2112
  },
2113
  {
2114
+ "name": "novita/MiniMax-M2.7",
2115
  "type": "vision",
2116
  "input_price_per_1m": 0.3,
2117
+ "output_price_per_1m": 1.2,
2118
  "currency": "USD",
2119
  "capabilities": [
2120
  "vision",
2121
  "reasoning"
2122
  ],
2123
+ "context_window": 200000,
2124
+ "hf_private": false,
2125
+ "size_b": 230,
2126
+ "size_source": "manual",
2127
+ "hf_id": "MiniMaxAI/MiniMax-M2.7"
2128
  },
2129
  {
2130
+ "name": "novita/minimax-m2.7",
2131
+ "type": "vision",
2132
  "input_price_per_1m": 0.3,
2133
+ "output_price_per_1m": 1.2,
2134
  "currency": "USD",
 
2135
  "capabilities": [
2136
+ "vision",
2137
  "reasoning"
2138
  ],
2139
+ "context_window": 200000,
2140
+ "hf_private": false,
2141
+ "size_b": 230,
2142
+ "size_source": "manual",
2143
+ "hf_id": "MiniMaxAI/MiniMax-M2.7"
2144
  },
2145
  {
2146
+ "name": "novita/deepseek/deepseek-r1-distill-qwen-32b",
2147
+ "type": "chat",
2148
  "input_price_per_1m": 0.3,
2149
+ "output_price_per_1m": 0.3,
2150
  "currency": "USD",
2151
+ "context_window": 12800,
2152
+ "size_b": 32,
2153
  "capabilities": [
2154
+ "reasoning"
2155
  ],
2156
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
2157
+ "hf_private": false
2158
  },
2159
  {
2160
  "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct",
 
2194
  "hf_private": false,
2195
  "hf_id": "meta-llama/Llama-3.3-70B-Instruct"
2196
  },
 
 
 
 
 
 
 
 
 
 
 
 
2197
  {
2198
  "name": "nebius/zai-org/GLM-4.7",
2199
  "type": "chat",
 
2223
  "hf_private": false
2224
  },
2225
  {
2226
+ "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2227
  "type": "chat",
2228
  "input_price_per_1m": 0.4,
2229
+ "output_price_per_1m": 1.6,
2230
  "currency": "USD",
2231
+ "context_window": 262144,
2232
+ "size_b": 480,
2233
+ "capabilities": [
2234
+ "tools"
2235
+ ],
2236
+ "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
2237
+ "hf_private": false
2238
  },
2239
  {
2240
+ "name": "alibaba/qwen-plus",
2241
  "type": "chat",
2242
  "input_price_per_1m": 0.4,
2243
+ "output_price_per_1m": 1.2,
2244
  "currency": "USD",
2245
+ "context_window": 131072,
2246
  "capabilities": [
2247
+ "tools"
 
2248
  ],
2249
+ "hf_private": true
 
 
2250
  },
2251
  {
2252
+ "name": "mistral/devstral-latest",
2253
+ "type": "chat",
2254
  "input_price_per_1m": 0.4,
2255
+ "output_price_per_1m": 2,
2256
  "currency": "USD",
2257
+ "context_window": 256000,
 
 
 
2258
  "hf_private": true
2259
  },
2260
  {
2261
+ "name": "mistral/mistral-medium-latest",
2262
+ "type": "chat",
2263
  "input_price_per_1m": 0.4,
2264
+ "output_price_per_1m": 2,
2265
  "currency": "USD",
2266
+ "context_window": 131072,
 
 
 
2267
  "hf_private": true
2268
  },
2269
  {
 
2279
  "hf_private": true
2280
  },
2281
  {
2282
+ "name": "openai-responses/gpt-4.1-mini",
2283
+ "type": "vision",
 
 
 
 
 
 
 
 
 
2284
  "input_price_per_1m": 0.4,
2285
+ "output_price_per_1m": 1.6,
2286
  "currency": "USD",
2287
+ "capabilities": [
2288
+ "vision"
2289
+ ],
2290
+ "context_window": 1047576,
2291
  "hf_private": true
2292
  },
2293
  {
2294
+ "name": "openai/gpt-4.1-mini",
2295
  "type": "vision",
2296
  "input_price_per_1m": 0.4,
2297
  "output_price_per_1m": 1.6,
 
2303
  "hf_private": true
2304
  },
2305
  {
2306
+ "name": "novita/deepseek/deepseek-v3-turbo",
2307
  "type": "chat",
2308
  "input_price_per_1m": 0.4,
2309
+ "output_price_per_1m": 1.3,
2310
  "currency": "USD",
2311
+ "context_window": 128000,
2312
+ "hf_private": true
2313
+ },
2314
+ {
2315
+ "name": "novita/deepseek/deepseek-v3-0324",
2316
+ "type": "chat",
2317
+ "input_price_per_1m": 0.4,
2318
+ "output_price_per_1m": 1.3,
2319
+ "currency": "USD",
2320
+ "context_window": 128000,
2321
  "capabilities": [
2322
+ "tools",
2323
+ "reasoning"
2324
  ],
2325
+ "size_b": 685,
2326
+ "hf_id": "deepseek-ai/DeepSeek-V3-0324",
2327
  "hf_private": false
2328
  },
2329
  {
2330
+ "name": "azure/gpt-4.1-mini",
2331
+ "type": "vision",
2332
  "input_price_per_1m": 0.4,
2333
+ "output_price_per_1m": 1.6,
2334
  "currency": "USD",
 
2335
  "capabilities": [
2336
+ "vision"
2337
  ],
2338
+ "context_window": 1047576,
2339
  "hf_private": true
2340
  },
2341
  {
2342
+ "name": "azure/openai-responses/gpt-4.1-mini",
2343
+ "type": "vision",
2344
+ "input_price_per_1m": 0.4,
2345
+ "output_price_per_1m": 1.6,
2346
  "currency": "USD",
 
2347
  "capabilities": [
2348
+ "vision"
2349
  ],
2350
+ "context_window": 1047576,
2351
+ "hf_private": true
 
2352
  },
2353
  {
2354
  "name": "nebius/moonshotai/kimi-k2.5",
 
2381
  "hf_private": false
2382
  },
2383
  {
2384
+ "name": "nebius/moonshotai/Kimi-K2-Instruct",
2385
+ "type": "chat",
2386
+ "input_price_per_1m": 0.5,
2387
+ "output_price_per_1m": 2.4,
2388
+ "currency": "USD",
2389
+ "context_window": 131000,
2390
+ "capabilities": [
2391
+ "tools"
2392
+ ],
2393
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2394
+ "size_b": 1026.5,
2395
+ "hf_private": false
2396
+ },
2397
+ {
2398
+ "name": "vertex/gemini-3.1-flash-image-preview",
2399
  "type": "vision",
2400
  "input_price_per_1m": 0.5,
2401
  "output_price_per_1m": 2,
 
2408
  "hf_private": true
2409
  },
2410
  {
2411
+ "name": "vertex/gemini-3-flash-preview",
2412
  "type": "vision",
2413
  "input_price_per_1m": 0.5,
2414
  "output_price_per_1m": 3,
 
2421
  "hf_private": true
2422
  },
2423
  {
2424
+ "name": "google/gemini-3.1-flash-image-preview",
2425
+ "type": "vision",
2426
  "input_price_per_1m": 0.5,
2427
+ "output_price_per_1m": 2,
2428
  "currency": "USD",
 
2429
  "capabilities": [
2430
+ "vision",
2431
+ "reasoning"
2432
  ],
2433
+ "context_window": 131072,
2434
  "hf_private": true
2435
  },
2436
  {
2437
+ "name": "google/gemini-3-flash-preview",
2438
  "type": "vision",
2439
  "input_price_per_1m": 0.5,
2440
  "output_price_per_1m": 3,
 
2447
  "hf_private": true
2448
  },
2449
  {
2450
+ "name": "mistral/mistral-large-latest",
2451
+ "type": "chat",
2452
  "input_price_per_1m": 0.5,
2453
+ "output_price_per_1m": 1.5,
2454
  "currency": "USD",
2455
+ "context_window": 131072,
2456
  "capabilities": [
2457
+ "tools"
 
2458
  ],
 
2459
  "hf_private": true
2460
  },
2461
  {
 
2529
  "hf_private": false
2530
  },
2531
  {
2532
+ "name": "deepinfra/zai-org/GLM-4.5",
2533
  "type": "chat",
2534
  "input_price_per_1m": 0.6,
2535
  "output_price_per_1m": 2.2,
 
2544
  "hf_private": false
2545
  },
2546
  {
2547
+ "name": "alibaba/qwen3.5",
2548
+ "type": "vision",
2549
  "input_price_per_1m": 0.6,
2550
+ "output_price_per_1m": 3.6,
2551
  "currency": "USD",
 
2552
  "capabilities": [
2553
+ "vision",
2554
  "reasoning"
2555
  ],
2556
+ "context_window": 256000,
2557
+ "size_b": 9,
2558
+ "hf_id": "Qwen/Qwen3.5-9B",
2559
  "hf_private": false
2560
  },
2561
  {
2562
+ "name": "minimaxi/MiniMax-M2.5-highspeed",
2563
  "type": "vision",
2564
  "input_price_per_1m": 0.6,
2565
  "output_price_per_1m": 2.4,
 
2569
  "reasoning"
2570
  ],
2571
  "context_window": 200000,
2572
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2573
+ "size_b": 228.7,
2574
+ "hf_private": false
2575
  },
2576
  {
2577
+ "name": "minimaxi/MiniMax-M2.7-highspeed",
2578
  "type": "vision",
2579
  "input_price_per_1m": 0.6,
2580
  "output_price_per_1m": 2.4,
 
2584
  "reasoning"
2585
  ],
2586
  "context_window": 200000,
2587
+ "hf_private": false,
2588
+ "size_b": 230,
2589
+ "size_source": "manual"
2590
  },
2591
  {
2592
  "name": "moonshot/kimi-k2-0711-preview",
 
2661
  "hf_private": false
2662
  },
2663
  {
2664
+ "name": "novita/zai-org/glm-4.6",
2665
+ "type": "chat",
2666
+ "input_price_per_1m": 0.6,
2667
+ "output_price_per_1m": 2.2,
2668
+ "currency": "USD",
2669
+ "context_window": 204800,
2670
+ "capabilities": [
2671
+ "tools",
2672
+ "reasoning"
2673
+ ],
2674
+ "hf_id": "zai-org/GLM-4.6",
2675
+ "size_b": 356.8,
2676
+ "hf_private": false
2677
+ },
2678
+ {
2679
+ "name": "novita/zai-org/glm-4.5",
2680
  "type": "chat",
2681
  "input_price_per_1m": 0.6,
2682
  "output_price_per_1m": 2.2,
 
2732
  "size_b": 358.3,
2733
  "hf_private": false
2734
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2735
  {
2736
  "name": "novita/microsoft/wizardlm-2-8x22b",
2737
  "type": "chat",
 
2757
  "hf_private": true
2758
  },
2759
  {
2760
+ "name": "parasail/parasail-qwen25-vl-72b-instruct",
2761
+ "type": "vision",
2762
  "input_price_per_1m": 0.7,
2763
+ "output_price_per_1m": 0.7,
2764
  "currency": "USD",
 
2765
  "capabilities": [
2766
+ "vision"
 
2767
  ],
2768
+ "context_window": 32768,
2769
+ "size_b": 72,
 
2770
  "hf_private": false
2771
  },
2772
  {
 
2780
  "hf_private": false
2781
  },
2782
  {
2783
+ "name": "novita/deepseek/deepseek-r1-turbo",
2784
+ "type": "chat",
2785
  "input_price_per_1m": 0.7,
2786
+ "output_price_per_1m": 2.5,
2787
  "currency": "USD",
2788
+ "context_window": 64000,
2789
  "capabilities": [
2790
+ "tools",
2791
+ "reasoning"
2792
  ],
2793
+ "hf_id": "deepseek-ai/DeepSeek-R1",
2794
+ "size_b": 671,
2795
+ "size_source": "manual",
2796
  "hf_private": false
2797
  },
2798
  {
2799
+ "name": "openai-responses/gpt-5.4-mini",
2800
  "type": "vision",
2801
  "input_price_per_1m": 0.75,
2802
  "output_price_per_1m": 4.5,
 
2809
  "hf_private": true
2810
  },
2811
  {
2812
+ "name": "openai/gpt-5.4-mini",
2813
  "type": "vision",
2814
  "input_price_per_1m": 0.75,
2815
  "output_price_per_1m": 4.5,
 
2837
  "hf_private": false
2838
  },
2839
  {
2840
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct",
2841
  "type": "chat",
2842
  "input_price_per_1m": 0.8,
2843
  "output_price_per_1m": 0.8,
2844
  "currency": "USD",
2845
+ "context_window": 130815,
2846
+ "size_b": 405,
 
 
 
 
2847
  "hf_private": false
2848
  },
2849
  {
 
2861
  "hf_private": false
2862
  },
2863
  {
2864
+ "name": "novita/qwen/qwen2.5-vl-72b-instruct",
2865
  "type": "chat",
2866
  "input_price_per_1m": 0.8,
2867
  "output_price_per_1m": 0.8,
2868
  "currency": "USD",
2869
+ "context_window": 96000,
2870
+ "size_b": 72,
2871
+ "capabilities": [
2872
+ "vision"
2873
+ ],
2874
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
2875
  "hf_private": false
2876
  },
2877
  {
2878
+ "name": "deepinfra/deepseek-ai/DeepSeek-R1",
2879
  "type": "chat",
2880
  "input_price_per_1m": 0.85,
2881
+ "output_price_per_1m": 2.5,
2882
  "currency": "USD",
2883
+ "context_window": 64000,
2884
  "capabilities": [
2885
  "tools",
2886
  "reasoning"
2887
  ],
2888
+ "hf_id": "deepseek-ai/DeepSeek-R1",
2889
  "size_b": 671,
2890
+ "size_source": "manual",
2891
  "hf_private": false
2892
  },
2893
  {
2894
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3",
2895
  "type": "chat",
2896
  "input_price_per_1m": 0.85,
2897
+ "output_price_per_1m": 0.9,
2898
  "currency": "USD",
2899
+ "context_window": 128000,
2900
  "capabilities": [
2901
  "tools",
2902
  "reasoning"
2903
  ],
2904
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2905
  "size_b": 671,
 
2906
  "hf_private": false
2907
  },
2908
  {
 
2965
  "hf_private": true
2966
  },
2967
  {
2968
+ "name": "alibaba/qwen3-coder-plus",
2969
+ "type": "vision",
2970
+ "input_price_per_1m": 1,
2971
+ "output_price_per_1m": 5,
2972
+ "currency": "USD",
2973
+ "capabilities": [
2974
+ "vision"
2975
+ ],
2976
+ "context_window": 1048576,
2977
+ "hf_private": true
2978
+ },
2979
+ {
2980
+ "name": "vertex/claude-haiku-4-5",
2981
+ "type": "vision",
2982
  "input_price_per_1m": 1,
2983
+ "output_price_per_1m": 5,
2984
  "currency": "USD",
 
2985
  "capabilities": [
2986
+ "vision"
2987
  ],
2988
+ "context_window": 200000,
2989
+ "hf_private": true
 
2990
  },
2991
  {
2992
+ "name": "perplexity/sonar",
2993
  "type": "chat",
2994
  "input_price_per_1m": 1,
2995
+ "output_price_per_1m": 1,
2996
  "currency": "USD",
2997
+ "context_window": 131072,
2998
  "capabilities": [
2999
+ "vision"
3000
  ],
3001
+ "hf_private": true
 
 
3002
  },
3003
  {
3004
  "name": "openai/o3",
 
3028
  "hf_private": false
3029
  },
3030
  {
3031
+ "name": "zai/GLM-5",
3032
+ "type": "vision",
3033
  "input_price_per_1m": 1,
3034
+ "output_price_per_1m": 3.2,
3035
  "currency": "USD",
 
3036
  "capabilities": [
3037
+ "vision",
3038
+ "reasoning"
3039
  ],
3040
+ "context_window": 200000,
3041
+ "hf_id": "zai-org/GLM-5",
3042
+ "size_b": 753.9,
3043
+ "hf_private": false
3044
  },
3045
  {
3046
+ "name": "groq/moonshotai/kimi-k2-instruct",
3047
+ "type": "chat",
3048
  "input_price_per_1m": 1,
3049
+ "output_price_per_1m": 3,
3050
  "currency": "USD",
3051
+ "context_window": 131072,
3052
  "capabilities": [
3053
+ "tools"
3054
  ],
3055
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
3056
+ "size_b": 1026.5,
3057
+ "hf_private": false
3058
  },
3059
  {
3060
+ "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
3061
+ "type": "chat",
3062
  "input_price_per_1m": 1,
3063
+ "output_price_per_1m": 3,
3064
  "currency": "USD",
3065
+ "context_window": 256000,
3066
  "capabilities": [
3067
+ "tools"
3068
  ],
3069
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
3070
+ "size_b": 1026.5,
3071
+ "hf_private": false
3072
  },
3073
  {
3074
  "name": "bedrock/claude-haiku-4-5",
 
3083
  "hf_private": true
3084
  },
3085
  {
3086
+ "name": "anthropic/claude-haiku-4-5",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3087
  "type": "vision",
3088
  "input_price_per_1m": 1,
3089
  "output_price_per_1m": 5,
 
3091
  "capabilities": [
3092
  "vision"
3093
  ],
3094
+ "context_window": 200000,
3095
  "hf_private": true
3096
  },
3097
  {
3098
+ "name": "openai-responses/o3-mini",
3099
  "type": "chat",
3100
  "input_price_per_1m": 1.1,
3101
  "output_price_per_1m": 4.4,
 
3107
  "hf_private": true
3108
  },
3109
  {
3110
+ "name": "openai-responses/o4-mini",
3111
  "type": "chat",
3112
  "input_price_per_1m": 1.1,
3113
  "output_price_per_1m": 4.4,
 
3119
  "hf_private": true
3120
  },
3121
  {
3122
+ "name": "openai/o3-mini",
3123
  "type": "chat",
3124
  "input_price_per_1m": 1.1,
3125
  "output_price_per_1m": 4.4,
 
3131
  "hf_private": true
3132
  },
3133
  {
3134
+ "name": "azure/o4-mini",
3135
  "type": "chat",
3136
  "input_price_per_1m": 1.1,
3137
  "output_price_per_1m": 4.4,
 
3142
  "context_window": 200000,
3143
  "hf_private": true
3144
  },
 
 
 
 
 
 
 
 
 
 
3145
  {
3146
  "name": "moonshot/kimi-k2-turbo-preview",
3147
  "type": "chat",
 
3157
  "hf_private": false
3158
  },
3159
  {
3160
+ "name": "together/Qwen/Qwen2.5-72B-Instruct-Turbo",
3161
+ "type": "chat",
3162
+ "input_price_per_1m": 1.2,
3163
+ "output_price_per_1m": 1.2,
3164
  "currency": "USD",
3165
+ "context_window": 32768,
3166
+ "size_b": 72,
3167
+ "hf_private": false
 
 
 
3168
  },
3169
  {
3170
+ "name": "vertex/gemini-2.5-pro",
3171
  "type": "vision",
3172
  "input_price_per_1m": 1.25,
3173
  "output_price_per_1m": 10,
 
3176
  "vision",
3177
  "reasoning"
3178
  ],
3179
+ "context_window": 1048576,
3180
  "hf_private": true
3181
  },
3182
  {
3183
+ "name": "coding/gemini-2.5-pro",
3184
  "type": "vision",
3185
  "input_price_per_1m": 1.25,
3186
  "output_price_per_1m": 10,
 
3189
  "vision",
3190
  "reasoning"
3191
  ],
3192
+ "context_window": 1048576,
3193
  "hf_private": true
3194
  },
3195
  {
3196
+ "name": "google/gemini-2.5-pro",
3197
+ "type": "vision",
3198
  "input_price_per_1m": 1.25,
3199
  "output_price_per_1m": 10,
3200
  "currency": "USD",
3201
  "capabilities": [
3202
+ "vision",
3203
  "reasoning"
3204
  ],
3205
+ "context_window": 1048576,
3206
  "hf_private": true
3207
  },
3208
  {
3209
+ "name": "openai-responses/gpt-5",
3210
+ "type": "vision",
3211
  "input_price_per_1m": 1.25,
3212
  "output_price_per_1m": 10,
3213
  "currency": "USD",
3214
  "capabilities": [
3215
+ "vision",
3216
  "reasoning"
3217
  ],
3218
+ "context_window": 400000,
3219
  "hf_private": true
3220
  },
3221
  {
3222
+ "name": "openai-responses/gpt-5.1",
3223
  "type": "vision",
3224
  "input_price_per_1m": 1.25,
3225
  "output_price_per_1m": 10,
 
3228
  "vision",
3229
  "reasoning"
3230
  ],
3231
+ "context_window": 400000,
3232
  "hf_private": true
3233
  },
3234
  {
3235
+ "name": "openai-responses/gpt-5.1-codex",
3236
  "type": "vision",
3237
  "input_price_per_1m": 1.25,
3238
  "output_price_per_1m": 10,
 
3245
  "hf_private": true
3246
  },
3247
  {
3248
+ "name": "openai-responses/gpt-5-codex",
3249
  "type": "vision",
3250
  "input_price_per_1m": 1.25,
3251
  "output_price_per_1m": 10,
 
3258
  "hf_private": true
3259
  },
3260
  {
3261
+ "name": "openai/gpt-5.1",
3262
  "type": "vision",
3263
  "input_price_per_1m": 1.25,
3264
  "output_price_per_1m": 10,
 
3271
  "hf_private": true
3272
  },
3273
  {
3274
+ "name": "openai/gpt-5-chat",
3275
  "type": "vision",
3276
  "input_price_per_1m": 1.25,
3277
  "output_price_per_1m": 10,
 
3280
  "vision",
3281
  "reasoning"
3282
  ],
3283
+ "context_window": 128000,
3284
  "hf_private": true
3285
  },
3286
  {
3287
+ "name": "openai/gpt-5.1-chat",
3288
  "type": "vision",
3289
  "input_price_per_1m": 1.25,
3290
  "output_price_per_1m": 10,
 
3293
  "vision",
3294
  "reasoning"
3295
  ],
3296
+ "context_window": 128000,
3297
  "hf_private": true
3298
  },
3299
  {
 
3312
  "hf_private": false
3313
  },
3314
  {
3315
+ "name": "azure/gpt-5",
3316
+ "type": "chat",
3317
  "input_price_per_1m": 1.25,
3318
  "output_price_per_1m": 10,
3319
  "currency": "USD",
3320
  "capabilities": [
 
3321
  "reasoning"
3322
  ],
3323
+ "context_window": 200000,
3324
  "hf_private": true
3325
  },
3326
  {
3327
+ "name": "azure/gpt-5.1",
3328
+ "type": "chat",
3329
+ "input_price_per_1m": 1.25,
3330
+ "output_price_per_1m": 10,
3331
+ "currency": "USD",
3332
+ "capabilities": [
3333
+ "reasoning"
3334
+ ],
3335
+ "context_window": 200000,
3336
+ "hf_private": true
3337
+ },
3338
+ {
3339
+ "name": "novita/sao10k/l3-70b-euryale-v2.1",
3340
  "type": "chat",
3341
  "input_price_per_1m": 1.48,
3342
  "output_price_per_1m": 1.48,
 
3346
  "hf_private": false
3347
  },
3348
  {
3349
+ "name": "novita/sao10k/l31-70b-euryale-v2.2",
3350
  "type": "chat",
3351
  "input_price_per_1m": 1.48,
3352
  "output_price_per_1m": 1.48,
 
3368
  "hf_private": true
3369
  },
3370
  {
3371
+ "name": "openai-responses/gpt-5.2-codex",
3372
  "type": "vision",
3373
  "input_price_per_1m": 1.75,
3374
  "output_price_per_1m": 14,
 
3381
  "hf_private": true
3382
  },
3383
  {
3384
+ "name": "openai-responses/gpt-5.2",
3385
  "type": "vision",
3386
  "input_price_per_1m": 1.75,
3387
  "output_price_per_1m": 14,
 
3390
  "vision",
3391
  "reasoning"
3392
  ],
3393
+ "context_window": 400000,
3394
  "hf_private": true
3395
  },
3396
  {
3397
+ "name": "openai-responses/gpt-5.3-codex",
3398
  "type": "vision",
3399
  "input_price_per_1m": 1.75,
3400
  "output_price_per_1m": 14,
 
3403
  "vision",
3404
  "reasoning"
3405
  ],
3406
+ "context_window": 400000,
3407
  "hf_private": true
3408
  },
3409
  {
3410
+ "name": "openai-responses/gpt-5.3-chat",
3411
+ "type": "vision",
3412
  "input_price_per_1m": 1.75,
3413
  "output_price_per_1m": 14,
3414
  "currency": "USD",
3415
  "capabilities": [
3416
+ "vision",
3417
  "reasoning"
3418
  ],
3419
+ "context_window": 128000,
3420
  "hf_private": true
3421
  },
3422
  {
3423
+ "name": "openai/gpt-5.2-chat",
3424
  "type": "vision",
3425
  "input_price_per_1m": 1.75,
3426
  "output_price_per_1m": 14,
 
3429
  "vision",
3430
  "reasoning"
3431
  ],
3432
+ "context_window": 128000,
3433
  "hf_private": true
3434
  },
3435
  {
3436
+ "name": "openai/gpt-5.3-chat",
3437
  "type": "vision",
3438
  "input_price_per_1m": 1.75,
3439
  "output_price_per_1m": 14,
 
3442
  "vision",
3443
  "reasoning"
3444
  ],
3445
+ "context_window": 128000,
3446
  "hf_private": true
3447
  },
3448
  {
3449
+ "name": "openai/gpt-5.2",
3450
  "type": "vision",
3451
  "input_price_per_1m": 1.75,
3452
  "output_price_per_1m": 14,
 
3459
  "hf_private": true
3460
  },
3461
  {
3462
+ "name": "azure/gpt-5.2",
3463
+ "type": "chat",
3464
  "input_price_per_1m": 1.75,
3465
  "output_price_per_1m": 14,
3466
  "currency": "USD",
3467
  "capabilities": [
 
3468
  "reasoning"
3469
  ],
3470
+ "context_window": 200000,
3471
  "hf_private": true
3472
  },
3473
  {
3474
+ "name": "azure/gpt-5.3-codex",
3475
  "type": "vision",
3476
  "input_price_per_1m": 1.75,
3477
  "output_price_per_1m": 14,
 
3480
  "vision",
3481
  "reasoning"
3482
  ],
3483
+ "context_window": 400000,
3484
  "hf_private": true
3485
  },
3486
  {
3487
+ "name": "azure/openai-responses/gpt-5.2-codex",
3488
  "type": "vision",
3489
  "input_price_per_1m": 1.75,
3490
  "output_price_per_1m": 14,
 
3497
  "hf_private": true
3498
  },
3499
  {
3500
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3501
+ "type": "chat",
 
 
 
 
 
 
 
 
 
 
 
 
3502
  "input_price_per_1m": 2,
3503
+ "output_price_per_1m": 6,
3504
  "currency": "USD",
3505
+ "context_window": 128000,
 
 
 
 
3506
  "hf_private": true
3507
  },
3508
  {
3509
+ "name": "vertex/gemini-3.1-pro-preview",
3510
+ "type": "vision",
3511
  "input_price_per_1m": 2,
3512
+ "output_price_per_1m": 12,
3513
  "currency": "USD",
3514
+ "capabilities": [
3515
+ "vision",
3516
+ "reasoning"
3517
+ ],
3518
+ "context_window": 1048576,
3519
  "hf_private": true
3520
  },
3521
  {
3522
+ "name": "vertex/gemini-3-pro-preview",
3523
+ "type": "vision",
3524
  "input_price_per_1m": 2,
3525
+ "output_price_per_1m": 12,
3526
  "currency": "USD",
 
3527
  "capabilities": [
3528
  "vision",
3529
  "reasoning"
3530
  ],
3531
+ "context_window": 1048576,
3532
  "hf_private": true
3533
  },
3534
  {
3535
+ "name": "vertex/gemini-3-pro-image-preview",
3536
  "type": "vision",
3537
  "input_price_per_1m": 2,
3538
+ "output_price_per_1m": 12,
3539
  "currency": "USD",
3540
  "capabilities": [
3541
+ "vision",
3542
+ "reasoning"
3543
  ],
3544
+ "context_window": 1048576,
3545
  "hf_private": true
3546
  },
3547
  {
3548
+ "name": "perplexity/sonar-reasoning-pro",
3549
+ "type": "chat",
3550
  "input_price_per_1m": 2,
3551
  "output_price_per_1m": 8,
3552
  "currency": "USD",
3553
+ "context_window": 131072,
3554
  "capabilities": [
3555
+ "vision",
3556
+ "reasoning"
3557
  ],
 
3558
  "hf_private": true
3559
  },
3560
  {
 
3580
  "hf_private": true
3581
  },
3582
  {
3583
+ "name": "google/gemini-3.1-pro-preview",
3584
  "type": "vision",
3585
  "input_price_per_1m": 2,
3586
  "output_price_per_1m": 12,
 
3593
  "hf_private": true
3594
  },
3595
  {
3596
+ "name": "google/gemini-3-pro-preview",
3597
  "type": "vision",
3598
  "input_price_per_1m": 2,
3599
  "output_price_per_1m": 12,
 
3627
  "hf_private": true
3628
  },
3629
  {
3630
+ "name": "openai/gpt-4.1",
3631
  "type": "vision",
3632
  "input_price_per_1m": 2,
3633
+ "output_price_per_1m": 8,
3634
  "currency": "USD",
3635
  "capabilities": [
3636
+ "vision"
 
3637
  ],
3638
+ "context_window": 1047576,
3639
  "hf_private": true
3640
  },
3641
  {
3642
+ "name": "openai/o4-mini-deep-research",
3643
  "type": "vision",
3644
  "input_price_per_1m": 2,
3645
+ "output_price_per_1m": 8,
3646
  "currency": "USD",
3647
  "capabilities": [
3648
  "vision",
3649
  "reasoning"
3650
  ],
3651
+ "context_window": 100000,
3652
  "hf_private": true
3653
  },
3654
  {
3655
+ "name": "azure/gpt-4.1",
3656
  "type": "vision",
3657
  "input_price_per_1m": 2,
3658
+ "output_price_per_1m": 8,
3659
  "currency": "USD",
3660
  "capabilities": [
3661
+ "vision"
 
3662
  ],
3663
+ "context_window": 1047576,
3664
  "hf_private": true
3665
  },
3666
  {
3667
+ "name": "azure/openai-responses/gpt-4.1",
3668
  "type": "vision",
3669
+ "input_price_per_1m": 2,
3670
+ "output_price_per_1m": 8,
3671
  "currency": "USD",
3672
  "capabilities": [
3673
  "vision"
3674
  ],
3675
+ "context_window": 1047576,
3676
  "hf_private": true
3677
  },
3678
  {
3679
+ "name": "openai-responses/gpt-5.4",
3680
  "type": "vision",
3681
  "input_price_per_1m": 2.5,
3682
  "output_price_per_1m": 15,
 
3689
  "hf_private": true
3690
  },
3691
  {
3692
+ "name": "openai/gpt-4o-2024-11-20",
 
 
 
 
 
 
 
 
 
 
 
 
3693
  "type": "vision",
3694
  "input_price_per_1m": 2.5,
3695
  "output_price_per_1m": 10,
 
3713
  "hf_private": true
3714
  },
3715
  {
3716
+ "name": "openai/gpt-5.4",
3717
  "type": "vision",
3718
  "input_price_per_1m": 2.5,
3719
  "output_price_per_1m": 15,
 
3726
  "hf_private": true
3727
  },
3728
  {
3729
+ "name": "openai/gpt-4o-2024-05-13",
3730
  "type": "vision",
3731
  "input_price_per_1m": 2.5,
3732
+ "output_price_per_1m": 10,
3733
  "currency": "USD",
3734
  "capabilities": [
3735
+ "vision"
 
3736
  ],
3737
+ "context_window": 128000,
3738
  "hf_private": true
3739
  },
3740
  {
3741
+ "name": "openai/gpt-4o-2024-08-06",
3742
+ "type": "vision",
3743
+ "input_price_per_1m": 2.5,
3744
+ "output_price_per_1m": 10,
3745
  "currency": "USD",
 
3746
  "capabilities": [
3747
  "vision"
3748
  ],
3749
+ "context_window": 128000,
3750
  "hf_private": true
3751
  },
3752
  {
3753
+ "name": "azure/openai-responses/gpt-5.4",
3754
  "type": "vision",
3755
+ "input_price_per_1m": 2.5,
3756
  "output_price_per_1m": 15,
3757
  "currency": "USD",
3758
  "capabilities": [
3759
+ "vision",
3760
+ "reasoning"
3761
  ],
3762
+ "context_window": 1050000,
3763
  "hf_private": true
3764
  },
3765
  {
3766
+ "name": "vertex/claude-sonnet-4-5",
3767
  "type": "vision",
3768
  "input_price_per_1m": 3,
3769
  "output_price_per_1m": 15,
 
3772
  "vision",
3773
  "reasoning"
3774
  ],
3775
+ "context_window": 200000,
3776
  "hf_private": true
3777
  },
3778
  {
3779
+ "name": "vertex/claude-3-7-sonnet",
3780
  "type": "vision",
3781
  "input_price_per_1m": 3,
3782
  "output_price_per_1m": 15,
 
3785
  "vision",
3786
  "reasoning"
3787
  ],
3788
+ "context_window": 200000,
3789
  "hf_private": true
3790
  },
3791
  {
3792
+ "name": "vertex/claude-sonnet-4",
3793
  "type": "vision",
3794
  "input_price_per_1m": 3,
3795
  "output_price_per_1m": 15,
 
3798
  "vision",
3799
  "reasoning"
3800
  ],
3801
+ "context_window": 200000,
3802
  "hf_private": true
3803
  },
3804
  {
 
3814
  "hf_private": true
3815
  },
3816
  {
3817
+ "name": "perplexity/sonar-pro",
3818
+ "type": "chat",
3819
  "input_price_per_1m": 3,
3820
  "output_price_per_1m": 15,
3821
  "currency": "USD",
3822
+ "context_window": 204800,
3823
  "capabilities": [
3824
+ "vision"
 
3825
  ],
 
3826
  "hf_private": true
3827
  },
3828
  {
3829
+ "name": "xai/grok-4",
3830
  "type": "vision",
3831
  "input_price_per_1m": 3,
3832
  "output_price_per_1m": 15,
3833
  "currency": "USD",
3834
  "capabilities": [
3835
+ "vision"
 
3836
  ],
3837
+ "context_window": 256000,
3838
  "hf_private": true
3839
  },
3840
  {
3841
+ "name": "coding/claude-sonnet-4-20250514",
3842
  "type": "vision",
3843
  "input_price_per_1m": 3,
3844
  "output_price_per_1m": 15,
 
3867
  "hf_private": false
3868
  },
3869
  {
3870
+ "name": "bedrock/claude-3-7-sonnet",
3871
  "type": "vision",
3872
  "input_price_per_1m": 3,
3873
  "output_price_per_1m": 15,
 
3876
  "vision",
3877
  "reasoning"
3878
  ],
3879
+ "context_window": 200000,
3880
  "hf_private": true
3881
  },
3882
  {
3883
+ "name": "bedrock/claude-sonnet-4",
3884
  "type": "vision",
3885
  "input_price_per_1m": 3,
3886
  "output_price_per_1m": 15,
 
3906
  "hf_private": true
3907
  },
3908
  {
3909
+ "name": "bedrock/claude-sonnet-4-6",
3910
  "type": "vision",
3911
  "input_price_per_1m": 3,
3912
  "output_price_per_1m": 15,
 
3915
  "vision",
3916
  "reasoning"
3917
  ],
3918
+ "context_window": 1000000,
3919
  "hf_private": true
3920
  },
3921
  {
3922
+ "name": "anthropic/claude-sonnet-4-5",
3923
  "type": "vision",
3924
  "input_price_per_1m": 3,
3925
  "output_price_per_1m": 15,
 
3928
  "vision",
3929
  "reasoning"
3930
  ],
3931
+ "context_window": 1000000,
3932
+ "hf_private": true
3933
+ },
3934
+ {
3935
+ "name": "anthropic/claude-sonnet-4-6",
3936
+ "type": "vision",
3937
+ "input_price_per_1m": 3,
3938
+ "output_price_per_1m": 15,
3939
+ "currency": "USD",
3940
+ "capabilities": [
3941
+ "vision",
3942
+ "reasoning"
3943
+ ],
3944
+ "context_window": 1000000,
3945
+ "hf_private": true
3946
+ },
3947
+ {
3948
+ "name": "anthropic/claude-sonnet-4",
3949
+ "type": "vision",
3950
+ "input_price_per_1m": 3,
3951
+ "output_price_per_1m": 15,
3952
+ "currency": "USD",
3953
+ "capabilities": [
3954
+ "vision",
3955
+ "reasoning"
3956
+ ],
3957
+ "context_window": 1000000,
3958
  "hf_private": true
3959
  },
3960
  {
 
3974
  "hf_private": false
3975
  },
3976
  {
3977
+ "name": "vertex/claude-opus-4-6",
3978
  "type": "vision",
3979
  "input_price_per_1m": 5,
3980
+ "output_price_per_1m": 25,
3981
  "currency": "USD",
3982
  "capabilities": [
3983
+ "vision",
3984
+ "reasoning"
3985
  ],
3986
+ "context_window": 1000000,
3987
  "hf_private": true
3988
  },
3989
  {
3990
+ "name": "vertex/claude-opus-4-5",
3991
+ "type": "vision",
3992
  "input_price_per_1m": 5,
3993
  "output_price_per_1m": 25,
3994
  "currency": "USD",
 
3995
  "capabilities": [
3996
+ "vision",
3997
+ "reasoning"
3998
  ],
3999
+ "context_window": 200000,
4000
  "hf_private": true
4001
  },
4002
  {
4003
+ "name": "xai/grok-3",
4004
+ "type": "chat",
4005
  "input_price_per_1m": 5,
4006
  "output_price_per_1m": 25,
4007
  "currency": "USD",
4008
+ "context_window": 131072,
4009
  "capabilities": [
4010
+ "tools"
 
4011
  ],
 
4012
  "hf_private": true
4013
  },
4014
  {
4015
+ "name": "openai/chatgpt-4o",
4016
  "type": "vision",
4017
  "input_price_per_1m": 5,
4018
+ "output_price_per_1m": 15,
4019
  "currency": "USD",
4020
  "capabilities": [
4021
+ "vision"
 
4022
  ],
4023
+ "context_window": 128000,
4024
  "hf_private": true
4025
  },
4026
  {
4027
+ "name": "bedrock/claude-opus-4-5",
4028
  "type": "vision",
4029
  "input_price_per_1m": 5,
4030
  "output_price_per_1m": 25,
 
4037
  "hf_private": true
4038
  },
4039
  {
4040
+ "name": "bedrock/claude-opus-4-6",
4041
  "type": "vision",
4042
  "input_price_per_1m": 5,
4043
  "output_price_per_1m": 25,
 
4050
  "hf_private": true
4051
  },
4052
  {
4053
+ "name": "anthropic/claude-opus-4-6",
4054
  "type": "vision",
4055
  "input_price_per_1m": 5,
4056
  "output_price_per_1m": 25,
 
4063
  "hf_private": true
4064
  },
4065
  {
4066
+ "name": "anthropic/claude-opus-4-5",
4067
  "type": "vision",
4068
  "input_price_per_1m": 5,
4069
  "output_price_per_1m": 25,
 
4089
  "hf_private": true
4090
  },
4091
  {
4092
+ "name": "vertex/claude-opus-4-1",
4093
  "type": "vision",
4094
  "input_price_per_1m": 15,
4095
+ "output_price_per_1m": 75,
4096
  "currency": "USD",
4097
  "capabilities": [
4098
  "vision",
 
4102
  "hf_private": true
4103
  },
4104
  {
4105
+ "name": "vertex/claude-opus-4",
4106
  "type": "vision",
4107
  "input_price_per_1m": 15,
4108
  "output_price_per_1m": 75,
 
4115
  "hf_private": true
4116
  },
4117
  {
4118
+ "name": "coding/claude-opus-4-20250514",
4119
  "type": "vision",
4120
  "input_price_per_1m": 15,
4121
  "output_price_per_1m": 75,
 
4141
  "hf_private": true
4142
  },
4143
  {
4144
+ "name": "openai/o1",
4145
  "type": "vision",
4146
  "input_price_per_1m": 15,
4147
+ "output_price_per_1m": 60,
4148
  "currency": "USD",
4149
  "capabilities": [
4150
  "vision",
 
4154
  "hf_private": true
4155
  },
4156
  {
4157
+ "name": "bedrock/claude-opus-4",
4158
  "type": "vision",
4159
  "input_price_per_1m": 15,
4160
  "output_price_per_1m": 75,
 
4167
  "hf_private": true
4168
  },
4169
  {
4170
+ "name": "anthropic/claude-opus-4",
4171
  "type": "vision",
4172
  "input_price_per_1m": 15,
4173
  "output_price_per_1m": 75,
 
4180
  "hf_private": true
4181
  },
4182
  {
4183
+ "name": "anthropic/claude-opus-4-1",
4184
  "type": "vision",
4185
  "input_price_per_1m": 15,
4186
  "output_price_per_1m": 75,
 
4206
  "hf_private": true
4207
  },
4208
  {
4209
+ "name": "openai-responses/gpt-5.4-pro",
4210
  "type": "vision",
4211
  "input_price_per_1m": 30,
4212
  "output_price_per_1m": 180,
 
4219
  "hf_private": true
4220
  },
4221
  {
4222
+ "name": "openai/gpt-5.4-pro",
4223
  "type": "vision",
4224
  "input_price_per_1m": 30,
4225
  "output_price_per_1m": 180,
 
4232
  "hf_private": true
4233
  },
4234
  {
4235
+ "name": "azure/openai-responses/gpt-5.4-pro",
4236
  "type": "vision",
4237
  "input_price_per_1m": 30,
4238
  "output_price_per_1m": 180,
scripts/fetch-benchmarks.js CHANGED
@@ -604,6 +604,69 @@ function mergeMTEB(entries, mtebEntries) {
604
  return [...entries, ...newEntries];
605
  }
606
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
607
  // ─── Merge ───────────────────────────────────────────────────────────────────
608
 
609
  function mergeEntries(llmstats, hfEntries) {
@@ -647,10 +710,11 @@ const SOURCE_FIELDS = {
647
  aider: ['aider_model', 'aider_pass_rate'],
648
  aa: ['aa_id', 'aa_intelligence', 'aa_coding', 'aa_math', 'aa_mmlu_pro', 'aa_gpqa', 'aa_livecodebench', 'aa_hle', 'aa_scicode', 'aa_math_500', 'aa_aime', 'aa_tokens_per_s', 'aa_latency_s'],
649
  mteb: ['mteb_avg', 'mteb_retrieval'],
 
650
  };
651
 
652
  const SOURCE_ID_FIELD = {
653
- llmstats: 'slug', hf: 'hf_id', livebench: 'lb_name', arena: 'arena_elo', aider: 'aider_pass_rate', aa: 'aa_intelligence', mteb: 'mteb_avg',
654
  };
655
 
656
  async function refreshSource(source) {
@@ -672,6 +736,7 @@ async function refreshSource(source) {
672
  else if (source === 'aider') result = mergeAider(stripped, await fetchAider());
673
  else if (source === 'aa') result = mergeArtificialAnalysis(stripped, await fetchArtificialAnalysis());
674
  else if (source === 'mteb') result = mergeMTEB(stripped, await fetchMTEB());
 
675
  fs.writeFileSync(OUT_FILE, JSON.stringify(result, null, 2));
676
  }
677
 
@@ -774,10 +839,11 @@ async function main() {
774
  const withAi = mergeAider(withAr, aiderEntries);
775
  const withAA = mergeArtificialAnalysis(withAi, aaEntries);
776
  const withMTEB = mergeMTEB(withAA, mtebEntries);
777
- const all = mergeMTEB(withMTEB, readmeEntries);
 
778
 
779
  console.log(`\nTotal entries: ${all.length}`);
780
- console.log(` With LiveBench: ${all.filter(e => e.lb_name).length} | Arena: ${all.filter(e => e.arena_elo).length} | Aider: ${all.filter(e => e.aider_pass_rate !== undefined).length} | AA: ${all.filter(e => e.aa_intelligence !== undefined).length} | MTEB: ${all.filter(e => e.mteb_avg !== undefined).length}`);
781
 
782
  fs.writeFileSync(OUT_FILE, JSON.stringify(all, null, 2));
783
  console.log(`Saved to data/benchmarks.json (${(fs.statSync(OUT_FILE).size / 1024).toFixed(0)} KB)`);
 
604
  return [...entries, ...newEntries];
605
  }
606
 
607
+ // ─── OCR Benchmarks ────────────────────────────────────────────────────────
608
+
609
/**
 * Attach hand-maintained OCR benchmark averages to the benchmark entries.
 *
 * Each existing entry is looked up by its normalized name, by the model part
 * of its `hf_id`, and by its full `hf_id` (in that order); the first key that
 * hits the score table wins. Matched entries are updated in place with
 * `ocr_avg` and a `sources.ocr_avg = 'manual'` marker. Score rows that no
 * entry matched are appended as fresh entries.
 *
 * @param {Array<Object>} entries - Benchmark entries (mutated in place on match).
 * @returns {Array<Object>} The given entries followed by any newly created ones.
 */
function mergeOCR(entries) {
  // [Hugging Face repo id, OCR average] pairs, curated by hand.
  const scoreTable = [
    ['datalab-to/chandra-ocr-2', 85.9],
    ['rednote-hilab/dots.mocr', 83.9],
    ['lightonai/LightOnOCR-2-1B', 83.2],
    ['datalab-to/chandra', 83.1],
    ['infly/Infinity-Parser-7B', 82.5],
    ['allenai/olmOCR-2-7B-1025-FP8', 82.4],
    ['PaddlePaddle/PaddleOCR-VL', 80.0],
    ['baidu/Qianfan-OCR', 79.8],
    ['rednote-hilab/dots.ocr', 79.1],
    ['deepseek-ai/DeepSeek-OCR-2', 76.3],
    ['lightonai/LightOnOCR-1B-1025', 76.1],
    ['deepseek-ai/DeepSeek-OCR', 75.7],
    ['opendatalab/MinerU2.5-2509-1.2B', 75.2],
    ['zai-org/GLM-OCR', 75.2],
    ['FireRedTeam/FireRed-OCR', 70.2],
    ['nanonets/Nanonets-OCR2-3B', 69.5],
  ];
  const ocrRows = scoreTable.map(([name, score]) => ({ name, score }));

  // Index every row under both its full repo id and its bare model name.
  const lookup = new Map();
  for (const row of ocrRows) {
    lookup.set(normName(row.name), row);
    const shortName = row.name.split('/').pop();
    if (shortName) lookup.set(normName(shortName), row);
  }

  const consumed = new Set();
  let hitCount = 0;
  for (const entry of entries) {
    const repoId = entry.hf_id || '';
    const keys = [
      normName(entry.name || ''),
      normName(repoId.split('/').pop() || ''),
      normName(repoId),
    ];

    // First non-empty key that resolves to a score row decides the match.
    let hit;
    for (const key of keys) {
      if (!key) continue;
      const row = lookup.get(key);
      if (row) {
        hit = row;
        break;
      }
    }
    if (!hit) continue;

    entry.ocr_avg = hit.score;
    entry.sources = { ...(entry.sources || {}), ocr_avg: 'manual' };
    hitCount += 1;
    consumed.add(hit.name);
  }

  // Rows nobody claimed become standalone entries.
  const additions = ocrRows
    .filter(row => !consumed.has(row.name))
    .map(row => ({
      hf_id: row.name,
      name: row.name.split('/').pop(),
      ocr_avg: row.score,
      sources: { ocr_avg: 'manual' },
    }));

  console.log(` OCR: ${hitCount} matched, ${additions.length} new entries`);
  return [...entries, ...additions];
}
669
+
670
  // ─── Merge ───────────────────────────────────────────────────────────────────
671
 
672
  function mergeEntries(llmstats, hfEntries) {
 
710
  aider: ['aider_model', 'aider_pass_rate'],
711
  aa: ['aa_id', 'aa_intelligence', 'aa_coding', 'aa_math', 'aa_mmlu_pro', 'aa_gpqa', 'aa_livecodebench', 'aa_hle', 'aa_scicode', 'aa_math_500', 'aa_aime', 'aa_tokens_per_s', 'aa_latency_s'],
712
  mteb: ['mteb_avg', 'mteb_retrieval'],
713
+ ocr: ['ocr_avg'],
714
  };
715
 
716
  const SOURCE_ID_FIELD = {
717
+ llmstats: 'slug', hf: 'hf_id', livebench: 'lb_name', arena: 'arena_elo', aider: 'aider_pass_rate', aa: 'aa_intelligence', mteb: 'mteb_avg', ocr: 'ocr_avg',
718
  };
719
 
720
  async function refreshSource(source) {
 
736
  else if (source === 'aider') result = mergeAider(stripped, await fetchAider());
737
  else if (source === 'aa') result = mergeArtificialAnalysis(stripped, await fetchArtificialAnalysis());
738
  else if (source === 'mteb') result = mergeMTEB(stripped, await fetchMTEB());
739
+ else if (source === 'ocr') result = mergeOCR(stripped);
740
  fs.writeFileSync(OUT_FILE, JSON.stringify(result, null, 2));
741
  }
742
 
 
839
  const withAi = mergeAider(withAr, aiderEntries);
840
  const withAA = mergeArtificialAnalysis(withAi, aaEntries);
841
  const withMTEB = mergeMTEB(withAA, mtebEntries);
842
+ const withReadme = mergeMTEB(withMTEB, readmeEntries);
843
+ const all = mergeOCR(withReadme);
844
 
845
  console.log(`\nTotal entries: ${all.length}`);
846
+ console.log(` With LiveBench: ${all.filter(e => e.lb_name).length} | Arena: ${all.filter(e => e.arena_elo).length} | Aider: ${all.filter(e => e.aider_pass_rate !== undefined).length} | AA: ${all.filter(e => e.aa_intelligence !== undefined).length} | MTEB: ${all.filter(e => e.mteb_avg !== undefined).length} | OCR: ${all.filter(e => e.ocr_avg !== undefined).length}`);
847
 
848
  fs.writeFileSync(OUT_FILE, JSON.stringify(all, null, 2));
849
  console.log(`Saved to data/benchmarks.json (${(fs.statSync(OUT_FILE).size / 1024).toFixed(0)} KB)`);
scripts/fetch-providers.js CHANGED
@@ -221,6 +221,8 @@ const MANUAL_HF_ID_MAP = {
221
  'bge-multilingual-gemma2': 'BAAI/bge-multilingual-gemma2',
222
  'bge-en-icl': 'BAAI/bge-en-icl',
223
  'wizardlm 2 8x22b': 'alpindale/WizardLM-2-8x22B',
 
 
224
  };
225
 
226
  const MANUAL_OLLAMA_ID_MAP = {
 
221
  'bge-multilingual-gemma2': 'BAAI/bge-multilingual-gemma2',
222
  'bge-en-icl': 'BAAI/bge-en-icl',
223
  'wizardlm 2 8x22b': 'alpindale/WizardLM-2-8x22B',
224
+ 'parasail-kimi-k2-instruct': 'moonshotai/Kimi-K2-Instruct',
225
+ 'grok-2-1212': 'xai-org/grok-2',
226
  };
227
 
228
  const MANUAL_OLLAMA_ID_MAP = {
scripts/validate-hf-ids.js ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 'use strict';
2
+
3
+ const fs = require('fs');
4
+ const path = require('path');
5
+ const { fetchRobust } = require('./fetch-utils');
6
+
7
+ const PROVIDERS_FILE = path.join(__dirname, '..', 'data', 'providers.json');
8
+
9
/**
 * Check whether a Hugging Face repository id still resolves.
 *
 * Issues one HEAD request against `https://huggingface.co/<hfId>` and
 * classifies the outcome:
 *   - any 2xx or 3xx response      -> valid (redirects other than 302 included)
 *   - 408, 429 or 5xx response     -> inconclusive, reported as valid so a
 *                                     throttled or flaky request never marks
 *                                     an id as broken
 *   - any other response           -> invalid
 *   - thrown error mentioning 404  -> invalid
 *   - any other thrown error       -> inconclusive, reported as valid
 *
 * @param {string} hfId - Repository id such as "org/model"; falsy ids are skipped.
 * @returns {Promise<{valid: boolean, status: (number|string)}>} Verdict plus
 *   the HTTP status (or a descriptive label when the check was inconclusive).
 */
async function checkHfId(hfId) {
  if (!hfId) return { valid: true, status: 'N/A' };
  const url = `https://huggingface.co/${hfId}`;
  try {
    const res = await fetchRobust(url, { method: 'HEAD', retries: 1 });
    const { status } = res;
    if (status >= 200 && status < 400) {
      return { valid: true, status };
    }
    // Timeouts, rate limiting and server faults say nothing about whether the
    // repo exists; treat them like network errors instead of a hard failure.
    const isTransient = status === 408 || status === 429 || status >= 500;
    if (isTransient) {
      return { valid: true, status: `${status} (Assume valid)` };
    }
    return { valid: false, status };
  } catch (e) {
    // Tolerate non-Error throwables (strings, null) when inspecting the message.
    const message = String(e?.message ?? e);
    if (message.includes('404')) return { valid: false, status: 404 };
    return { valid: true, status: 'Error (Assume valid)' };
  }
}
23
+
24
/**
 * Validate every `hf_id` referenced in providers.json against Hugging Face.
 *
 * Collects the unique ids together with the provider/model pairs that use
 * them, checks each id one at a time via `checkHfId`, prints a per-id verdict
 * and a summary, and finally strips every id reported invalid from the
 * providers file (rewriting it on disk only when something was removed).
 *
 * @returns {Promise<void>}
 */
async function main() {
  console.log('Starting Hugging Face Repository Validation...\n');

  const data = JSON.parse(fs.readFileSync(PROVIDERS_FILE, 'utf8'));

  // hf_id -> list of "provider: model" labels that reference it.
  const usersById = new Map();
  for (const provider of data.providers) {
    for (const model of provider.models) {
      if (!model.hf_id) continue;
      let users = usersById.get(model.hf_id);
      if (users === undefined) {
        users = [];
        usersById.set(model.hf_id, users);
      }
      users.push(`${provider.name}: ${model.name}`);
    }
  }

  const ids = [...usersById.keys()];
  console.log(`Found ${ids.length} unique HF IDs to validate across all providers.\n`);

  const invalidIds = new Set();
  let validCount = 0;
  let invalidCount = 0;

  for (const [index, id] of ids.entries()) {
    const progress = `[${index + 1}/${ids.length}]`.padEnd(10);
    const check = await checkHfId(id);

    if (!check.valid) {
      invalidCount += 1;
      console.log(`${progress} ✗ INVALID (${check.status}) ${id}`);
      console.log(` Used by: ${usersById.get(id).join(', ')}`);
      invalidIds.add(id);
    } else {
      validCount += 1;
      console.log(`${progress} ✓ VALID (${check.status}) ${id}`);
    }

    // Brief pause between requests to stay clear of rate limiting.
    await new Promise(resolve => setTimeout(resolve, 50));
  }

  const rule = '='.repeat(50);
  console.log('\n' + rule);
  console.log('VALIDATION SUMMARY');
  console.log(rule);
  console.log(`Total Unique IDs: ${ids.length}`);
  console.log(`Valid IDs: ${validCount}`);
  console.log(`Invalid (404s): ${invalidCount}`);
  console.log(rule);

  if (invalidIds.size === 0) {
    console.log('\nSuccess: All checked HF IDs exist on Hugging Face.');
    return;
  }

  console.log(`\nAction: Removing ${invalidIds.size} invalid HF IDs from providers.json...`);
  let removalCount = 0;
  for (const provider of data.providers) {
    for (const model of provider.models) {
      if (model.hf_id && invalidIds.has(model.hf_id)) {
        delete model.hf_id;
        removalCount += 1;
      }
    }
  }
  fs.writeFileSync(PROVIDERS_FILE, JSON.stringify(data, null, 2));
  console.log(`Successfully removed ${removalCount} occurrences.`);
}
94
+
95
+ main().catch(err => {
96
+ console.error('\nFatal error during validation:', err);
97
+ process.exit(1);
98
+ });
src/App.tsx CHANGED
@@ -99,6 +99,8 @@ interface BenchmarkEntry {
99
  // MTEB (Massive Text Embedding Benchmark)
100
  mteb_avg?: number;
101
  mteb_retrieval?: number;
 
 
102
  }
103
 
104
  const normalizeName = (s?: string) =>
@@ -370,7 +372,8 @@ function App() {
370
  case 'aa_intelligence':
371
  case 'aa_tokens_per_s':
372
  case 'mteb_avg':
373
- case 'mteb_retrieval': {
 
374
  try {
375
  const bA = findBenchmark(a.name);
376
  const bB = findBenchmark(b.name);
@@ -527,6 +530,7 @@ function App() {
527
  <th onClick={() => requestSort('aa_tokens_per_s')} className="sortable" title="Artificial Analysis Median Speed (Tokens per Second)">AA Speed {getSortIcon('aa_tokens_per_s')}</th>
528
  <th onClick={() => requestSort('mteb_avg')} className="sortable" title="MTEB (Massive Text Embedding Benchmark) Average">MTEB {getSortIcon('mteb_avg')}</th>
529
  <th onClick={() => requestSort('mteb_retrieval')} className="sortable" title="MTEB Retrieval Average">MTEB-Ret {getSortIcon('mteb_retrieval')}</th>
 
530
  <th onClick={() => requestSort('lb_global')} className="sortable" title="LiveBench overall average (contamination-free)">LB {getSortIcon('lb_global')}</th>
531
  <th onClick={() => requestSort('lb_math')} className="sortable" title="LiveBench Mathematics">LB-Math {getSortIcon('lb_math')}</th>
532
  <th onClick={() => requestSort('lb_coding')} className="sortable" title="LiveBench Coding + Agentic Coding">LB-Code {getSortIcon('lb_coding')}</th>
@@ -632,6 +636,7 @@ function App() {
632
  <td className="benchmark-cell">{fmtNum(bm?.aa_tokens_per_s)}</td>
633
  <td className="benchmark-cell">{fmtNum(bm?.mteb_avg, 1)}</td>
634
  <td className="benchmark-cell">{fmtNum(bm?.mteb_retrieval, 1)}</td>
 
635
  <td className="benchmark-cell">{fmtPct(bm?.lb_global)}</td>
636
  <td className="benchmark-cell">{fmtPct(bm?.lb_math)}</td>
637
  <td className="benchmark-cell">{fmtPct(bm?.lb_coding)}</td>
@@ -646,7 +651,7 @@ function App() {
646
  <td className="benchmark-cell">{fmtPct(bm?.human_eval)}</td>
647
  </>;
648
  } catch (e) {
649
- return Array(18).fill(null).map((_, i) => <td key={i} className="benchmark-cell">–</td>);
650
  }
651
  })()}
652
  </tr>
 
99
  // MTEB (Massive Text Embedding Benchmark)
100
  mteb_avg?: number;
101
  mteb_retrieval?: number;
102
+ // OCR Benchmark
103
+ ocr_avg?: number;
104
  }
105
 
106
  const normalizeName = (s?: string) =>
 
372
  case 'aa_intelligence':
373
  case 'aa_tokens_per_s':
374
  case 'mteb_avg':
375
+ case 'mteb_retrieval':
376
+ case 'ocr_avg': {
377
  try {
378
  const bA = findBenchmark(a.name);
379
  const bB = findBenchmark(b.name);
 
530
  <th onClick={() => requestSort('aa_tokens_per_s')} className="sortable" title="Artificial Analysis Median Speed (Tokens per Second)">AA Speed {getSortIcon('aa_tokens_per_s')}</th>
531
  <th onClick={() => requestSort('mteb_avg')} className="sortable" title="MTEB (Massive Text Embedding Benchmark) Average">MTEB {getSortIcon('mteb_avg')}</th>
532
  <th onClick={() => requestSort('mteb_retrieval')} className="sortable" title="MTEB Retrieval Average">MTEB-Ret {getSortIcon('mteb_retrieval')}</th>
533
+ <th onClick={() => requestSort('ocr_avg')} className="sortable" title="OCR (Optical Character Recognition) Benchmark">OCR {getSortIcon('ocr_avg')}</th>
534
  <th onClick={() => requestSort('lb_global')} className="sortable" title="LiveBench overall average (contamination-free)">LB {getSortIcon('lb_global')}</th>
535
  <th onClick={() => requestSort('lb_math')} className="sortable" title="LiveBench Mathematics">LB-Math {getSortIcon('lb_math')}</th>
536
  <th onClick={() => requestSort('lb_coding')} className="sortable" title="LiveBench Coding + Agentic Coding">LB-Code {getSortIcon('lb_coding')}</th>
 
636
  <td className="benchmark-cell">{fmtNum(bm?.aa_tokens_per_s)}</td>
637
  <td className="benchmark-cell">{fmtNum(bm?.mteb_avg, 1)}</td>
638
  <td className="benchmark-cell">{fmtNum(bm?.mteb_retrieval, 1)}</td>
639
+ <td className="benchmark-cell">{fmtNum(bm?.ocr_avg, 1)}</td>
640
  <td className="benchmark-cell">{fmtPct(bm?.lb_global)}</td>
641
  <td className="benchmark-cell">{fmtPct(bm?.lb_math)}</td>
642
  <td className="benchmark-cell">{fmtPct(bm?.lb_coding)}</td>
 
651
  <td className="benchmark-cell">{fmtPct(bm?.human_eval)}</td>
652
  </>;
653
  } catch (e) {
654
+ return Array(19).fill(null).map((_, i) => <td key={i} className="benchmark-cell">–</td>);
655
  }
656
  })()}
657
  </tr>