CrispStrobe commited on
Commit
ec9cfc9
·
1 Parent(s): c95f8c3

feat: comprehensive audio/multimodal pricing support and improved model metadata enrichment (Whisper, Gemini 3.1, Voxtral)

Browse files
data/providers.json CHANGED
@@ -302,12 +302,12 @@
302
  {
303
  "name": "Whisper V3",
304
  "type": "audio",
305
- "input_price_per_1m": 0.006,
306
- "output_price_per_1m": 0,
307
  "currency": "CHF",
308
  "hf_id": "openai/whisper-large-v3",
309
- "size_b": 0.7,
310
- "hf_private": false
 
 
311
  },
312
  {
313
  "name": "Photomaker V2",
@@ -1163,20 +1163,17 @@
1163
  "hf_private": true
1164
  },
1165
  {
1166
- "name": "openai-responses/gpt-5-nano",
1167
- "type": "vision",
1168
  "input_price_per_1m": 0.05,
1169
- "output_price_per_1m": 0.4,
1170
  "currency": "USD",
1171
- "capabilities": [
1172
- "vision",
1173
- "reasoning"
1174
- ],
1175
- "context_window": 400000,
1176
- "hf_private": true
1177
  },
1178
  {
1179
- "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1180
  "type": "chat",
1181
  "input_price_per_1m": 0.05,
1182
  "output_price_per_1m": 0.05,
@@ -1200,14 +1197,17 @@
1200
  "hf_private": false
1201
  },
1202
  {
1203
- "name": "novita/sao10k/l3-8b-lunaris",
1204
- "type": "chat",
1205
  "input_price_per_1m": 0.05,
1206
- "output_price_per_1m": 0.05,
1207
  "currency": "USD",
1208
- "context_window": 8192,
1209
- "size_b": 8,
1210
- "hf_private": false
 
 
 
1211
  },
1212
  {
1213
  "name": "azure/gpt-5-nano",
@@ -1264,18 +1264,6 @@
1264
  "hf_id": "Gryphe/MythoMax-L2-13b",
1265
  "hf_private": false
1266
  },
1267
- {
1268
- "name": "openai-responses/gpt-4.1-nano",
1269
- "type": "vision",
1270
- "input_price_per_1m": 0.1,
1271
- "output_price_per_1m": 0.4,
1272
- "currency": "USD",
1273
- "capabilities": [
1274
- "vision"
1275
- ],
1276
- "context_window": 1047576,
1277
- "hf_private": true
1278
- },
1279
  {
1280
  "name": "google/gemini-2.0-flash-001",
1281
  "type": "vision",
@@ -1338,21 +1326,6 @@
1338
  "size_b": 24,
1339
  "hf_private": false
1340
  },
1341
- {
1342
- "name": "deepinfra/Qwen/Qwen3-32B",
1343
- "type": "chat",
1344
- "input_price_per_1m": 0.1,
1345
- "output_price_per_1m": 0.3,
1346
- "currency": "USD",
1347
- "context_window": 40000,
1348
- "size_b": 32,
1349
- "capabilities": [
1350
- "tools",
1351
- "reasoning"
1352
- ],
1353
- "hf_id": "Qwen/Qwen3-32B",
1354
- "hf_private": false
1355
- },
1356
  {
1357
  "name": "vertex/gemini-2.5-flash-lite",
1358
  "type": "vision",
@@ -1367,19 +1340,7 @@
1367
  "hf_private": true
1368
  },
1369
  {
1370
- "name": "azure/gpt-4.1-nano",
1371
- "type": "vision",
1372
- "input_price_per_1m": 0.1,
1373
- "output_price_per_1m": 0.4,
1374
- "currency": "USD",
1375
- "capabilities": [
1376
- "vision"
1377
- ],
1378
- "context_window": 1047576,
1379
- "hf_private": true
1380
- },
1381
- {
1382
- "name": "azure/openai-responses/gpt-4.1-nano",
1383
  "type": "vision",
1384
  "input_price_per_1m": 0.1,
1385
  "output_price_per_1m": 0.4,
@@ -1400,6 +1361,21 @@
1400
  "size_b": 8,
1401
  "hf_private": false
1402
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1403
  {
1404
  "name": "groq/openai/gpt-oss-20b",
1405
  "type": "chat",
@@ -1416,7 +1392,31 @@
1416
  "hf_private": false
1417
  },
1418
  {
1419
- "name": "openai/gpt-4.1-nano",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1420
  "type": "vision",
1421
  "input_price_per_1m": 0.1,
1422
  "output_price_per_1m": 0.4,
@@ -1479,6 +1479,19 @@
1479
  "hf_id": "NousResearch/Hermes-2-Pro-Llama-3-8B",
1480
  "hf_private": false
1481
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
1482
  {
1483
  "name": "mistral/mistral-small-2603",
1484
  "type": "vision",
@@ -1495,17 +1508,18 @@
1495
  "hf_private": false
1496
  },
1497
  {
1498
- "name": "mistral/mistral-small-latest",
1499
- "type": "vision",
1500
  "input_price_per_1m": 0.15,
1501
  "output_price_per_1m": 0.6,
1502
  "currency": "USD",
1503
  "capabilities": [
1504
- "vision",
1505
  "reasoning"
1506
  ],
1507
- "context_window": 256000,
1508
- "hf_private": true
 
 
1509
  },
1510
  {
1511
  "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
@@ -1523,6 +1537,18 @@
1523
  "size_source": "manual",
1524
  "hf_private": false
1525
  },
 
 
 
 
 
 
 
 
 
 
 
 
1526
  {
1527
  "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1528
  "type": "chat",
@@ -1548,32 +1574,6 @@
1548
  "hf_id": "openai/gpt-oss-120b",
1549
  "hf_private": false
1550
  },
1551
- {
1552
- "name": "openai/gpt-4o-mini",
1553
- "type": "vision",
1554
- "input_price_per_1m": 0.15,
1555
- "output_price_per_1m": 0.6,
1556
- "currency": "USD",
1557
- "capabilities": [
1558
- "vision"
1559
- ],
1560
- "context_window": 128000,
1561
- "hf_private": true
1562
- },
1563
- {
1564
- "name": "nebius/openai/gpt-oss-120b",
1565
- "type": "chat",
1566
- "input_price_per_1m": 0.15,
1567
- "output_price_per_1m": 0.6,
1568
- "currency": "USD",
1569
- "capabilities": [
1570
- "reasoning"
1571
- ],
1572
- "context_window": 131000,
1573
- "size_b": 120,
1574
- "hf_id": "openai/gpt-oss-120b",
1575
- "hf_private": false
1576
- },
1577
  {
1578
  "name": "novita/mistralai/mistral-nemo",
1579
  "type": "chat",
@@ -1613,7 +1613,37 @@
1613
  "hf_private": false
1614
  },
1615
  {
1616
- "name": "openai-responses/gpt-5.4-nano",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1617
  "type": "vision",
1618
  "input_price_per_1m": 0.2,
1619
  "output_price_per_1m": 1.25,
@@ -1625,6 +1655,16 @@
1625
  "context_window": 400000,
1626
  "hf_private": true
1627
  },
 
 
 
 
 
 
 
 
 
 
1628
  {
1629
  "name": "xai/grok-4-fast",
1630
  "type": "chat",
@@ -1651,6 +1691,18 @@
1651
  "context_window": 2000000,
1652
  "hf_private": true
1653
  },
 
 
 
 
 
 
 
 
 
 
 
 
1654
  {
1655
  "name": "xai/grok-code-fast-1",
1656
  "type": "vision",
@@ -1678,24 +1730,12 @@
1678
  "hf_private": true
1679
  },
1680
  {
1681
- "name": "xai/grok-4-1-fast-non-reasoning",
1682
- "type": "vision",
1683
- "input_price_per_1m": 0.2,
1684
- "output_price_per_1m": 0.5,
1685
- "currency": "USD",
1686
- "capabilities": [
1687
- "vision"
1688
- ],
1689
- "context_window": 2000000,
1690
- "hf_private": true
1691
- },
1692
- {
1693
- "name": "novita/qwen/qwen3-235b-a22b-fp8",
1694
  "type": "chat",
1695
  "input_price_per_1m": 0.2,
1696
- "output_price_per_1m": 0.8,
1697
  "currency": "USD",
1698
- "context_window": 128000,
1699
  "size_b": 235,
1700
  "capabilities": [
1701
  "tools",
@@ -1705,40 +1745,10 @@
1705
  "hf_private": false
1706
  },
1707
  {
1708
- "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1709
  "type": "chat",
1710
  "input_price_per_1m": 0.2,
1711
- "output_price_per_1m": 0.85,
1712
- "currency": "USD",
1713
- "context_window": 1048576,
1714
- "size_b": 17,
1715
- "capabilities": [
1716
- "vision",
1717
- "tools"
1718
- ],
1719
- "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
1720
- "hf_private": false
1721
- },
1722
- {
1723
- "name": "deepinfra/Qwen/Qwen3-235B-A22B",
1724
- "type": "chat",
1725
- "input_price_per_1m": 0.2,
1726
- "output_price_per_1m": 0.6,
1727
- "currency": "USD",
1728
- "context_window": 40000,
1729
- "size_b": 235,
1730
- "capabilities": [
1731
- "tools",
1732
- "reasoning"
1733
- ],
1734
- "hf_id": "Qwen/Qwen3-235B-A22B",
1735
- "hf_private": false
1736
- },
1737
- {
1738
- "name": "deepinfra/zai-org/GLM-4.5-Air",
1739
- "type": "chat",
1740
- "input_price_per_1m": 0.2,
1741
- "output_price_per_1m": 1.1,
1742
  "currency": "USD",
1743
  "context_window": 131072,
1744
  "capabilities": [
@@ -1750,17 +1760,7 @@
1750
  "hf_private": false
1751
  },
1752
  {
1753
- "name": "together/meta-llama/LlamaGuard-2-8b",
1754
- "type": "chat",
1755
- "input_price_per_1m": 0.2,
1756
- "output_price_per_1m": 0.2,
1757
- "currency": "USD",
1758
- "context_window": 8192,
1759
- "size_b": 8,
1760
- "hf_private": false
1761
- },
1762
- {
1763
- "name": "openai/gpt-5.4-nano",
1764
  "type": "vision",
1765
  "input_price_per_1m": 0.2,
1766
  "output_price_per_1m": 1.25,
@@ -1773,27 +1773,17 @@
1773
  "hf_private": true
1774
  },
1775
  {
1776
- "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1777
  "type": "chat",
1778
  "input_price_per_1m": 0.23,
1779
- "output_price_per_1m": 0.69,
1780
  "currency": "USD",
1781
- "context_window": 64000,
1782
- "size_b": 70,
1783
  "capabilities": [
1784
- "reasoning"
1785
  ],
1786
- "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1787
- "hf_private": false
1788
- },
1789
- {
1790
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct",
1791
- "type": "chat",
1792
- "input_price_per_1m": 0.23,
1793
- "output_price_per_1m": 0.4,
1794
- "currency": "USD",
1795
- "context_window": 130815,
1796
- "size_b": 70,
1797
  "hf_private": false
1798
  },
1799
  {
@@ -1811,31 +1801,28 @@
1811
  "hf_private": false
1812
  },
1813
  {
1814
- "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1815
  "type": "chat",
1816
  "input_price_per_1m": 0.23,
1817
- "output_price_per_1m": 0.4,
1818
  "currency": "USD",
1819
- "context_window": 131072,
1820
- "size_b": 72,
1821
  "capabilities": [
1822
- "vision"
1823
  ],
1824
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
1825
  "hf_private": false
1826
  },
1827
  {
1828
- "name": "openai-responses/gpt-5-mini",
1829
- "type": "vision",
1830
- "input_price_per_1m": 0.25,
1831
- "output_price_per_1m": 2,
1832
  "currency": "USD",
1833
- "capabilities": [
1834
- "vision",
1835
- "reasoning"
1836
- ],
1837
- "context_window": 400000,
1838
- "hf_private": true
1839
  },
1840
  {
1841
  "name": "google/gemini-3.1-flash-lite-preview",
@@ -1871,6 +1858,19 @@
1871
  "context_window": 1048576,
1872
  "hf_private": true
1873
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
1874
  {
1875
  "name": "azure/gpt-5-mini",
1876
  "type": "chat",
@@ -1934,19 +1934,29 @@
1934
  "hf_private": true
1935
  },
1936
  {
1937
- "name": "xai/grok-3-mini",
1938
- "type": "chat",
1939
  "input_price_per_1m": 0.3,
1940
- "output_price_per_1m": 0.5,
1941
  "currency": "USD",
1942
  "capabilities": [
 
1943
  "reasoning"
1944
  ],
 
 
 
 
 
 
 
 
 
1945
  "context_window": 131072,
1946
  "hf_private": true
1947
  },
1948
  {
1949
- "name": "google/gemini-2.5-flash",
1950
  "type": "vision",
1951
  "input_price_per_1m": 0.3,
1952
  "output_price_per_1m": 2.5,
@@ -1959,16 +1969,48 @@
1959
  "hf_private": true
1960
  },
1961
  {
1962
- "name": "mistral/codestral-latest",
1963
- "type": "chat",
1964
  "input_price_per_1m": 0.3,
1965
- "output_price_per_1m": 0.9,
1966
  "currency": "USD",
1967
- "context_window": 131072,
 
 
 
 
1968
  "hf_private": true
1969
  },
1970
  {
1971
- "name": "novita/MiniMax-M2.7",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1972
  "type": "vision",
1973
  "input_price_per_1m": 0.3,
1974
  "output_price_per_1m": 1.2,
@@ -1984,7 +2026,7 @@
1984
  "size_source": "manual"
1985
  },
1986
  {
1987
- "name": "novita/minimax-m2.7",
1988
  "type": "vision",
1989
  "input_price_per_1m": 0.3,
1990
  "output_price_per_1m": 1.2,
@@ -2014,58 +2056,50 @@
2014
  "hf_private": false
2015
  },
2016
  {
2017
- "name": "coding/gemini-2.5-flash",
2018
  "type": "vision",
2019
  "input_price_per_1m": 0.3,
2020
- "output_price_per_1m": 2.5,
2021
  "currency": "USD",
2022
  "capabilities": [
2023
  "vision",
2024
  "reasoning"
2025
  ],
2026
- "context_window": 1048576,
2027
- "hf_private": true
2028
- },
2029
- {
2030
- "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
2031
- "type": "chat",
2032
- "input_price_per_1m": 0.3,
2033
- "output_price_per_1m": 1,
2034
- "currency": "USD",
2035
- "context_window": 163840,
2036
- "capabilities": [
2037
- "tools",
2038
- "reasoning"
2039
- ],
2040
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2041
- "size_b": 671,
2042
- "hf_private": false
2043
  },
2044
  {
2045
- "name": "vertex/gemini-2.5-flash",
2046
  "type": "vision",
2047
  "input_price_per_1m": 0.3,
2048
- "output_price_per_1m": 2.5,
2049
  "currency": "USD",
2050
  "capabilities": [
2051
  "vision",
2052
  "reasoning"
2053
  ],
2054
- "context_window": 1048576,
2055
- "hf_private": true
 
 
2056
  },
2057
  {
2058
- "name": "vertex/gemini-2.5-flash-image",
2059
- "type": "vision",
2060
  "input_price_per_1m": 0.3,
2061
- "output_price_per_1m": 2.5,
2062
  "currency": "USD",
 
2063
  "capabilities": [
2064
- "vision",
2065
  "reasoning"
2066
  ],
2067
- "context_window": 1048576,
2068
- "hf_private": true
 
2069
  },
2070
  {
2071
  "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
@@ -2088,78 +2122,44 @@
2088
  "hf_private": false
2089
  },
2090
  {
2091
- "name": "nebius/deepseek-ai/DeepSeek-V3.2",
2092
- "type": "chat",
2093
- "input_price_per_1m": 0.3,
2094
- "output_price_per_1m": 0.45,
2095
- "currency": "USD",
2096
- "capabilities": [
2097
- "reasoning"
2098
- ],
2099
- "context_window": 164000,
2100
- "hf_id": "deepseek-ai/DeepSeek-V3.2",
2101
- "size_b": 685.4,
2102
- "hf_private": false
2103
- },
2104
- {
2105
- "name": "nebius/minimax/minimax-m2.1",
2106
  "type": "chat",
2107
  "input_price_per_1m": 0.3,
2108
- "output_price_per_1m": 1.2,
2109
  "currency": "USD",
2110
  "capabilities": [
2111
  "reasoning"
2112
  ],
2113
- "context_window": 200000,
2114
- "hf_id": "MiniMaxAI/MiniMax-M2.1",
2115
- "size_b": 228.7,
2116
- "hf_private": false
2117
  },
2118
  {
2119
- "name": "minimaxi/MiniMax-M2",
2120
  "type": "chat",
2121
  "input_price_per_1m": 0.3,
2122
- "output_price_per_1m": 1.2,
2123
  "currency": "USD",
2124
- "context_window": 200000,
2125
  "capabilities": [
2126
  "tools",
2127
  "reasoning"
2128
  ],
2129
- "hf_id": "MiniMaxAI/MiniMax-M2",
2130
- "size_b": 228.7,
2131
- "hf_private": false
2132
- },
2133
- {
2134
- "name": "minimaxi/MiniMax-M2.5",
2135
- "type": "vision",
2136
- "input_price_per_1m": 0.3,
2137
- "output_price_per_1m": 1.2,
2138
- "currency": "USD",
2139
- "capabilities": [
2140
- "vision",
2141
- "reasoning"
2142
- ],
2143
- "context_window": 200000,
2144
- "hf_id": "MiniMaxAI/MiniMax-M2.5",
2145
- "size_b": 228.7,
2146
  "hf_private": false
2147
  },
2148
  {
2149
- "name": "minimaxi/MiniMax-M2.7",
2150
  "type": "vision",
2151
  "input_price_per_1m": 0.3,
2152
- "output_price_per_1m": 1.2,
2153
  "currency": "USD",
2154
  "capabilities": [
2155
  "vision",
2156
  "reasoning"
2157
  ],
2158
- "context_window": 200000,
2159
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
2160
- "hf_private": false,
2161
- "size_b": 230,
2162
- "size_source": "manual"
2163
  },
2164
  {
2165
  "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct",
@@ -2211,18 +2211,6 @@
2211
  ],
2212
  "hf_private": true
2213
  },
2214
- {
2215
- "name": "openai-responses/gpt-4.1-mini",
2216
- "type": "vision",
2217
- "input_price_per_1m": 0.4,
2218
- "output_price_per_1m": 1.6,
2219
- "currency": "USD",
2220
- "capabilities": [
2221
- "vision"
2222
- ],
2223
- "context_window": 1047576,
2224
- "hf_private": true
2225
- },
2226
  {
2227
  "name": "mistral/devstral-medium-2507",
2228
  "type": "chat",
@@ -2253,6 +2241,34 @@
2253
  "context_window": 131072,
2254
  "hf_private": true
2255
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2256
  {
2257
  "name": "novita/deepseek/deepseek-v3-0324",
2258
  "type": "chat",
@@ -2277,6 +2293,18 @@
2277
  "context_window": 128000,
2278
  "hf_private": true
2279
  },
 
 
 
 
 
 
 
 
 
 
 
 
2280
  {
2281
  "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2282
  "type": "chat",
@@ -2292,7 +2320,7 @@
2292
  "hf_private": false
2293
  },
2294
  {
2295
- "name": "azure/gpt-4.1-mini",
2296
  "type": "vision",
2297
  "input_price_per_1m": 0.4,
2298
  "output_price_per_1m": 1.6,
@@ -2304,7 +2332,7 @@
2304
  "hf_private": true
2305
  },
2306
  {
2307
- "name": "azure/openai-responses/gpt-4.1-mini",
2308
  "type": "vision",
2309
  "input_price_per_1m": 0.4,
2310
  "output_price_per_1m": 1.6,
@@ -2316,7 +2344,7 @@
2316
  "hf_private": true
2317
  },
2318
  {
2319
- "name": "openai/gpt-4.1-mini",
2320
  "type": "vision",
2321
  "input_price_per_1m": 0.4,
2322
  "output_price_per_1m": 1.6,
@@ -2327,34 +2355,6 @@
2327
  "context_window": 1047576,
2328
  "hf_private": true
2329
  },
2330
- {
2331
- "name": "nebius/zai-org/GLM-4.7",
2332
- "type": "chat",
2333
- "input_price_per_1m": 0.4,
2334
- "output_price_per_1m": 2,
2335
- "currency": "USD",
2336
- "capabilities": [
2337
- "reasoning"
2338
- ],
2339
- "context_window": 200000,
2340
- "hf_id": "zai-org/GLM-4.7",
2341
- "size_b": 358.3,
2342
- "hf_private": false
2343
- },
2344
- {
2345
- "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2346
- "type": "chat",
2347
- "input_price_per_1m": 0.4,
2348
- "output_price_per_1m": 1.8,
2349
- "currency": "USD",
2350
- "context_window": 262000,
2351
- "size_b": 480,
2352
- "capabilities": [
2353
- "tools"
2354
- ],
2355
- "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
2356
- "hf_private": false
2357
- },
2358
  {
2359
  "name": "google/gemini-3.1-flash-image-preview",
2360
  "type": "vision",
@@ -2419,21 +2419,6 @@
2419
  "context_window": 131072,
2420
  "hf_private": true
2421
  },
2422
- {
2423
- "name": "nebius/moonshotai/kimi-k2.5",
2424
- "type": "vision",
2425
- "input_price_per_1m": 0.5,
2426
- "output_price_per_1m": 2.5,
2427
- "currency": "USD",
2428
- "capabilities": [
2429
- "vision",
2430
- "reasoning"
2431
- ],
2432
- "context_window": 256000,
2433
- "hf_id": "moonshotai/Kimi-K2.5",
2434
- "size_b": 1058.6,
2435
- "hf_private": false
2436
- },
2437
  {
2438
  "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2439
  "type": "chat",
@@ -2453,14 +2438,29 @@
2453
  "name": "nebius/moonshotai/Kimi-K2-Instruct",
2454
  "type": "chat",
2455
  "input_price_per_1m": 0.5,
2456
- "output_price_per_1m": 2.4,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2457
  "currency": "USD",
2458
- "context_window": 131000,
2459
  "capabilities": [
2460
- "tools"
 
2461
  ],
2462
- "hf_id": "moonshotai/Kimi-K2-Instruct",
2463
- "size_b": 1026.5,
 
2464
  "hf_private": false
2465
  },
2466
  {
@@ -2519,18 +2519,17 @@
2519
  "hf_private": false
2520
  },
2521
  {
2522
- "name": "alibaba/qwen3.5",
2523
- "type": "vision",
2524
  "input_price_per_1m": 0.6,
2525
- "output_price_per_1m": 3.6,
2526
  "currency": "USD",
 
2527
  "capabilities": [
2528
- "vision",
2529
- "reasoning"
2530
  ],
2531
- "context_window": 256000,
2532
- "size_b": 9,
2533
- "hf_id": "Qwen/Qwen3.5-9B",
2534
  "hf_private": false
2535
  },
2536
  {
@@ -2592,51 +2591,52 @@
2592
  "hf_private": false
2593
  },
2594
  {
2595
- "name": "moonshot/kimi-k2-0905-preview",
2596
- "type": "chat",
2597
  "input_price_per_1m": 0.6,
2598
- "output_price_per_1m": 2.5,
2599
  "currency": "USD",
2600
- "context_window": 131072,
2601
  "capabilities": [
2602
- "tools"
 
2603
  ],
2604
- "hf_id": "moonshotai/Kimi-K2-Instruct-0905",
2605
- "size_b": 1026.5,
 
2606
  "hf_private": false
2607
  },
2608
  {
2609
- "name": "novita/zai-org/glm-4.6",
2610
  "type": "chat",
2611
  "input_price_per_1m": 0.6,
2612
  "output_price_per_1m": 2.2,
2613
  "currency": "USD",
2614
- "context_window": 204800,
2615
  "capabilities": [
2616
  "tools",
2617
  "reasoning"
2618
  ],
2619
- "hf_id": "zai-org/GLM-4.6",
2620
- "size_b": 356.8,
2621
  "hf_private": false
2622
  },
2623
  {
2624
- "name": "novita/zai-org/glm-4.5",
2625
  "type": "chat",
2626
  "input_price_per_1m": 0.6,
2627
  "output_price_per_1m": 2.2,
2628
  "currency": "USD",
2629
- "context_window": 131072,
2630
  "capabilities": [
2631
  "tools",
2632
  "reasoning"
2633
  ],
2634
- "hf_id": "zai-org/GLM-4.5",
2635
- "size_b": 358.3,
2636
  "hf_private": false
2637
  },
2638
  {
2639
- "name": "deepinfra/zai-org/GLM-4.5",
2640
  "type": "chat",
2641
  "input_price_per_1m": 0.6,
2642
  "output_price_per_1m": 2.2,
@@ -2651,31 +2651,34 @@
2651
  "hf_private": false
2652
  },
2653
  {
2654
- "name": "zai/GLM-4.7",
2655
- "type": "chat",
2656
  "input_price_per_1m": 0.6,
2657
- "output_price_per_1m": 2.2,
2658
  "currency": "USD",
2659
  "capabilities": [
 
2660
  "reasoning"
2661
  ],
2662
  "context_window": 200000,
2663
- "hf_id": "zai-org/GLM-4.7",
2664
- "size_b": 358.3,
2665
- "hf_private": false
 
2666
  },
2667
  {
2668
- "name": "zai/GLM-4.5",
2669
- "type": "chat",
2670
  "input_price_per_1m": 0.6,
2671
- "output_price_per_1m": 2.2,
2672
  "currency": "USD",
2673
  "capabilities": [
 
2674
  "reasoning"
2675
  ],
2676
- "context_window": 131072,
2677
- "hf_id": "zai-org/GLM-4.5",
2678
- "size_b": 358.3,
2679
  "hf_private": false
2680
  },
2681
  {
@@ -2693,49 +2696,46 @@
2693
  "hf_private": false
2694
  },
2695
  {
2696
- "name": "nebius/zai-org/GLM-4.5",
2697
  "type": "chat",
2698
  "input_price_per_1m": 0.6,
2699
  "output_price_per_1m": 2.2,
2700
  "currency": "USD",
2701
- "context_window": 128000,
2702
  "capabilities": [
2703
- "tools",
2704
  "reasoning"
2705
  ],
2706
- "hf_id": "zai-org/GLM-4.5",
 
2707
  "size_b": 358.3,
2708
  "hf_private": false
2709
  },
2710
  {
2711
- "name": "minimaxi/MiniMax-M2.7-highspeed",
2712
- "type": "vision",
2713
  "input_price_per_1m": 0.6,
2714
- "output_price_per_1m": 2.4,
2715
  "currency": "USD",
2716
  "capabilities": [
2717
- "vision",
2718
  "reasoning"
2719
  ],
2720
- "context_window": 200000,
2721
- "hf_id": "MiniMaxAI/MiniMax-M2.7",
2722
- "hf_private": false,
2723
- "size_b": 230,
2724
- "size_source": "manual"
2725
  },
2726
  {
2727
- "name": "minimaxi/MiniMax-M2.5-highspeed",
2728
- "type": "vision",
2729
  "input_price_per_1m": 0.6,
2730
- "output_price_per_1m": 2.4,
2731
  "currency": "USD",
 
2732
  "capabilities": [
2733
- "vision",
2734
  "reasoning"
2735
  ],
2736
- "context_window": 200000,
2737
- "hf_id": "MiniMaxAI/MiniMax-M2.5",
2738
- "size_b": 228.7,
2739
  "hf_private": false
2740
  },
2741
  {
@@ -2802,7 +2802,7 @@
2802
  "hf_private": false
2803
  },
2804
  {
2805
- "name": "openai-responses/gpt-5.4-mini",
2806
  "type": "vision",
2807
  "input_price_per_1m": 0.75,
2808
  "output_price_per_1m": 4.5,
@@ -2815,7 +2815,7 @@
2815
  "hf_private": true
2816
  },
2817
  {
2818
- "name": "openai/gpt-5.4-mini",
2819
  "type": "vision",
2820
  "input_price_per_1m": 0.75,
2821
  "output_price_per_1m": 4.5,
@@ -2828,17 +2828,18 @@
2828
  "hf_private": true
2829
  },
2830
  {
2831
- "name": "novita/qwen/qwen2.5-vl-72b-instruct",
2832
  "type": "chat",
2833
  "input_price_per_1m": 0.8,
2834
- "output_price_per_1m": 0.8,
2835
  "currency": "USD",
2836
- "context_window": 96000,
2837
- "size_b": 72,
2838
  "capabilities": [
2839
- "vision"
 
2840
  ],
2841
- "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
 
2842
  "hf_private": false
2843
  },
2844
  {
@@ -2856,59 +2857,58 @@
2856
  "hf_private": false
2857
  },
2858
  {
2859
- "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct",
2860
  "type": "chat",
2861
  "input_price_per_1m": 0.8,
2862
  "output_price_per_1m": 0.8,
2863
  "currency": "USD",
2864
- "context_window": 130815,
2865
- "size_b": 405,
 
 
 
 
2866
  "hf_private": false
2867
  },
2868
  {
2869
- "name": "nebius/deepseek-ai/DeepSeek-R1-0528",
2870
  "type": "chat",
2871
  "input_price_per_1m": 0.8,
2872
- "output_price_per_1m": 2.4,
2873
  "currency": "USD",
2874
- "context_window": 164000,
2875
- "capabilities": [
2876
- "tools",
2877
- "reasoning"
2878
- ],
2879
- "hf_id": "deepseek-ai/DeepSeek-R1-0528",
2880
- "size_b": 684.5,
2881
  "hf_private": false
2882
  },
2883
  {
2884
- "name": "deepinfra/deepseek-ai/DeepSeek-V3",
2885
  "type": "chat",
2886
  "input_price_per_1m": 0.85,
2887
- "output_price_per_1m": 0.9,
2888
  "currency": "USD",
2889
- "context_window": 128000,
2890
  "capabilities": [
2891
  "tools",
2892
  "reasoning"
2893
  ],
2894
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2895
  "size_b": 671,
 
2896
  "hf_private": false
2897
  },
2898
  {
2899
- "name": "deepinfra/deepseek-ai/DeepSeek-R1",
2900
  "type": "chat",
2901
  "input_price_per_1m": 0.85,
2902
- "output_price_per_1m": 2.5,
2903
  "currency": "USD",
2904
- "context_window": 64000,
2905
  "capabilities": [
2906
  "tools",
2907
  "reasoning"
2908
  ],
2909
- "hf_id": "deepseek-ai/DeepSeek-R1",
2910
  "size_b": 671,
2911
- "size_source": "manual",
2912
  "hf_private": false
2913
  },
2914
  {
@@ -2924,27 +2924,27 @@
2924
  "hf_private": true
2925
  },
2926
  {
2927
- "name": "together/meta-llama/Llama-3.3-70B-Instruct-Turbo",
2928
  "type": "chat",
2929
  "input_price_per_1m": 0.88,
2930
  "output_price_per_1m": 0.88,
2931
  "currency": "USD",
2932
  "context_window": 131072,
2933
  "size_b": 70,
2934
- "capabilities": [
2935
- "tools"
2936
- ],
2937
- "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
2938
  "hf_private": false
2939
  },
2940
  {
2941
- "name": "together/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
2942
  "type": "chat",
2943
  "input_price_per_1m": 0.88,
2944
  "output_price_per_1m": 0.88,
2945
  "currency": "USD",
2946
  "context_window": 131072,
2947
  "size_b": 70,
 
 
 
 
2948
  "hf_private": false
2949
  },
2950
  {
@@ -2984,7 +2984,7 @@
2984
  "hf_private": true
2985
  },
2986
  {
2987
- "name": "anthropic/claude-haiku-4-5",
2988
  "type": "vision",
2989
  "input_price_per_1m": 1,
2990
  "output_price_per_1m": 5,
@@ -2996,7 +2996,7 @@
2996
  "hf_private": true
2997
  },
2998
  {
2999
- "name": "bedrock/claude-haiku-4-5",
3000
  "type": "vision",
3001
  "input_price_per_1m": 1,
3002
  "output_price_per_1m": 5,
@@ -3021,6 +3021,19 @@
3021
  "size_b": 753.9,
3022
  "hf_private": false
3023
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
3024
  {
3025
  "name": "zai/GLM-5",
3026
  "type": "vision",
@@ -3037,30 +3050,28 @@
3037
  "hf_private": false
3038
  },
3039
  {
3040
- "name": "vertex/claude-haiku-4-5",
3041
- "type": "vision",
3042
  "input_price_per_1m": 1,
3043
- "output_price_per_1m": 5,
3044
  "currency": "USD",
 
3045
  "capabilities": [
3046
  "vision"
3047
  ],
3048
- "context_window": 200000,
3049
  "hf_private": true
3050
  },
3051
  {
3052
- "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
3053
- "type": "chat",
3054
  "input_price_per_1m": 1,
3055
- "output_price_per_1m": 3,
3056
  "currency": "USD",
3057
- "context_window": 256000,
3058
  "capabilities": [
3059
- "tools"
3060
  ],
3061
- "hf_id": "moonshotai/Kimi-K2-Instruct",
3062
- "size_b": 1026.5,
3063
- "hf_private": false
3064
  },
3065
  {
3066
  "name": "groq/moonshotai/kimi-k2-instruct",
@@ -3077,32 +3088,21 @@
3077
  "hf_private": false
3078
  },
3079
  {
3080
- "name": "perplexity/sonar",
3081
  "type": "chat",
3082
  "input_price_per_1m": 1,
3083
- "output_price_per_1m": 1,
3084
- "currency": "USD",
3085
- "context_window": 131072,
3086
- "capabilities": [
3087
- "vision"
3088
- ],
3089
- "hf_private": true
3090
- },
3091
- {
3092
- "name": "openai/o3",
3093
- "type": "vision",
3094
- "input_price_per_1m": 1,
3095
- "output_price_per_1m": 4,
3096
  "currency": "USD",
 
3097
  "capabilities": [
3098
- "vision",
3099
- "reasoning"
3100
  ],
3101
- "context_window": 200000,
3102
- "hf_private": true
 
3103
  },
3104
  {
3105
- "name": "openai-responses/o4-mini",
3106
  "type": "chat",
3107
  "input_price_per_1m": 1.1,
3108
  "output_price_per_1m": 4.4,
@@ -3126,7 +3126,7 @@
3126
  "hf_private": true
3127
  },
3128
  {
3129
- "name": "azure/o4-mini",
3130
  "type": "chat",
3131
  "input_price_per_1m": 1.1,
3132
  "output_price_per_1m": 4.4,
@@ -3138,7 +3138,7 @@
3138
  "hf_private": true
3139
  },
3140
  {
3141
- "name": "openai/o3-mini",
3142
  "type": "chat",
3143
  "input_price_per_1m": 1.1,
3144
  "output_price_per_1m": 4.4,
@@ -3174,7 +3174,7 @@
3174
  "hf_private": false
3175
  },
3176
  {
3177
- "name": "openai-responses/gpt-5",
3178
  "type": "vision",
3179
  "input_price_per_1m": 1.25,
3180
  "output_price_per_1m": 10,
@@ -3183,11 +3183,11 @@
3183
  "vision",
3184
  "reasoning"
3185
  ],
3186
- "context_window": 400000,
3187
  "hf_private": true
3188
  },
3189
  {
3190
- "name": "openai-responses/gpt-5.1",
3191
  "type": "vision",
3192
  "input_price_per_1m": 1.25,
3193
  "output_price_per_1m": 10,
@@ -3196,11 +3196,11 @@
3196
  "vision",
3197
  "reasoning"
3198
  ],
3199
- "context_window": 400000,
3200
  "hf_private": true
3201
  },
3202
  {
3203
- "name": "openai-responses/gpt-5-codex",
3204
  "type": "vision",
3205
  "input_price_per_1m": 1.25,
3206
  "output_price_per_1m": 10,
@@ -3209,11 +3209,11 @@
3209
  "vision",
3210
  "reasoning"
3211
  ],
3212
- "context_window": 400000,
3213
  "hf_private": true
3214
  },
3215
  {
3216
- "name": "openai-responses/gpt-5.1-codex",
3217
  "type": "vision",
3218
  "input_price_per_1m": 1.25,
3219
  "output_price_per_1m": 10,
@@ -3226,7 +3226,7 @@
3226
  "hf_private": true
3227
  },
3228
  {
3229
- "name": "google/gemini-2.5-pro",
3230
  "type": "vision",
3231
  "input_price_per_1m": 1.25,
3232
  "output_price_per_1m": 10,
@@ -3235,24 +3235,26 @@
3235
  "vision",
3236
  "reasoning"
3237
  ],
3238
- "context_window": 1048576,
3239
  "hf_private": true
3240
  },
3241
  {
3242
- "name": "coding/gemini-2.5-pro",
3243
- "type": "vision",
3244
  "input_price_per_1m": 1.25,
3245
- "output_price_per_1m": 10,
3246
  "currency": "USD",
 
3247
  "capabilities": [
3248
- "vision",
3249
  "reasoning"
3250
  ],
3251
- "context_window": 1048576,
3252
- "hf_private": true
 
3253
  },
3254
  {
3255
- "name": "vertex/gemini-2.5-pro",
3256
  "type": "vision",
3257
  "input_price_per_1m": 1.25,
3258
  "output_price_per_1m": 10,
@@ -3261,76 +3263,74 @@
3261
  "vision",
3262
  "reasoning"
3263
  ],
3264
- "context_window": 1048576,
3265
  "hf_private": true
3266
  },
3267
  {
3268
- "name": "azure/gpt-5",
3269
- "type": "chat",
3270
  "input_price_per_1m": 1.25,
3271
  "output_price_per_1m": 10,
3272
  "currency": "USD",
3273
  "capabilities": [
 
3274
  "reasoning"
3275
  ],
3276
- "context_window": 200000,
3277
  "hf_private": true
3278
  },
3279
  {
3280
- "name": "azure/gpt-5.1",
3281
- "type": "chat",
3282
  "input_price_per_1m": 1.25,
3283
  "output_price_per_1m": 10,
3284
  "currency": "USD",
3285
  "capabilities": [
 
3286
  "reasoning"
3287
  ],
3288
- "context_window": 200000,
3289
  "hf_private": true
3290
  },
3291
  {
3292
- "name": "together/deepseek-ai/DeepSeek-V3",
3293
- "type": "chat",
3294
  "input_price_per_1m": 1.25,
3295
- "output_price_per_1m": 1.25,
3296
  "currency": "USD",
3297
- "context_window": 131072,
3298
  "capabilities": [
3299
- "tools",
3300
  "reasoning"
3301
  ],
3302
- "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3303
- "size_b": 671,
3304
- "hf_private": false
3305
  },
3306
  {
3307
- "name": "openai/gpt-5-chat",
3308
- "type": "vision",
3309
  "input_price_per_1m": 1.25,
3310
  "output_price_per_1m": 10,
3311
  "currency": "USD",
3312
  "capabilities": [
3313
- "vision",
3314
  "reasoning"
3315
  ],
3316
- "context_window": 128000,
3317
  "hf_private": true
3318
  },
3319
  {
3320
- "name": "openai/gpt-5.1",
3321
- "type": "vision",
3322
  "input_price_per_1m": 1.25,
3323
  "output_price_per_1m": 10,
3324
  "currency": "USD",
3325
  "capabilities": [
3326
- "vision",
3327
  "reasoning"
3328
  ],
3329
- "context_window": 400000,
3330
  "hf_private": true
3331
  },
3332
  {
3333
- "name": "openai/gpt-5.1-chat",
3334
  "type": "vision",
3335
  "input_price_per_1m": 1.25,
3336
  "output_price_per_1m": 10,
@@ -3339,7 +3339,7 @@
3339
  "vision",
3340
  "reasoning"
3341
  ],
3342
- "context_window": 128000,
3343
  "hf_private": true
3344
  },
3345
  {
@@ -3375,7 +3375,7 @@
3375
  "hf_private": true
3376
  },
3377
  {
3378
- "name": "openai-responses/gpt-5.3-chat",
3379
  "type": "vision",
3380
  "input_price_per_1m": 1.75,
3381
  "output_price_per_1m": 14,
@@ -3388,7 +3388,7 @@
3388
  "hf_private": true
3389
  },
3390
  {
3391
- "name": "openai-responses/gpt-5.2",
3392
  "type": "vision",
3393
  "input_price_per_1m": 1.75,
3394
  "output_price_per_1m": 14,
@@ -3401,7 +3401,7 @@
3401
  "hf_private": true
3402
  },
3403
  {
3404
- "name": "openai-responses/gpt-5.2-codex",
3405
  "type": "vision",
3406
  "input_price_per_1m": 1.75,
3407
  "output_price_per_1m": 14,
@@ -3410,11 +3410,11 @@
3410
  "vision",
3411
  "reasoning"
3412
  ],
3413
- "context_window": 400000,
3414
  "hf_private": true
3415
  },
3416
  {
3417
- "name": "openai-responses/gpt-5.3-codex",
3418
  "type": "vision",
3419
  "input_price_per_1m": 1.75,
3420
  "output_price_per_1m": 14,
@@ -3427,7 +3427,7 @@
3427
  "hf_private": true
3428
  },
3429
  {
3430
- "name": "azure/gpt-5.3-codex",
3431
  "type": "vision",
3432
  "input_price_per_1m": 1.75,
3433
  "output_price_per_1m": 14,
@@ -3436,23 +3436,11 @@
3436
  "vision",
3437
  "reasoning"
3438
  ],
3439
- "context_window": 400000,
3440
- "hf_private": true
3441
- },
3442
- {
3443
- "name": "azure/gpt-5.2",
3444
- "type": "chat",
3445
- "input_price_per_1m": 1.75,
3446
- "output_price_per_1m": 14,
3447
- "currency": "USD",
3448
- "capabilities": [
3449
- "reasoning"
3450
- ],
3451
- "context_window": 200000,
3452
  "hf_private": true
3453
  },
3454
  {
3455
- "name": "azure/openai-responses/gpt-5.2-codex",
3456
  "type": "vision",
3457
  "input_price_per_1m": 1.75,
3458
  "output_price_per_1m": 14,
@@ -3465,7 +3453,7 @@
3465
  "hf_private": true
3466
  },
3467
  {
3468
- "name": "openai/gpt-5.2",
3469
  "type": "vision",
3470
  "input_price_per_1m": 1.75,
3471
  "output_price_per_1m": 14,
@@ -3478,20 +3466,19 @@
3478
  "hf_private": true
3479
  },
3480
  {
3481
- "name": "openai/gpt-5.3-chat",
3482
- "type": "vision",
3483
  "input_price_per_1m": 1.75,
3484
  "output_price_per_1m": 14,
3485
  "currency": "USD",
3486
  "capabilities": [
3487
- "vision",
3488
  "reasoning"
3489
  ],
3490
- "context_window": 128000,
3491
  "hf_private": true
3492
  },
3493
  {
3494
- "name": "openai/gpt-5.2-chat",
3495
  "type": "vision",
3496
  "input_price_per_1m": 1.75,
3497
  "output_price_per_1m": 14,
@@ -3500,45 +3487,24 @@
3500
  "vision",
3501
  "reasoning"
3502
  ],
3503
- "context_window": 128000,
3504
- "hf_private": true
3505
- },
3506
- {
3507
- "name": "openai-responses/gpt-4.1",
3508
- "type": "vision",
3509
- "input_price_per_1m": 2,
3510
- "output_price_per_1m": 8,
3511
- "currency": "USD",
3512
- "capabilities": [
3513
- "vision"
3514
- ],
3515
- "context_window": 1047576,
3516
- "hf_private": true
3517
- },
3518
- {
3519
- "name": "xai/grok-2-1212",
3520
- "type": "chat",
3521
- "input_price_per_1m": 2,
3522
- "output_price_per_1m": 10,
3523
- "currency": "USD",
3524
- "context_window": 131072,
3525
  "hf_private": true
3526
  },
3527
  {
3528
- "name": "xai/grok-4.2-beta",
3529
  "type": "vision",
3530
- "input_price_per_1m": 2,
3531
- "output_price_per_1m": 6,
3532
  "currency": "USD",
3533
  "capabilities": [
3534
  "vision",
3535
  "reasoning"
3536
  ],
3537
- "context_window": 2000000,
3538
  "hf_private": true
3539
  },
3540
  {
3541
- "name": "google/gemini-3.1-pro-preview",
3542
  "type": "vision",
3543
  "input_price_per_1m": 2,
3544
  "output_price_per_1m": 12,
@@ -3551,7 +3517,7 @@
3551
  "hf_private": true
3552
  },
3553
  {
3554
- "name": "google/gemini-3-pro-preview",
3555
  "type": "vision",
3556
  "input_price_per_1m": 2,
3557
  "output_price_per_1m": 12,
@@ -3573,7 +3539,7 @@
3573
  "hf_private": true
3574
  },
3575
  {
3576
- "name": "vertex/gemini-3.1-pro-preview",
3577
  "type": "vision",
3578
  "input_price_per_1m": 2,
3579
  "output_price_per_1m": 12,
@@ -3586,7 +3552,7 @@
3586
  "hf_private": true
3587
  },
3588
  {
3589
- "name": "vertex/gemini-3-pro-preview",
3590
  "type": "vision",
3591
  "input_price_per_1m": 2,
3592
  "output_price_per_1m": 12,
@@ -3612,7 +3578,16 @@
3612
  "hf_private": true
3613
  },
3614
  {
3615
- "name": "azure/gpt-4.1",
 
 
 
 
 
 
 
 
 
3616
  "type": "vision",
3617
  "input_price_per_1m": 2,
3618
  "output_price_per_1m": 8,
@@ -3624,15 +3599,16 @@
3624
  "hf_private": true
3625
  },
3626
  {
3627
- "name": "azure/openai-responses/gpt-4.1",
3628
  "type": "vision",
3629
  "input_price_per_1m": 2,
3630
  "output_price_per_1m": 8,
3631
  "currency": "USD",
3632
  "capabilities": [
3633
- "vision"
 
3634
  ],
3635
- "context_window": 1047576,
3636
  "hf_private": true
3637
  },
3638
  {
@@ -3649,20 +3625,29 @@
3649
  "hf_private": true
3650
  },
3651
  {
3652
- "name": "openai/o4-mini-deep-research",
3653
  "type": "vision",
3654
  "input_price_per_1m": 2,
3655
- "output_price_per_1m": 8,
3656
  "currency": "USD",
3657
  "capabilities": [
3658
  "vision",
3659
  "reasoning"
3660
  ],
3661
- "context_window": 100000,
3662
  "hf_private": true
3663
  },
3664
  {
3665
- "name": "openai/gpt-4.1",
 
 
 
 
 
 
 
 
 
3666
  "type": "vision",
3667
  "input_price_per_1m": 2,
3668
  "output_price_per_1m": 8,
@@ -3674,29 +3659,31 @@
3674
  "hf_private": true
3675
  },
3676
  {
3677
- "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3678
- "type": "chat",
3679
  "input_price_per_1m": 2,
3680
- "output_price_per_1m": 6,
3681
  "currency": "USD",
3682
- "context_window": 128000,
 
 
 
3683
  "hf_private": true
3684
  },
3685
  {
3686
- "name": "openai-responses/gpt-5.4",
3687
  "type": "vision",
3688
- "input_price_per_1m": 2.5,
3689
- "output_price_per_1m": 15,
3690
  "currency": "USD",
3691
  "capabilities": [
3692
- "vision",
3693
- "reasoning"
3694
  ],
3695
- "context_window": 1050000,
3696
  "hf_private": true
3697
  },
3698
  {
3699
- "name": "azure/openai-responses/gpt-5.4",
3700
  "type": "vision",
3701
  "input_price_per_1m": 2.5,
3702
  "output_price_per_1m": 15,
@@ -3709,7 +3696,7 @@
3709
  "hf_private": true
3710
  },
3711
  {
3712
- "name": "openai/gpt-4o-2024-11-20",
3713
  "type": "vision",
3714
  "input_price_per_1m": 2.5,
3715
  "output_price_per_1m": 10,
@@ -3721,20 +3708,19 @@
3721
  "hf_private": true
3722
  },
3723
  {
3724
- "name": "openai/gpt-5.4",
3725
  "type": "vision",
3726
  "input_price_per_1m": 2.5,
3727
- "output_price_per_1m": 15,
3728
  "currency": "USD",
3729
  "capabilities": [
3730
- "vision",
3731
- "reasoning"
3732
  ],
3733
- "context_window": 1050000,
3734
  "hf_private": true
3735
  },
3736
  {
3737
- "name": "openai/gpt-4o-2024-05-13",
3738
  "type": "vision",
3739
  "input_price_per_1m": 2.5,
3740
  "output_price_per_1m": 10,
@@ -3746,7 +3732,7 @@
3746
  "hf_private": true
3747
  },
3748
  {
3749
- "name": "openai/gpt-4o",
3750
  "type": "vision",
3751
  "input_price_per_1m": 2.5,
3752
  "output_price_per_1m": 10,
@@ -3758,19 +3744,33 @@
3758
  "hf_private": true
3759
  },
3760
  {
3761
- "name": "openai/gpt-4o-2024-08-06",
 
 
 
 
 
 
 
 
 
 
 
 
 
3762
  "type": "vision",
3763
  "input_price_per_1m": 2.5,
3764
- "output_price_per_1m": 10,
3765
  "currency": "USD",
3766
  "capabilities": [
3767
- "vision"
 
3768
  ],
3769
- "context_window": 128000,
3770
  "hf_private": true
3771
  },
3772
  {
3773
- "name": "anthropic/claude-sonnet-4-5",
3774
  "type": "vision",
3775
  "input_price_per_1m": 3,
3776
  "output_price_per_1m": 15,
@@ -3779,11 +3779,11 @@
3779
  "vision",
3780
  "reasoning"
3781
  ],
3782
- "context_window": 1000000,
3783
  "hf_private": true
3784
  },
3785
  {
3786
- "name": "anthropic/claude-sonnet-4-6",
3787
  "type": "vision",
3788
  "input_price_per_1m": 3,
3789
  "output_price_per_1m": 15,
@@ -3792,11 +3792,11 @@
3792
  "vision",
3793
  "reasoning"
3794
  ],
3795
- "context_window": 1000000,
3796
  "hf_private": true
3797
  },
3798
  {
3799
- "name": "anthropic/claude-sonnet-4",
3800
  "type": "vision",
3801
  "input_price_per_1m": 3,
3802
  "output_price_per_1m": 15,
@@ -3809,19 +3809,20 @@
3809
  "hf_private": true
3810
  },
3811
  {
3812
- "name": "xai/grok-4",
3813
  "type": "vision",
3814
  "input_price_per_1m": 3,
3815
  "output_price_per_1m": 15,
3816
  "currency": "USD",
3817
  "capabilities": [
3818
- "vision"
 
3819
  ],
3820
- "context_window": 256000,
3821
  "hf_private": true
3822
  },
3823
  {
3824
- "name": "bedrock/claude-3-7-sonnet",
3825
  "type": "vision",
3826
  "input_price_per_1m": 3,
3827
  "output_price_per_1m": 15,
@@ -3834,7 +3835,7 @@
3834
  "hf_private": true
3835
  },
3836
  {
3837
- "name": "bedrock/claude-sonnet-4",
3838
  "type": "vision",
3839
  "input_price_per_1m": 3,
3840
  "output_price_per_1m": 15,
@@ -3847,20 +3848,19 @@
3847
  "hf_private": true
3848
  },
3849
  {
3850
- "name": "bedrock/claude-sonnet-4-5",
3851
  "type": "vision",
3852
  "input_price_per_1m": 3,
3853
  "output_price_per_1m": 15,
3854
  "currency": "USD",
3855
  "capabilities": [
3856
- "vision",
3857
- "reasoning"
3858
  ],
3859
  "context_window": 200000,
3860
  "hf_private": true
3861
  },
3862
  {
3863
- "name": "bedrock/claude-sonnet-4-6",
3864
  "type": "vision",
3865
  "input_price_per_1m": 3,
3866
  "output_price_per_1m": 15,
@@ -3869,37 +3869,39 @@
3869
  "vision",
3870
  "reasoning"
3871
  ],
3872
- "context_window": 1000000,
3873
  "hf_private": true
3874
  },
3875
  {
3876
- "name": "coding/claude-sonnet-4-20250514",
3877
- "type": "vision",
3878
  "input_price_per_1m": 3,
3879
- "output_price_per_1m": 15,
3880
  "currency": "USD",
 
3881
  "capabilities": [
3882
- "vision",
3883
  "reasoning"
3884
  ],
3885
- "context_window": 200000,
3886
- "hf_private": true
 
 
3887
  },
3888
  {
3889
- "name": "vertex/claude-sonnet-4",
3890
- "type": "vision",
3891
  "input_price_per_1m": 3,
3892
  "output_price_per_1m": 15,
3893
  "currency": "USD",
 
3894
  "capabilities": [
3895
- "vision",
3896
- "reasoning"
3897
  ],
3898
- "context_window": 200000,
3899
  "hf_private": true
3900
  },
3901
  {
3902
- "name": "vertex/claude-3-7-sonnet",
3903
  "type": "vision",
3904
  "input_price_per_1m": 3,
3905
  "output_price_per_1m": 15,
@@ -3908,23 +3910,24 @@
3908
  "vision",
3909
  "reasoning"
3910
  ],
3911
- "context_window": 200000,
3912
  "hf_private": true
3913
  },
3914
  {
3915
- "name": "vertex/claude-3-5-sonnet",
3916
  "type": "vision",
3917
  "input_price_per_1m": 3,
3918
  "output_price_per_1m": 15,
3919
  "currency": "USD",
3920
  "capabilities": [
3921
- "vision"
 
3922
  ],
3923
- "context_window": 200000,
3924
  "hf_private": true
3925
  },
3926
  {
3927
- "name": "vertex/claude-sonnet-4-5",
3928
  "type": "vision",
3929
  "input_price_per_1m": 3,
3930
  "output_price_per_1m": 15,
@@ -3933,35 +3936,32 @@
3933
  "vision",
3934
  "reasoning"
3935
  ],
3936
- "context_window": 200000,
3937
  "hf_private": true
3938
  },
3939
  {
3940
- "name": "together/deepseek-ai/DeepSeek-R1",
3941
- "type": "chat",
3942
  "input_price_per_1m": 3,
3943
- "output_price_per_1m": 7,
3944
  "currency": "USD",
3945
- "context_window": 64000,
3946
  "capabilities": [
3947
- "tools",
3948
- "reasoning"
3949
  ],
3950
- "hf_id": "deepseek-ai/DeepSeek-R1",
3951
- "size_b": 671,
3952
- "size_source": "manual",
3953
- "hf_private": false
3954
  },
3955
  {
3956
- "name": "perplexity/sonar-pro",
3957
- "type": "chat",
3958
  "input_price_per_1m": 3,
3959
  "output_price_per_1m": 15,
3960
  "currency": "USD",
3961
- "context_window": 204800,
3962
  "capabilities": [
3963
- "vision"
 
3964
  ],
 
3965
  "hf_private": true
3966
  },
3967
  {
@@ -3981,7 +3981,7 @@
3981
  "hf_private": false
3982
  },
3983
  {
3984
- "name": "anthropic/claude-opus-4-6",
3985
  "type": "vision",
3986
  "input_price_per_1m": 5,
3987
  "output_price_per_1m": 25,
@@ -3990,11 +3990,11 @@
3990
  "vision",
3991
  "reasoning"
3992
  ],
3993
- "context_window": 1000000,
3994
  "hf_private": true
3995
  },
3996
  {
3997
- "name": "anthropic/claude-opus-4-5",
3998
  "type": "vision",
3999
  "input_price_per_1m": 5,
4000
  "output_price_per_1m": 25,
@@ -4003,23 +4003,24 @@
4003
  "vision",
4004
  "reasoning"
4005
  ],
4006
- "context_window": 200000,
4007
  "hf_private": true
4008
  },
4009
  {
4010
- "name": "xai/grok-3",
4011
- "type": "chat",
4012
  "input_price_per_1m": 5,
4013
  "output_price_per_1m": 25,
4014
  "currency": "USD",
4015
- "context_window": 131072,
4016
  "capabilities": [
4017
- "tools"
 
4018
  ],
 
4019
  "hf_private": true
4020
  },
4021
  {
4022
- "name": "bedrock/claude-opus-4-5",
4023
  "type": "vision",
4024
  "input_price_per_1m": 5,
4025
  "output_price_per_1m": 25,
@@ -4032,20 +4033,19 @@
4032
  "hf_private": true
4033
  },
4034
  {
4035
- "name": "bedrock/claude-opus-4-6",
4036
  "type": "vision",
4037
  "input_price_per_1m": 5,
4038
- "output_price_per_1m": 25,
4039
  "currency": "USD",
4040
  "capabilities": [
4041
- "vision",
4042
- "reasoning"
4043
  ],
4044
- "context_window": 1000000,
4045
  "hf_private": true
4046
  },
4047
  {
4048
- "name": "vertex/claude-opus-4-5",
4049
  "type": "vision",
4050
  "input_price_per_1m": 5,
4051
  "output_price_per_1m": 25,
@@ -4054,11 +4054,11 @@
4054
  "vision",
4055
  "reasoning"
4056
  ],
4057
- "context_window": 200000,
4058
  "hf_private": true
4059
  },
4060
  {
4061
- "name": "vertex/claude-opus-4-6",
4062
  "type": "vision",
4063
  "input_price_per_1m": 5,
4064
  "output_price_per_1m": 25,
@@ -4067,19 +4067,19 @@
4067
  "vision",
4068
  "reasoning"
4069
  ],
4070
- "context_window": 1000000,
4071
  "hf_private": true
4072
  },
4073
  {
4074
- "name": "openai/chatgpt-4o",
4075
- "type": "vision",
4076
  "input_price_per_1m": 5,
4077
- "output_price_per_1m": 15,
4078
  "currency": "USD",
 
4079
  "capabilities": [
4080
- "vision"
4081
  ],
4082
- "context_window": 128000,
4083
  "hf_private": true
4084
  },
4085
  {
@@ -4096,7 +4096,7 @@
4096
  "hf_private": true
4097
  },
4098
  {
4099
- "name": "anthropic/claude-opus-4-1",
4100
  "type": "vision",
4101
  "input_price_per_1m": 15,
4102
  "output_price_per_1m": 75,
@@ -4109,7 +4109,7 @@
4109
  "hf_private": true
4110
  },
4111
  {
4112
- "name": "anthropic/claude-opus-4",
4113
  "type": "vision",
4114
  "input_price_per_1m": 15,
4115
  "output_price_per_1m": 75,
@@ -4122,23 +4122,23 @@
4122
  "hf_private": true
4123
  },
4124
  {
4125
- "name": "openai-responses/gpt-5-pro",
4126
  "type": "vision",
4127
  "input_price_per_1m": 15,
4128
- "output_price_per_1m": 120,
4129
  "currency": "USD",
4130
  "capabilities": [
4131
  "vision",
4132
  "reasoning"
4133
  ],
4134
- "context_window": 400000,
4135
  "hf_private": true
4136
  },
4137
  {
4138
- "name": "bedrock/claude-opus-4",
4139
  "type": "vision",
4140
  "input_price_per_1m": 15,
4141
- "output_price_per_1m": 75,
4142
  "currency": "USD",
4143
  "capabilities": [
4144
  "vision",
@@ -4148,7 +4148,7 @@
4148
  "hf_private": true
4149
  },
4150
  {
4151
- "name": "coding/claude-opus-4-20250514",
4152
  "type": "vision",
4153
  "input_price_per_1m": 15,
4154
  "output_price_per_1m": 75,
@@ -4161,7 +4161,7 @@
4161
  "hf_private": true
4162
  },
4163
  {
4164
- "name": "vertex/claude-opus-4",
4165
  "type": "vision",
4166
  "input_price_per_1m": 15,
4167
  "output_price_per_1m": 75,
@@ -4174,23 +4174,23 @@
4174
  "hf_private": true
4175
  },
4176
  {
4177
- "name": "vertex/claude-opus-4-1",
4178
  "type": "vision",
4179
  "input_price_per_1m": 15,
4180
- "output_price_per_1m": 75,
4181
  "currency": "USD",
4182
  "capabilities": [
4183
  "vision",
4184
  "reasoning"
4185
  ],
4186
- "context_window": 200000,
4187
  "hf_private": true
4188
  },
4189
  {
4190
- "name": "openai/o1",
4191
  "type": "vision",
4192
  "input_price_per_1m": 15,
4193
- "output_price_per_1m": 60,
4194
  "currency": "USD",
4195
  "capabilities": [
4196
  "vision",
@@ -4213,7 +4213,7 @@
4213
  "hf_private": true
4214
  },
4215
  {
4216
- "name": "openai-responses/gpt-5.4-pro",
4217
  "type": "vision",
4218
  "input_price_per_1m": 30,
4219
  "output_price_per_1m": 180,
@@ -4226,7 +4226,7 @@
4226
  "hf_private": true
4227
  },
4228
  {
4229
- "name": "azure/openai-responses/gpt-5.4-pro",
4230
  "type": "vision",
4231
  "input_price_per_1m": 30,
4232
  "output_price_per_1m": 180,
@@ -4239,7 +4239,7 @@
4239
  "hf_private": true
4240
  },
4241
  {
4242
- "name": "openai/gpt-5.4-pro",
4243
  "type": "vision",
4244
  "input_price_per_1m": 30,
4245
  "output_price_per_1m": 180,
@@ -4987,12 +4987,12 @@
4987
  {
4988
  "name": "whisper-large-v3",
4989
  "type": "audio",
4990
- "input_price_per_1m": 0.003,
4991
- "output_price_per_1m": 0,
4992
  "currency": "EUR",
4993
  "hf_id": "openai/whisper-large-v3",
4994
- "size_b": 0.7,
4995
- "hf_private": false
 
 
4996
  },
4997
  {
4998
  "name": "holo2-30b-a3b",
@@ -5068,8 +5068,6 @@
5068
  {
5069
  "name": "voxtral-small-24b-2507",
5070
  "type": "audio",
5071
- "input_price_per_1m": 0.15,
5072
- "output_price_per_1m": 0.35,
5073
  "currency": "EUR",
5074
  "size_b": 24,
5075
  "capabilities": [
@@ -5077,7 +5075,8 @@
5077
  "tools"
5078
  ],
5079
  "hf_id": "mistralai/Voxtral-Small-24B-2507",
5080
- "hf_private": false
 
5081
  },
5082
  {
5083
  "name": "gemma-3-27b-it",
@@ -5310,25 +5309,23 @@
5310
  },
5311
  {
5312
  "name": "Voxtral Mini Transcribe 2",
5313
- "type": "chat",
5314
- "input_price_per_1m": 0.003,
5315
- "output_price_per_1m": 0,
5316
  "currency": "USD",
5317
  "api_endpoint": "voxtral-mini-latest",
5318
- "hf_private": true
 
5319
  },
5320
  {
5321
  "name": "Voxtral Realtime",
5322
- "type": "chat",
5323
- "input_price_per_1m": 0.006,
5324
- "output_price_per_1m": 0,
5325
  "currency": "USD",
5326
  "api_endpoint": "voxtral-mini-latest",
5327
- "hf_private": true
 
5328
  },
5329
  {
5330
  "name": "Voxtral Small",
5331
- "type": "chat",
5332
  "input_price_per_1m": 0.004,
5333
  "output_price_per_1m": 0.3,
5334
  "currency": "USD",
@@ -5343,7 +5340,7 @@
5343
  },
5344
  {
5345
  "name": "Voxtral Mini",
5346
- "type": "chat",
5347
  "input_price_per_1m": 0.001,
5348
  "output_price_per_1m": 0.04,
5349
  "currency": "USD",
@@ -6053,7 +6050,8 @@
6053
  "tools",
6054
  "eu-endpoint"
6055
  ],
6056
- "hf_private": true
 
6057
  },
6058
  {
6059
  "name": "qwen/qwen3-vl-8b-instruct",
@@ -6298,7 +6296,8 @@
6298
  "tools"
6299
  ],
6300
  "size_b": 24,
6301
- "hf_private": false
 
6302
  },
6303
  {
6304
  "name": "nvidia/llama-3.3-nemotron-super-49b-v1.5",
@@ -6329,7 +6328,8 @@
6329
  "reasoning",
6330
  "eu-endpoint"
6331
  ],
6332
- "hf_private": true
 
6333
  },
6334
  {
6335
  "name": "z-ai/glm-4-32b",
@@ -6371,7 +6371,8 @@
6371
  "reasoning",
6372
  "eu-endpoint"
6373
  ],
6374
- "hf_private": true
 
6375
  },
6376
  {
6377
  "name": "mistralai/devstral-small",
@@ -6414,7 +6415,8 @@
6414
  "tools",
6415
  "eu-endpoint"
6416
  ],
6417
- "hf_private": true
 
6418
  },
6419
  {
6420
  "name": "meta-llama/llama-3.3-70b-instruct",
@@ -7198,7 +7200,8 @@
7198
  "reasoning",
7199
  "eu-endpoint"
7200
  ],
7201
- "hf_private": true
 
7202
  },
7203
  {
7204
  "name": "bytedance-seed/seed-1.6",
@@ -7532,7 +7535,8 @@
7532
  "image-gen",
7533
  "eu-endpoint"
7534
  ],
7535
- "hf_private": true
 
7536
  },
7537
  {
7538
  "name": "thedrummer/cydonia-24b-v4.1",
@@ -7570,7 +7574,8 @@
7570
  "reasoning",
7571
  "eu-endpoint"
7572
  ],
7573
- "hf_private": true
 
7574
  },
7575
  {
7576
  "name": "x-ai/grok-3-mini",
@@ -7920,7 +7925,8 @@
7920
  "reasoning",
7921
  "eu-endpoint"
7922
  ],
7923
- "hf_private": true
 
7924
  },
7925
  {
7926
  "name": "mistralai/mistral-large-2512",
@@ -8032,7 +8038,8 @@
8032
  "audio",
8033
  "audio-out"
8034
  ],
8035
- "hf_private": true
 
8036
  },
8037
  {
8038
  "name": "z-ai/glm-4.5v",
@@ -8674,7 +8681,8 @@
8674
  "reasoning",
8675
  "eu-endpoint"
8676
  ],
8677
- "hf_private": true
 
8678
  },
8679
  {
8680
  "name": "google/gemini-2.5-pro-preview",
@@ -8690,7 +8698,8 @@
8690
  "reasoning",
8691
  "eu-endpoint"
8692
  ],
8693
- "hf_private": true
 
8694
  },
8695
  {
8696
  "name": "google/gemini-2.5-pro-preview-05-06",
@@ -8707,7 +8716,8 @@
8707
  "reasoning",
8708
  "eu-endpoint"
8709
  ],
8710
- "hf_private": true
 
8711
  },
8712
  {
8713
  "name": "sao10k/l3-euryale-70b",
@@ -8841,7 +8851,8 @@
8841
  "tools",
8842
  "reasoning"
8843
  ],
8844
- "hf_private": true
 
8845
  },
8846
  {
8847
  "name": "google/gemini-3.1-pro-preview",
@@ -8858,7 +8869,8 @@
8858
  "reasoning",
8859
  "eu-endpoint"
8860
  ],
8861
- "hf_private": true
 
8862
  },
8863
  {
8864
  "name": "google/gemini-3-pro-image-preview",
@@ -8872,7 +8884,8 @@
8872
  "reasoning",
8873
  "eu-endpoint"
8874
  ],
8875
- "hf_private": true
 
8876
  },
8877
  {
8878
  "name": "google/gemini-3-pro-preview",
@@ -8889,7 +8902,8 @@
8889
  "reasoning",
8890
  "eu-endpoint"
8891
  ],
8892
- "hf_private": true
 
8893
  },
8894
  {
8895
  "name": "openai/o4-mini-deep-research",
@@ -9054,7 +9068,8 @@
9054
  "audio",
9055
  "audio-out"
9056
  ],
9057
- "hf_private": true
 
9058
  },
9059
  {
9060
  "name": "amazon/nova-premier-v1",
@@ -9095,7 +9110,8 @@
9095
  "audio-out",
9096
  "tools"
9097
  ],
9098
- "hf_private": true
 
9099
  },
9100
  {
9101
  "name": "cohere/command-a",
@@ -10076,22 +10092,22 @@
10076
  {
10077
  "name": "Whisper V3 Large",
10078
  "type": "audio",
10079
- "input_price_per_1m": 0.111,
10080
- "output_price_per_1m": 0,
10081
  "currency": "USD",
10082
  "hf_id": "openai/whisper-large-v3",
10083
- "size_b": 0.7,
10084
- "hf_private": false
 
 
10085
  },
10086
  {
10087
  "name": "Whisper Large v3 Turbo",
10088
  "type": "audio",
10089
- "input_price_per_1m": 0.04,
10090
- "output_price_per_1m": 0,
10091
  "currency": "USD",
10092
  "hf_id": "openai/whisper-large-v3-turbo",
10093
- "size_b": 0.7,
10094
- "hf_private": false
 
 
10095
  }
10096
  ]
10097
  },
@@ -10111,8 +10127,6 @@
10111
  "image-gen"
10112
  ],
10113
  "price_per_image": 0.014,
10114
- "input_price_per_1m": 0,
10115
- "output_price_per_1m": 0,
10116
  "currency": "USD",
10117
  "category": "FLUX.2",
10118
  "size_b": 4,
@@ -10128,8 +10142,6 @@
10128
  "image-gen"
10129
  ],
10130
  "price_per_image": 0.015,
10131
- "input_price_per_1m": 0,
10132
- "output_price_per_1m": 0,
10133
  "currency": "USD",
10134
  "category": "FLUX.2",
10135
  "size_b": 9,
@@ -10145,8 +10157,6 @@
10145
  "image-gen"
10146
  ],
10147
  "price_per_image": 0.025,
10148
- "input_price_per_1m": 0,
10149
- "output_price_per_1m": 0,
10150
  "currency": "USD",
10151
  "category": "FLUX.1",
10152
  "size_b": 12,
@@ -10162,8 +10172,6 @@
10162
  "image-gen"
10163
  ],
10164
  "price_per_image": 0.03,
10165
- "input_price_per_1m": 0,
10166
- "output_price_per_1m": 0,
10167
  "currency": "USD",
10168
  "category": "FLUX.2",
10169
  "size_b": 32,
@@ -10179,8 +10187,6 @@
10179
  "image-gen"
10180
  ],
10181
  "price_per_image": 0.04,
10182
- "input_price_per_1m": 0,
10183
- "output_price_per_1m": 0,
10184
  "currency": "USD",
10185
  "category": "FLUX.1",
10186
  "hf_id": "black-forest-labs/FLUX.1-pro",
@@ -10196,8 +10202,6 @@
10196
  "image-gen"
10197
  ],
10198
  "price_per_image": 0.04,
10199
- "input_price_per_1m": 0,
10200
- "output_price_per_1m": 0,
10201
  "currency": "USD",
10202
  "category": "FLUX.1",
10203
  "hf_id": "black-forest-labs/FLUX.1-pro",
@@ -10213,8 +10217,6 @@
10213
  "image-gen"
10214
  ],
10215
  "price_per_image": 0.05,
10216
- "input_price_per_1m": 0,
10217
- "output_price_per_1m": 0,
10218
  "currency": "USD",
10219
  "category": "FLUX.2",
10220
  "size_b": 32,
@@ -10230,8 +10232,6 @@
10230
  "image-gen"
10231
  ],
10232
  "price_per_image": 0.05,
10233
- "input_price_per_1m": 0,
10234
- "output_price_per_1m": 0,
10235
  "currency": "USD",
10236
  "category": "FLUX.1",
10237
  "hf_id": "black-forest-labs/FLUX.1-pro",
@@ -10247,8 +10247,6 @@
10247
  "image-gen"
10248
  ],
10249
  "price_per_image": 0.05,
10250
- "input_price_per_1m": 0,
10251
- "output_price_per_1m": 0,
10252
  "currency": "USD",
10253
  "category": "FLUX.1 Tools",
10254
  "hf_id": "black-forest-labs/FLUX.1-pro",
@@ -10264,8 +10262,6 @@
10264
  "image-gen"
10265
  ],
10266
  "price_per_image": 0.06,
10267
- "input_price_per_1m": 0,
10268
- "output_price_per_1m": 0,
10269
  "currency": "USD",
10270
  "category": "FLUX.1",
10271
  "hf_id": "black-forest-labs/FLUX.1-pro",
@@ -10281,8 +10277,6 @@
10281
  "image-gen"
10282
  ],
10283
  "price_per_image": 0.07,
10284
- "input_price_per_1m": 0,
10285
- "output_price_per_1m": 0,
10286
  "currency": "USD",
10287
  "category": "FLUX.2",
10288
  "size_b": 32,
@@ -10298,8 +10292,6 @@
10298
  "image-gen"
10299
  ],
10300
  "price_per_image": 0.08,
10301
- "input_price_per_1m": 0,
10302
- "output_price_per_1m": 0,
10303
  "currency": "USD",
10304
  "category": "FLUX.1",
10305
  "hf_id": "black-forest-labs/FLUX.1-pro",
 
302
  {
303
  "name": "Whisper V3",
304
  "type": "audio",
 
 
305
  "currency": "CHF",
306
  "hf_id": "openai/whisper-large-v3",
307
+ "size_b": 1.55,
308
+ "hf_private": false,
309
+ "price_per_minute": 0.006,
310
+ "size_source": "manual"
311
  },
312
  {
313
  "name": "Photomaker V2",
 
1163
  "hf_private": true
1164
  },
1165
  {
1166
+ "name": "novita/Sao10K/L3-8B-Stheno-v3.2",
1167
+ "type": "chat",
1168
  "input_price_per_1m": 0.05,
1169
+ "output_price_per_1m": 0.05,
1170
  "currency": "USD",
1171
+ "context_window": 8192,
1172
+ "size_b": 8,
1173
+ "hf_private": false
 
 
 
1174
  },
1175
  {
1176
+ "name": "novita/sao10k/l3-8b-lunaris",
1177
  "type": "chat",
1178
  "input_price_per_1m": 0.05,
1179
  "output_price_per_1m": 0.05,
 
1197
  "hf_private": false
1198
  },
1199
  {
1200
+ "name": "openai-responses/gpt-5-nano",
1201
+ "type": "vision",
1202
  "input_price_per_1m": 0.05,
1203
+ "output_price_per_1m": 0.4,
1204
  "currency": "USD",
1205
+ "capabilities": [
1206
+ "vision",
1207
+ "reasoning"
1208
+ ],
1209
+ "context_window": 400000,
1210
+ "hf_private": true
1211
  },
1212
  {
1213
  "name": "azure/gpt-5-nano",
 
1264
  "hf_id": "Gryphe/MythoMax-L2-13b",
1265
  "hf_private": false
1266
  },
 
 
 
 
 
 
 
 
 
 
 
 
1267
  {
1268
  "name": "google/gemini-2.0-flash-001",
1269
  "type": "vision",
 
1326
  "size_b": 24,
1327
  "hf_private": false
1328
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1329
  {
1330
  "name": "vertex/gemini-2.5-flash-lite",
1331
  "type": "vision",
 
1340
  "hf_private": true
1341
  },
1342
  {
1343
+ "name": "openai/gpt-4.1-nano",
 
 
 
 
 
 
 
 
 
 
 
 
1344
  "type": "vision",
1345
  "input_price_per_1m": 0.1,
1346
  "output_price_per_1m": 0.4,
 
1361
  "size_b": 8,
1362
  "hf_private": false
1363
  },
1364
+ {
1365
+ "name": "deepinfra/Qwen/Qwen3-32B",
1366
+ "type": "chat",
1367
+ "input_price_per_1m": 0.1,
1368
+ "output_price_per_1m": 0.3,
1369
+ "currency": "USD",
1370
+ "context_window": 40000,
1371
+ "size_b": 32,
1372
+ "capabilities": [
1373
+ "tools",
1374
+ "reasoning"
1375
+ ],
1376
+ "hf_id": "Qwen/Qwen3-32B",
1377
+ "hf_private": false
1378
+ },
1379
  {
1380
  "name": "groq/openai/gpt-oss-20b",
1381
  "type": "chat",
 
1392
  "hf_private": false
1393
  },
1394
  {
1395
+ "name": "openai-responses/gpt-4.1-nano",
1396
+ "type": "vision",
1397
+ "input_price_per_1m": 0.1,
1398
+ "output_price_per_1m": 0.4,
1399
+ "currency": "USD",
1400
+ "capabilities": [
1401
+ "vision"
1402
+ ],
1403
+ "context_window": 1047576,
1404
+ "hf_private": true
1405
+ },
1406
+ {
1407
+ "name": "azure/openai-responses/gpt-4.1-nano",
1408
+ "type": "vision",
1409
+ "input_price_per_1m": 0.1,
1410
+ "output_price_per_1m": 0.4,
1411
+ "currency": "USD",
1412
+ "capabilities": [
1413
+ "vision"
1414
+ ],
1415
+ "context_window": 1047576,
1416
+ "hf_private": true
1417
+ },
1418
+ {
1419
+ "name": "azure/gpt-4.1-nano",
1420
  "type": "vision",
1421
  "input_price_per_1m": 0.1,
1422
  "output_price_per_1m": 0.4,
 
1479
  "hf_id": "NousResearch/Hermes-2-Pro-Llama-3-8B",
1480
  "hf_private": false
1481
  },
1482
+ {
1483
+ "name": "mistral/mistral-small-latest",
1484
+ "type": "vision",
1485
+ "input_price_per_1m": 0.15,
1486
+ "output_price_per_1m": 0.6,
1487
+ "currency": "USD",
1488
+ "capabilities": [
1489
+ "vision",
1490
+ "reasoning"
1491
+ ],
1492
+ "context_window": 256000,
1493
+ "hf_private": true
1494
+ },
1495
  {
1496
  "name": "mistral/mistral-small-2603",
1497
  "type": "vision",
 
1508
  "hf_private": false
1509
  },
1510
  {
1511
+ "name": "nebius/openai/gpt-oss-120b",
1512
+ "type": "chat",
1513
  "input_price_per_1m": 0.15,
1514
  "output_price_per_1m": 0.6,
1515
  "currency": "USD",
1516
  "capabilities": [
 
1517
  "reasoning"
1518
  ],
1519
+ "context_window": 131000,
1520
+ "size_b": 120,
1521
+ "hf_id": "openai/gpt-oss-120b",
1522
+ "hf_private": false
1523
  },
1524
  {
1525
  "name": "novita/deepseek/deepseek-r1-distill-qwen-14b",
 
1537
  "size_source": "manual",
1538
  "hf_private": false
1539
  },
1540
+ {
1541
+ "name": "openai/gpt-4o-mini",
1542
+ "type": "vision",
1543
+ "input_price_per_1m": 0.15,
1544
+ "output_price_per_1m": 0.6,
1545
+ "currency": "USD",
1546
+ "capabilities": [
1547
+ "vision"
1548
+ ],
1549
+ "context_window": 128000,
1550
+ "hf_private": true
1551
+ },
1552
  {
1553
  "name": "parasail/parasail-qwen3-235b-a22b-instruct-2507",
1554
  "type": "chat",
 
1574
  "hf_id": "openai/gpt-oss-120b",
1575
  "hf_private": false
1576
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1577
  {
1578
  "name": "novita/mistralai/mistral-nemo",
1579
  "type": "chat",
 
1613
  "hf_private": false
1614
  },
1615
  {
1616
+ "name": "novita/qwen/qwen3-235b-a22b-fp8",
1617
+ "type": "chat",
1618
+ "input_price_per_1m": 0.2,
1619
+ "output_price_per_1m": 0.8,
1620
+ "currency": "USD",
1621
+ "context_window": 128000,
1622
+ "size_b": 235,
1623
+ "capabilities": [
1624
+ "tools",
1625
+ "reasoning"
1626
+ ],
1627
+ "hf_id": "Qwen/Qwen3-235B-A22B",
1628
+ "hf_private": false
1629
+ },
1630
+ {
1631
+ "name": "novita/meta-llama/llama-4-maverick-17b-128e-instruct-fp8",
1632
+ "type": "chat",
1633
+ "input_price_per_1m": 0.2,
1634
+ "output_price_per_1m": 0.85,
1635
+ "currency": "USD",
1636
+ "context_window": 1048576,
1637
+ "size_b": 17,
1638
+ "capabilities": [
1639
+ "vision",
1640
+ "tools"
1641
+ ],
1642
+ "hf_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
1643
+ "hf_private": false
1644
+ },
1645
+ {
1646
+ "name": "openai/gpt-5.4-nano",
1647
  "type": "vision",
1648
  "input_price_per_1m": 0.2,
1649
  "output_price_per_1m": 1.25,
 
1655
  "context_window": 400000,
1656
  "hf_private": true
1657
  },
1658
+ {
1659
+ "name": "together/meta-llama/LlamaGuard-2-8b",
1660
+ "type": "chat",
1661
+ "input_price_per_1m": 0.2,
1662
+ "output_price_per_1m": 0.2,
1663
+ "currency": "USD",
1664
+ "context_window": 8192,
1665
+ "size_b": 8,
1666
+ "hf_private": false
1667
+ },
1668
  {
1669
  "name": "xai/grok-4-fast",
1670
  "type": "chat",
 
1691
  "context_window": 2000000,
1692
  "hf_private": true
1693
  },
1694
+ {
1695
+ "name": "xai/grok-4-1-fast-non-reasoning",
1696
+ "type": "vision",
1697
+ "input_price_per_1m": 0.2,
1698
+ "output_price_per_1m": 0.5,
1699
+ "currency": "USD",
1700
+ "capabilities": [
1701
+ "vision"
1702
+ ],
1703
+ "context_window": 2000000,
1704
+ "hf_private": true
1705
+ },
1706
  {
1707
  "name": "xai/grok-code-fast-1",
1708
  "type": "vision",
 
1730
  "hf_private": true
1731
  },
1732
  {
1733
+ "name": "deepinfra/Qwen/Qwen3-235B-A22B",
 
 
 
 
 
 
 
 
 
 
 
 
1734
  "type": "chat",
1735
  "input_price_per_1m": 0.2,
1736
+ "output_price_per_1m": 0.6,
1737
  "currency": "USD",
1738
+ "context_window": 40000,
1739
  "size_b": 235,
1740
  "capabilities": [
1741
  "tools",
 
1745
  "hf_private": false
1746
  },
1747
  {
1748
+ "name": "deepinfra/zai-org/GLM-4.5-Air",
1749
  "type": "chat",
1750
  "input_price_per_1m": 0.2,
1751
+ "output_price_per_1m": 1.1,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1752
  "currency": "USD",
1753
  "context_window": 131072,
1754
  "capabilities": [
 
1760
  "hf_private": false
1761
  },
1762
  {
1763
+ "name": "openai-responses/gpt-5.4-nano",
 
 
 
 
 
 
 
 
 
 
1764
  "type": "vision",
1765
  "input_price_per_1m": 0.2,
1766
  "output_price_per_1m": 1.25,
 
1773
  "hf_private": true
1774
  },
1775
  {
1776
+ "name": "deepinfra/Qwen/Qwen2.5-72B-Instruct",
1777
  "type": "chat",
1778
  "input_price_per_1m": 0.23,
1779
+ "output_price_per_1m": 0.4,
1780
  "currency": "USD",
1781
+ "context_window": 131072,
1782
+ "size_b": 72,
1783
  "capabilities": [
1784
+ "vision"
1785
  ],
1786
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
 
 
 
 
 
 
 
 
 
 
1787
  "hf_private": false
1788
  },
1789
  {
 
1801
  "hf_private": false
1802
  },
1803
  {
1804
+ "name": "deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1805
  "type": "chat",
1806
  "input_price_per_1m": 0.23,
1807
+ "output_price_per_1m": 0.69,
1808
  "currency": "USD",
1809
+ "context_window": 64000,
1810
+ "size_b": 70,
1811
  "capabilities": [
1812
+ "reasoning"
1813
  ],
1814
+ "hf_id": "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
1815
  "hf_private": false
1816
  },
1817
  {
1818
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct",
1819
+ "type": "chat",
1820
+ "input_price_per_1m": 0.23,
1821
+ "output_price_per_1m": 0.4,
1822
  "currency": "USD",
1823
+ "context_window": 130815,
1824
+ "size_b": 70,
1825
+ "hf_private": false
 
 
 
1826
  },
1827
  {
1828
  "name": "google/gemini-3.1-flash-lite-preview",
 
1858
  "context_window": 1048576,
1859
  "hf_private": true
1860
  },
1861
+ {
1862
+ "name": "openai-responses/gpt-5-mini",
1863
+ "type": "vision",
1864
+ "input_price_per_1m": 0.25,
1865
+ "output_price_per_1m": 2,
1866
+ "currency": "USD",
1867
+ "capabilities": [
1868
+ "vision",
1869
+ "reasoning"
1870
+ ],
1871
+ "context_window": 400000,
1872
+ "hf_private": true
1873
+ },
1874
  {
1875
  "name": "azure/gpt-5-mini",
1876
  "type": "chat",
 
1934
  "hf_private": true
1935
  },
1936
  {
1937
+ "name": "google/gemini-2.5-flash",
1938
+ "type": "vision",
1939
  "input_price_per_1m": 0.3,
1940
+ "output_price_per_1m": 2.5,
1941
  "currency": "USD",
1942
  "capabilities": [
1943
+ "vision",
1944
  "reasoning"
1945
  ],
1946
+ "context_window": 1048576,
1947
+ "hf_private": true
1948
+ },
1949
+ {
1950
+ "name": "mistral/codestral-latest",
1951
+ "type": "chat",
1952
+ "input_price_per_1m": 0.3,
1953
+ "output_price_per_1m": 0.9,
1954
+ "currency": "USD",
1955
  "context_window": 131072,
1956
  "hf_private": true
1957
  },
1958
  {
1959
+ "name": "vertex/gemini-2.5-flash",
1960
  "type": "vision",
1961
  "input_price_per_1m": 0.3,
1962
  "output_price_per_1m": 2.5,
 
1969
  "hf_private": true
1970
  },
1971
  {
1972
+ "name": "vertex/gemini-2.5-flash-image",
1973
+ "type": "vision",
1974
  "input_price_per_1m": 0.3,
1975
+ "output_price_per_1m": 2.5,
1976
  "currency": "USD",
1977
+ "capabilities": [
1978
+ "vision",
1979
+ "reasoning"
1980
+ ],
1981
+ "context_window": 1048576,
1982
  "hf_private": true
1983
  },
1984
  {
1985
+ "name": "nebius/deepseek-ai/DeepSeek-V3.2",
1986
+ "type": "chat",
1987
+ "input_price_per_1m": 0.3,
1988
+ "output_price_per_1m": 0.45,
1989
+ "currency": "USD",
1990
+ "capabilities": [
1991
+ "reasoning"
1992
+ ],
1993
+ "context_window": 164000,
1994
+ "hf_id": "deepseek-ai/DeepSeek-V3.2",
1995
+ "size_b": 685.4,
1996
+ "hf_private": false
1997
+ },
1998
+ {
1999
+ "name": "nebius/minimax/minimax-m2.1",
2000
+ "type": "chat",
2001
+ "input_price_per_1m": 0.3,
2002
+ "output_price_per_1m": 1.2,
2003
+ "currency": "USD",
2004
+ "capabilities": [
2005
+ "reasoning"
2006
+ ],
2007
+ "context_window": 200000,
2008
+ "hf_id": "MiniMaxAI/MiniMax-M2.1",
2009
+ "size_b": 228.7,
2010
+ "hf_private": false
2011
+ },
2012
+ {
2013
+ "name": "novita/minimax-m2.7",
2014
  "type": "vision",
2015
  "input_price_per_1m": 0.3,
2016
  "output_price_per_1m": 1.2,
 
2026
  "size_source": "manual"
2027
  },
2028
  {
2029
+ "name": "novita/MiniMax-M2.7",
2030
  "type": "vision",
2031
  "input_price_per_1m": 0.3,
2032
  "output_price_per_1m": 1.2,
 
2056
  "hf_private": false
2057
  },
2058
  {
2059
+ "name": "minimaxi/MiniMax-M2.7",
2060
  "type": "vision",
2061
  "input_price_per_1m": 0.3,
2062
+ "output_price_per_1m": 1.2,
2063
  "currency": "USD",
2064
  "capabilities": [
2065
  "vision",
2066
  "reasoning"
2067
  ],
2068
+ "context_window": 200000,
2069
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2070
+ "hf_private": false,
2071
+ "size_b": 230,
2072
+ "size_source": "manual"
 
 
 
 
 
 
 
 
 
 
 
 
2073
  },
2074
  {
2075
+ "name": "minimaxi/MiniMax-M2.5",
2076
  "type": "vision",
2077
  "input_price_per_1m": 0.3,
2078
+ "output_price_per_1m": 1.2,
2079
  "currency": "USD",
2080
  "capabilities": [
2081
  "vision",
2082
  "reasoning"
2083
  ],
2084
+ "context_window": 200000,
2085
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2086
+ "size_b": 228.7,
2087
+ "hf_private": false
2088
  },
2089
  {
2090
+ "name": "minimaxi/MiniMax-M2",
2091
+ "type": "chat",
2092
  "input_price_per_1m": 0.3,
2093
+ "output_price_per_1m": 1.2,
2094
  "currency": "USD",
2095
+ "context_window": 200000,
2096
  "capabilities": [
2097
+ "tools",
2098
  "reasoning"
2099
  ],
2100
+ "hf_id": "MiniMaxAI/MiniMax-M2",
2101
+ "size_b": 228.7,
2102
+ "hf_private": false
2103
  },
2104
  {
2105
  "name": "together/Qwen/Qwen2.5-7B-Instruct-Turbo",
 
2122
  "hf_private": false
2123
  },
2124
  {
2125
+ "name": "xai/grok-3-mini",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2126
  "type": "chat",
2127
  "input_price_per_1m": 0.3,
2128
+ "output_price_per_1m": 0.5,
2129
  "currency": "USD",
2130
  "capabilities": [
2131
  "reasoning"
2132
  ],
2133
+ "context_window": 131072,
2134
+ "hf_private": true
 
 
2135
  },
2136
  {
2137
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3.1",
2138
  "type": "chat",
2139
  "input_price_per_1m": 0.3,
2140
+ "output_price_per_1m": 1,
2141
  "currency": "USD",
2142
+ "context_window": 163840,
2143
  "capabilities": [
2144
  "tools",
2145
  "reasoning"
2146
  ],
2147
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2148
+ "size_b": 671,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2149
  "hf_private": false
2150
  },
2151
  {
2152
+ "name": "coding/gemini-2.5-flash",
2153
  "type": "vision",
2154
  "input_price_per_1m": 0.3,
2155
+ "output_price_per_1m": 2.5,
2156
  "currency": "USD",
2157
  "capabilities": [
2158
  "vision",
2159
  "reasoning"
2160
  ],
2161
+ "context_window": 1048576,
2162
+ "hf_private": true
 
 
 
2163
  },
2164
  {
2165
  "name": "deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct",
 
2211
  ],
2212
  "hf_private": true
2213
  },
 
 
 
 
 
 
 
 
 
 
 
 
2214
  {
2215
  "name": "mistral/devstral-medium-2507",
2216
  "type": "chat",
 
2241
  "context_window": 131072,
2242
  "hf_private": true
2243
  },
2244
+ {
2245
+ "name": "nebius/zai-org/GLM-4.7",
2246
+ "type": "chat",
2247
+ "input_price_per_1m": 0.4,
2248
+ "output_price_per_1m": 2,
2249
+ "currency": "USD",
2250
+ "capabilities": [
2251
+ "reasoning"
2252
+ ],
2253
+ "context_window": 200000,
2254
+ "hf_id": "zai-org/GLM-4.7",
2255
+ "size_b": 358.3,
2256
+ "hf_private": false
2257
+ },
2258
+ {
2259
+ "name": "nebius/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2260
+ "type": "chat",
2261
+ "input_price_per_1m": 0.4,
2262
+ "output_price_per_1m": 1.8,
2263
+ "currency": "USD",
2264
+ "context_window": 262000,
2265
+ "size_b": 480,
2266
+ "capabilities": [
2267
+ "tools"
2268
+ ],
2269
+ "hf_id": "Qwen/Qwen3-Coder-480B-A35B-Instruct",
2270
+ "hf_private": false
2271
+ },
2272
  {
2273
  "name": "novita/deepseek/deepseek-v3-0324",
2274
  "type": "chat",
 
2293
  "context_window": 128000,
2294
  "hf_private": true
2295
  },
2296
+ {
2297
+ "name": "openai/gpt-4.1-mini",
2298
+ "type": "vision",
2299
+ "input_price_per_1m": 0.4,
2300
+ "output_price_per_1m": 1.6,
2301
+ "currency": "USD",
2302
+ "capabilities": [
2303
+ "vision"
2304
+ ],
2305
+ "context_window": 1047576,
2306
+ "hf_private": true
2307
+ },
2308
  {
2309
  "name": "deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct",
2310
  "type": "chat",
 
2320
  "hf_private": false
2321
  },
2322
  {
2323
+ "name": "openai-responses/gpt-4.1-mini",
2324
  "type": "vision",
2325
  "input_price_per_1m": 0.4,
2326
  "output_price_per_1m": 1.6,
 
2332
  "hf_private": true
2333
  },
2334
  {
2335
+ "name": "azure/gpt-4.1-mini",
2336
  "type": "vision",
2337
  "input_price_per_1m": 0.4,
2338
  "output_price_per_1m": 1.6,
 
2344
  "hf_private": true
2345
  },
2346
  {
2347
+ "name": "azure/openai-responses/gpt-4.1-mini",
2348
  "type": "vision",
2349
  "input_price_per_1m": 0.4,
2350
  "output_price_per_1m": 1.6,
 
2355
  "context_window": 1047576,
2356
  "hf_private": true
2357
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2358
  {
2359
  "name": "google/gemini-3.1-flash-image-preview",
2360
  "type": "vision",
 
2419
  "context_window": 131072,
2420
  "hf_private": true
2421
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2422
  {
2423
  "name": "nebius/deepseek-ai/DeepSeek-V3-0324",
2424
  "type": "chat",
 
2438
  "name": "nebius/moonshotai/Kimi-K2-Instruct",
2439
  "type": "chat",
2440
  "input_price_per_1m": 0.5,
2441
+ "output_price_per_1m": 2.4,
2442
+ "currency": "USD",
2443
+ "context_window": 131000,
2444
+ "capabilities": [
2445
+ "tools"
2446
+ ],
2447
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
2448
+ "size_b": 1026.5,
2449
+ "hf_private": false
2450
+ },
2451
+ {
2452
+ "name": "nebius/moonshotai/kimi-k2.5",
2453
+ "type": "vision",
2454
+ "input_price_per_1m": 0.5,
2455
+ "output_price_per_1m": 2.5,
2456
  "currency": "USD",
 
2457
  "capabilities": [
2458
+ "vision",
2459
+ "reasoning"
2460
  ],
2461
+ "context_window": 256000,
2462
+ "hf_id": "moonshotai/Kimi-K2.5",
2463
+ "size_b": 1058.6,
2464
  "hf_private": false
2465
  },
2466
  {
 
2519
  "hf_private": false
2520
  },
2521
  {
2522
+ "name": "moonshot/kimi-k2-0905-preview",
2523
+ "type": "chat",
2524
  "input_price_per_1m": 0.6,
2525
+ "output_price_per_1m": 2.5,
2526
  "currency": "USD",
2527
+ "context_window": 131072,
2528
  "capabilities": [
2529
+ "tools"
 
2530
  ],
2531
+ "hf_id": "moonshotai/Kimi-K2-Instruct-0905",
2532
+ "size_b": 1026.5,
 
2533
  "hf_private": false
2534
  },
2535
  {
 
2591
  "hf_private": false
2592
  },
2593
  {
2594
+ "name": "alibaba/qwen3.5",
2595
+ "type": "vision",
2596
  "input_price_per_1m": 0.6,
2597
+ "output_price_per_1m": 3.6,
2598
  "currency": "USD",
 
2599
  "capabilities": [
2600
+ "vision",
2601
+ "reasoning"
2602
  ],
2603
+ "context_window": 256000,
2604
+ "size_b": 9,
2605
+ "hf_id": "Qwen/Qwen3.5-9B",
2606
  "hf_private": false
2607
  },
2608
  {
2609
+ "name": "nebius/zai-org/GLM-4.5",
2610
  "type": "chat",
2611
  "input_price_per_1m": 0.6,
2612
  "output_price_per_1m": 2.2,
2613
  "currency": "USD",
2614
+ "context_window": 128000,
2615
  "capabilities": [
2616
  "tools",
2617
  "reasoning"
2618
  ],
2619
+ "hf_id": "zai-org/GLM-4.5",
2620
+ "size_b": 358.3,
2621
  "hf_private": false
2622
  },
2623
  {
2624
+ "name": "novita/zai-org/glm-4.6",
2625
  "type": "chat",
2626
  "input_price_per_1m": 0.6,
2627
  "output_price_per_1m": 2.2,
2628
  "currency": "USD",
2629
+ "context_window": 204800,
2630
  "capabilities": [
2631
  "tools",
2632
  "reasoning"
2633
  ],
2634
+ "hf_id": "zai-org/GLM-4.6",
2635
+ "size_b": 356.8,
2636
  "hf_private": false
2637
  },
2638
  {
2639
+ "name": "novita/zai-org/glm-4.5",
2640
  "type": "chat",
2641
  "input_price_per_1m": 0.6,
2642
  "output_price_per_1m": 2.2,
 
2651
  "hf_private": false
2652
  },
2653
  {
2654
+ "name": "minimaxi/MiniMax-M2.7-highspeed",
2655
+ "type": "vision",
2656
  "input_price_per_1m": 0.6,
2657
+ "output_price_per_1m": 2.4,
2658
  "currency": "USD",
2659
  "capabilities": [
2660
+ "vision",
2661
  "reasoning"
2662
  ],
2663
  "context_window": 200000,
2664
+ "hf_id": "MiniMaxAI/MiniMax-M2.7",
2665
+ "hf_private": false,
2666
+ "size_b": 230,
2667
+ "size_source": "manual"
2668
  },
2669
  {
2670
+ "name": "minimaxi/MiniMax-M2.5-highspeed",
2671
+ "type": "vision",
2672
  "input_price_per_1m": 0.6,
2673
+ "output_price_per_1m": 2.4,
2674
  "currency": "USD",
2675
  "capabilities": [
2676
+ "vision",
2677
  "reasoning"
2678
  ],
2679
+ "context_window": 200000,
2680
+ "hf_id": "MiniMaxAI/MiniMax-M2.5",
2681
+ "size_b": 228.7,
2682
  "hf_private": false
2683
  },
2684
  {
 
2696
  "hf_private": false
2697
  },
2698
  {
2699
+ "name": "zai/GLM-4.7",
2700
  "type": "chat",
2701
  "input_price_per_1m": 0.6,
2702
  "output_price_per_1m": 2.2,
2703
  "currency": "USD",
 
2704
  "capabilities": [
 
2705
  "reasoning"
2706
  ],
2707
+ "context_window": 200000,
2708
+ "hf_id": "zai-org/GLM-4.7",
2709
  "size_b": 358.3,
2710
  "hf_private": false
2711
  },
2712
  {
2713
+ "name": "zai/GLM-4.5",
2714
+ "type": "chat",
2715
  "input_price_per_1m": 0.6,
2716
+ "output_price_per_1m": 2.2,
2717
  "currency": "USD",
2718
  "capabilities": [
 
2719
  "reasoning"
2720
  ],
2721
+ "context_window": 131072,
2722
+ "hf_id": "zai-org/GLM-4.5",
2723
+ "size_b": 358.3,
2724
+ "hf_private": false
 
2725
  },
2726
  {
2727
+ "name": "deepinfra/zai-org/GLM-4.5",
2728
+ "type": "chat",
2729
  "input_price_per_1m": 0.6,
2730
+ "output_price_per_1m": 2.2,
2731
  "currency": "USD",
2732
+ "context_window": 131072,
2733
  "capabilities": [
2734
+ "tools",
2735
  "reasoning"
2736
  ],
2737
+ "hf_id": "zai-org/GLM-4.5",
2738
+ "size_b": 358.3,
 
2739
  "hf_private": false
2740
  },
2741
  {
 
2802
  "hf_private": false
2803
  },
2804
  {
2805
+ "name": "openai/gpt-5.4-mini",
2806
  "type": "vision",
2807
  "input_price_per_1m": 0.75,
2808
  "output_price_per_1m": 4.5,
 
2815
  "hf_private": true
2816
  },
2817
  {
2818
+ "name": "openai-responses/gpt-5.4-mini",
2819
  "type": "vision",
2820
  "input_price_per_1m": 0.75,
2821
  "output_price_per_1m": 4.5,
 
2828
  "hf_private": true
2829
  },
2830
  {
2831
+ "name": "nebius/deepseek-ai/DeepSeek-R1-0528",
2832
  "type": "chat",
2833
  "input_price_per_1m": 0.8,
2834
+ "output_price_per_1m": 2.4,
2835
  "currency": "USD",
2836
+ "context_window": 164000,
 
2837
  "capabilities": [
2838
+ "tools",
2839
+ "reasoning"
2840
  ],
2841
+ "hf_id": "deepseek-ai/DeepSeek-R1-0528",
2842
+ "size_b": 684.5,
2843
  "hf_private": false
2844
  },
2845
  {
 
2857
  "hf_private": false
2858
  },
2859
  {
2860
+ "name": "novita/qwen/qwen2.5-vl-72b-instruct",
2861
  "type": "chat",
2862
  "input_price_per_1m": 0.8,
2863
  "output_price_per_1m": 0.8,
2864
  "currency": "USD",
2865
+ "context_window": 96000,
2866
+ "size_b": 72,
2867
+ "capabilities": [
2868
+ "vision"
2869
+ ],
2870
+ "hf_id": "Qwen/Qwen2.5-VL-72B-Instruct",
2871
  "hf_private": false
2872
  },
2873
  {
2874
+ "name": "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct",
2875
  "type": "chat",
2876
  "input_price_per_1m": 0.8,
2877
+ "output_price_per_1m": 0.8,
2878
  "currency": "USD",
2879
+ "context_window": 130815,
2880
+ "size_b": 405,
 
 
 
 
 
2881
  "hf_private": false
2882
  },
2883
  {
2884
+ "name": "deepinfra/deepseek-ai/DeepSeek-R1",
2885
  "type": "chat",
2886
  "input_price_per_1m": 0.85,
2887
+ "output_price_per_1m": 2.5,
2888
  "currency": "USD",
2889
+ "context_window": 64000,
2890
  "capabilities": [
2891
  "tools",
2892
  "reasoning"
2893
  ],
2894
+ "hf_id": "deepseek-ai/DeepSeek-R1",
2895
  "size_b": 671,
2896
+ "size_source": "manual",
2897
  "hf_private": false
2898
  },
2899
  {
2900
+ "name": "deepinfra/deepseek-ai/DeepSeek-V3",
2901
  "type": "chat",
2902
  "input_price_per_1m": 0.85,
2903
+ "output_price_per_1m": 0.9,
2904
  "currency": "USD",
2905
+ "context_window": 128000,
2906
  "capabilities": [
2907
  "tools",
2908
  "reasoning"
2909
  ],
2910
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
2911
  "size_b": 671,
 
2912
  "hf_private": false
2913
  },
2914
  {
 
2924
  "hf_private": true
2925
  },
2926
  {
2927
+ "name": "together/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
2928
  "type": "chat",
2929
  "input_price_per_1m": 0.88,
2930
  "output_price_per_1m": 0.88,
2931
  "currency": "USD",
2932
  "context_window": 131072,
2933
  "size_b": 70,
 
 
 
 
2934
  "hf_private": false
2935
  },
2936
  {
2937
+ "name": "together/meta-llama/Llama-3.3-70B-Instruct-Turbo",
2938
  "type": "chat",
2939
  "input_price_per_1m": 0.88,
2940
  "output_price_per_1m": 0.88,
2941
  "currency": "USD",
2942
  "context_window": 131072,
2943
  "size_b": 70,
2944
+ "capabilities": [
2945
+ "tools"
2946
+ ],
2947
+ "hf_id": "meta-llama/Llama-3.3-70B-Instruct",
2948
  "hf_private": false
2949
  },
2950
  {
 
2984
  "hf_private": true
2985
  },
2986
  {
2987
+ "name": "bedrock/claude-haiku-4-5",
2988
  "type": "vision",
2989
  "input_price_per_1m": 1,
2990
  "output_price_per_1m": 5,
 
2996
  "hf_private": true
2997
  },
2998
  {
2999
+ "name": "vertex/claude-haiku-4-5",
3000
  "type": "vision",
3001
  "input_price_per_1m": 1,
3002
  "output_price_per_1m": 5,
 
3021
  "size_b": 753.9,
3022
  "hf_private": false
3023
  },
3024
+ {
3025
+ "name": "openai/o3",
3026
+ "type": "vision",
3027
+ "input_price_per_1m": 1,
3028
+ "output_price_per_1m": 4,
3029
+ "currency": "USD",
3030
+ "capabilities": [
3031
+ "vision",
3032
+ "reasoning"
3033
+ ],
3034
+ "context_window": 200000,
3035
+ "hf_private": true
3036
+ },
3037
  {
3038
  "name": "zai/GLM-5",
3039
  "type": "vision",
 
3050
  "hf_private": false
3051
  },
3052
  {
3053
+ "name": "perplexity/sonar",
3054
+ "type": "chat",
3055
  "input_price_per_1m": 1,
3056
+ "output_price_per_1m": 1,
3057
  "currency": "USD",
3058
+ "context_window": 131072,
3059
  "capabilities": [
3060
  "vision"
3061
  ],
 
3062
  "hf_private": true
3063
  },
3064
  {
3065
+ "name": "anthropic/claude-haiku-4-5",
3066
+ "type": "vision",
3067
  "input_price_per_1m": 1,
3068
+ "output_price_per_1m": 5,
3069
  "currency": "USD",
 
3070
  "capabilities": [
3071
+ "vision"
3072
  ],
3073
+ "context_window": 200000,
3074
+ "hf_private": true
 
3075
  },
3076
  {
3077
  "name": "groq/moonshotai/kimi-k2-instruct",
 
3088
  "hf_private": false
3089
  },
3090
  {
3091
+ "name": "groq/moonshotai/Kimi-K2-Instruct-0905",
3092
  "type": "chat",
3093
  "input_price_per_1m": 1,
3094
+ "output_price_per_1m": 3,
 
 
 
 
 
 
 
 
 
 
 
 
3095
  "currency": "USD",
3096
+ "context_window": 256000,
3097
  "capabilities": [
3098
+ "tools"
 
3099
  ],
3100
+ "hf_id": "moonshotai/Kimi-K2-Instruct",
3101
+ "size_b": 1026.5,
3102
+ "hf_private": false
3103
  },
3104
  {
3105
+ "name": "openai/o3-mini",
3106
  "type": "chat",
3107
  "input_price_per_1m": 1.1,
3108
  "output_price_per_1m": 4.4,
 
3126
  "hf_private": true
3127
  },
3128
  {
3129
+ "name": "openai-responses/o4-mini",
3130
  "type": "chat",
3131
  "input_price_per_1m": 1.1,
3132
  "output_price_per_1m": 4.4,
 
3138
  "hf_private": true
3139
  },
3140
  {
3141
+ "name": "azure/o4-mini",
3142
  "type": "chat",
3143
  "input_price_per_1m": 1.1,
3144
  "output_price_per_1m": 4.4,
 
3174
  "hf_private": false
3175
  },
3176
  {
3177
+ "name": "google/gemini-2.5-pro",
3178
  "type": "vision",
3179
  "input_price_per_1m": 1.25,
3180
  "output_price_per_1m": 10,
 
3183
  "vision",
3184
  "reasoning"
3185
  ],
3186
+ "context_window": 1048576,
3187
  "hf_private": true
3188
  },
3189
  {
3190
+ "name": "vertex/gemini-2.5-pro",
3191
  "type": "vision",
3192
  "input_price_per_1m": 1.25,
3193
  "output_price_per_1m": 10,
 
3196
  "vision",
3197
  "reasoning"
3198
  ],
3199
+ "context_window": 1048576,
3200
  "hf_private": true
3201
  },
3202
  {
3203
+ "name": "openai/gpt-5.1-chat",
3204
  "type": "vision",
3205
  "input_price_per_1m": 1.25,
3206
  "output_price_per_1m": 10,
 
3209
  "vision",
3210
  "reasoning"
3211
  ],
3212
+ "context_window": 128000,
3213
  "hf_private": true
3214
  },
3215
  {
3216
+ "name": "openai/gpt-5.1",
3217
  "type": "vision",
3218
  "input_price_per_1m": 1.25,
3219
  "output_price_per_1m": 10,
 
3226
  "hf_private": true
3227
  },
3228
  {
3229
+ "name": "openai/gpt-5-chat",
3230
  "type": "vision",
3231
  "input_price_per_1m": 1.25,
3232
  "output_price_per_1m": 10,
 
3235
  "vision",
3236
  "reasoning"
3237
  ],
3238
+ "context_window": 128000,
3239
  "hf_private": true
3240
  },
3241
  {
3242
+ "name": "together/deepseek-ai/DeepSeek-V3",
3243
+ "type": "chat",
3244
  "input_price_per_1m": 1.25,
3245
+ "output_price_per_1m": 1.25,
3246
  "currency": "USD",
3247
+ "context_window": 131072,
3248
  "capabilities": [
3249
+ "tools",
3250
  "reasoning"
3251
  ],
3252
+ "hf_id": "deepseek-ai/DeepSeek-V3.1-Terminus",
3253
+ "size_b": 671,
3254
+ "hf_private": false
3255
  },
3256
  {
3257
+ "name": "openai-responses/gpt-5.1-codex",
3258
  "type": "vision",
3259
  "input_price_per_1m": 1.25,
3260
  "output_price_per_1m": 10,
 
3263
  "vision",
3264
  "reasoning"
3265
  ],
3266
+ "context_window": 400000,
3267
  "hf_private": true
3268
  },
3269
  {
3270
+ "name": "openai-responses/gpt-5.1",
3271
+ "type": "vision",
3272
  "input_price_per_1m": 1.25,
3273
  "output_price_per_1m": 10,
3274
  "currency": "USD",
3275
  "capabilities": [
3276
+ "vision",
3277
  "reasoning"
3278
  ],
3279
+ "context_window": 400000,
3280
  "hf_private": true
3281
  },
3282
  {
3283
+ "name": "openai-responses/gpt-5-codex",
3284
+ "type": "vision",
3285
  "input_price_per_1m": 1.25,
3286
  "output_price_per_1m": 10,
3287
  "currency": "USD",
3288
  "capabilities": [
3289
+ "vision",
3290
  "reasoning"
3291
  ],
3292
+ "context_window": 400000,
3293
  "hf_private": true
3294
  },
3295
  {
3296
+ "name": "openai-responses/gpt-5",
3297
+ "type": "vision",
3298
  "input_price_per_1m": 1.25,
3299
+ "output_price_per_1m": 10,
3300
  "currency": "USD",
 
3301
  "capabilities": [
3302
+ "vision",
3303
  "reasoning"
3304
  ],
3305
+ "context_window": 400000,
3306
+ "hf_private": true
 
3307
  },
3308
  {
3309
+ "name": "azure/gpt-5",
3310
+ "type": "chat",
3311
  "input_price_per_1m": 1.25,
3312
  "output_price_per_1m": 10,
3313
  "currency": "USD",
3314
  "capabilities": [
 
3315
  "reasoning"
3316
  ],
3317
+ "context_window": 200000,
3318
  "hf_private": true
3319
  },
3320
  {
3321
+ "name": "azure/gpt-5.1",
3322
+ "type": "chat",
3323
  "input_price_per_1m": 1.25,
3324
  "output_price_per_1m": 10,
3325
  "currency": "USD",
3326
  "capabilities": [
 
3327
  "reasoning"
3328
  ],
3329
+ "context_window": 200000,
3330
  "hf_private": true
3331
  },
3332
  {
3333
+ "name": "coding/gemini-2.5-pro",
3334
  "type": "vision",
3335
  "input_price_per_1m": 1.25,
3336
  "output_price_per_1m": 10,
 
3339
  "vision",
3340
  "reasoning"
3341
  ],
3342
+ "context_window": 1048576,
3343
  "hf_private": true
3344
  },
3345
  {
 
3375
  "hf_private": true
3376
  },
3377
  {
3378
+ "name": "openai/gpt-5.2-chat",
3379
  "type": "vision",
3380
  "input_price_per_1m": 1.75,
3381
  "output_price_per_1m": 14,
 
3388
  "hf_private": true
3389
  },
3390
  {
3391
+ "name": "openai/gpt-5.2",
3392
  "type": "vision",
3393
  "input_price_per_1m": 1.75,
3394
  "output_price_per_1m": 14,
 
3401
  "hf_private": true
3402
  },
3403
  {
3404
+ "name": "openai/gpt-5.3-chat",
3405
  "type": "vision",
3406
  "input_price_per_1m": 1.75,
3407
  "output_price_per_1m": 14,
 
3410
  "vision",
3411
  "reasoning"
3412
  ],
3413
+ "context_window": 128000,
3414
  "hf_private": true
3415
  },
3416
  {
3417
+ "name": "openai-responses/gpt-5.2-codex",
3418
  "type": "vision",
3419
  "input_price_per_1m": 1.75,
3420
  "output_price_per_1m": 14,
 
3427
  "hf_private": true
3428
  },
3429
  {
3430
+ "name": "openai-responses/gpt-5.3-chat",
3431
  "type": "vision",
3432
  "input_price_per_1m": 1.75,
3433
  "output_price_per_1m": 14,
 
3436
  "vision",
3437
  "reasoning"
3438
  ],
3439
+ "context_window": 128000,
 
 
 
 
 
 
 
 
 
 
 
 
3440
  "hf_private": true
3441
  },
3442
  {
3443
+ "name": "openai-responses/gpt-5.3-codex",
3444
  "type": "vision",
3445
  "input_price_per_1m": 1.75,
3446
  "output_price_per_1m": 14,
 
3453
  "hf_private": true
3454
  },
3455
  {
3456
+ "name": "openai-responses/gpt-5.2",
3457
  "type": "vision",
3458
  "input_price_per_1m": 1.75,
3459
  "output_price_per_1m": 14,
 
3466
  "hf_private": true
3467
  },
3468
  {
3469
+ "name": "azure/gpt-5.2",
3470
+ "type": "chat",
3471
  "input_price_per_1m": 1.75,
3472
  "output_price_per_1m": 14,
3473
  "currency": "USD",
3474
  "capabilities": [
 
3475
  "reasoning"
3476
  ],
3477
+ "context_window": 200000,
3478
  "hf_private": true
3479
  },
3480
  {
3481
+ "name": "azure/openai-responses/gpt-5.2-codex",
3482
  "type": "vision",
3483
  "input_price_per_1m": 1.75,
3484
  "output_price_per_1m": 14,
 
3487
  "vision",
3488
  "reasoning"
3489
  ],
3490
+ "context_window": 400000,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3491
  "hf_private": true
3492
  },
3493
  {
3494
+ "name": "azure/gpt-5.3-codex",
3495
  "type": "vision",
3496
+ "input_price_per_1m": 1.75,
3497
+ "output_price_per_1m": 14,
3498
  "currency": "USD",
3499
  "capabilities": [
3500
  "vision",
3501
  "reasoning"
3502
  ],
3503
+ "context_window": 400000,
3504
  "hf_private": true
3505
  },
3506
  {
3507
+ "name": "google/gemini-3-pro-preview",
3508
  "type": "vision",
3509
  "input_price_per_1m": 2,
3510
  "output_price_per_1m": 12,
 
3517
  "hf_private": true
3518
  },
3519
  {
3520
+ "name": "google/gemini-3.1-pro-preview",
3521
  "type": "vision",
3522
  "input_price_per_1m": 2,
3523
  "output_price_per_1m": 12,
 
3539
  "hf_private": true
3540
  },
3541
  {
3542
+ "name": "vertex/gemini-3-pro-preview",
3543
  "type": "vision",
3544
  "input_price_per_1m": 2,
3545
  "output_price_per_1m": 12,
 
3552
  "hf_private": true
3553
  },
3554
  {
3555
+ "name": "vertex/gemini-3.1-pro-preview",
3556
  "type": "vision",
3557
  "input_price_per_1m": 2,
3558
  "output_price_per_1m": 12,
 
3578
  "hf_private": true
3579
  },
3580
  {
3581
+ "name": "nebius/deepseek-ai/DeepSeek-V3-0324-fast",
3582
+ "type": "chat",
3583
+ "input_price_per_1m": 2,
3584
+ "output_price_per_1m": 6,
3585
+ "currency": "USD",
3586
+ "context_window": 128000,
3587
+ "hf_private": true
3588
+ },
3589
+ {
3590
+ "name": "openai/gpt-4.1",
3591
  "type": "vision",
3592
  "input_price_per_1m": 2,
3593
  "output_price_per_1m": 8,
 
3599
  "hf_private": true
3600
  },
3601
  {
3602
+ "name": "openai/o4-mini-deep-research",
3603
  "type": "vision",
3604
  "input_price_per_1m": 2,
3605
  "output_price_per_1m": 8,
3606
  "currency": "USD",
3607
  "capabilities": [
3608
+ "vision",
3609
+ "reasoning"
3610
  ],
3611
+ "context_window": 100000,
3612
  "hf_private": true
3613
  },
3614
  {
 
3625
  "hf_private": true
3626
  },
3627
  {
3628
+ "name": "xai/grok-4.2-beta",
3629
  "type": "vision",
3630
  "input_price_per_1m": 2,
3631
+ "output_price_per_1m": 6,
3632
  "currency": "USD",
3633
  "capabilities": [
3634
  "vision",
3635
  "reasoning"
3636
  ],
3637
+ "context_window": 2000000,
3638
  "hf_private": true
3639
  },
3640
  {
3641
+ "name": "xai/grok-2-1212",
3642
+ "type": "chat",
3643
+ "input_price_per_1m": 2,
3644
+ "output_price_per_1m": 10,
3645
+ "currency": "USD",
3646
+ "context_window": 131072,
3647
+ "hf_private": true
3648
+ },
3649
+ {
3650
+ "name": "openai-responses/gpt-4.1",
3651
  "type": "vision",
3652
  "input_price_per_1m": 2,
3653
  "output_price_per_1m": 8,
 
3659
  "hf_private": true
3660
  },
3661
  {
3662
+ "name": "azure/gpt-4.1",
3663
+ "type": "vision",
3664
  "input_price_per_1m": 2,
3665
+ "output_price_per_1m": 8,
3666
  "currency": "USD",
3667
+ "capabilities": [
3668
+ "vision"
3669
+ ],
3670
+ "context_window": 1047576,
3671
  "hf_private": true
3672
  },
3673
  {
3674
+ "name": "azure/openai-responses/gpt-4.1",
3675
  "type": "vision",
3676
+ "input_price_per_1m": 2,
3677
+ "output_price_per_1m": 8,
3678
  "currency": "USD",
3679
  "capabilities": [
3680
+ "vision"
 
3681
  ],
3682
+ "context_window": 1047576,
3683
  "hf_private": true
3684
  },
3685
  {
3686
+ "name": "openai/gpt-5.4",
3687
  "type": "vision",
3688
  "input_price_per_1m": 2.5,
3689
  "output_price_per_1m": 15,
 
3696
  "hf_private": true
3697
  },
3698
  {
3699
+ "name": "openai/gpt-4o-2024-05-13",
3700
  "type": "vision",
3701
  "input_price_per_1m": 2.5,
3702
  "output_price_per_1m": 10,
 
3708
  "hf_private": true
3709
  },
3710
  {
3711
+ "name": "openai/gpt-4o",
3712
  "type": "vision",
3713
  "input_price_per_1m": 2.5,
3714
+ "output_price_per_1m": 10,
3715
  "currency": "USD",
3716
  "capabilities": [
3717
+ "vision"
 
3718
  ],
3719
+ "context_window": 128000,
3720
  "hf_private": true
3721
  },
3722
  {
3723
+ "name": "openai/gpt-4o-2024-11-20",
3724
  "type": "vision",
3725
  "input_price_per_1m": 2.5,
3726
  "output_price_per_1m": 10,
 
3732
  "hf_private": true
3733
  },
3734
  {
3735
+ "name": "openai/gpt-4o-2024-08-06",
3736
  "type": "vision",
3737
  "input_price_per_1m": 2.5,
3738
  "output_price_per_1m": 10,
 
3744
  "hf_private": true
3745
  },
3746
  {
3747
+ "name": "openai-responses/gpt-5.4",
3748
+ "type": "vision",
3749
+ "input_price_per_1m": 2.5,
3750
+ "output_price_per_1m": 15,
3751
+ "currency": "USD",
3752
+ "capabilities": [
3753
+ "vision",
3754
+ "reasoning"
3755
+ ],
3756
+ "context_window": 1050000,
3757
+ "hf_private": true
3758
+ },
3759
+ {
3760
+ "name": "azure/openai-responses/gpt-5.4",
3761
  "type": "vision",
3762
  "input_price_per_1m": 2.5,
3763
+ "output_price_per_1m": 15,
3764
  "currency": "USD",
3765
  "capabilities": [
3766
+ "vision",
3767
+ "reasoning"
3768
  ],
3769
+ "context_window": 1050000,
3770
  "hf_private": true
3771
  },
3772
  {
3773
+ "name": "bedrock/claude-3-7-sonnet",
3774
  "type": "vision",
3775
  "input_price_per_1m": 3,
3776
  "output_price_per_1m": 15,
 
3779
  "vision",
3780
  "reasoning"
3781
  ],
3782
+ "context_window": 200000,
3783
  "hf_private": true
3784
  },
3785
  {
3786
+ "name": "bedrock/claude-sonnet-4",
3787
  "type": "vision",
3788
  "input_price_per_1m": 3,
3789
  "output_price_per_1m": 15,
 
3792
  "vision",
3793
  "reasoning"
3794
  ],
3795
+ "context_window": 200000,
3796
  "hf_private": true
3797
  },
3798
  {
3799
+ "name": "bedrock/claude-sonnet-4-6",
3800
  "type": "vision",
3801
  "input_price_per_1m": 3,
3802
  "output_price_per_1m": 15,
 
3809
  "hf_private": true
3810
  },
3811
  {
3812
+ "name": "bedrock/claude-sonnet-4-5",
3813
  "type": "vision",
3814
  "input_price_per_1m": 3,
3815
  "output_price_per_1m": 15,
3816
  "currency": "USD",
3817
  "capabilities": [
3818
+ "vision",
3819
+ "reasoning"
3820
  ],
3821
+ "context_window": 200000,
3822
  "hf_private": true
3823
  },
3824
  {
3825
+ "name": "vertex/claude-3-7-sonnet",
3826
  "type": "vision",
3827
  "input_price_per_1m": 3,
3828
  "output_price_per_1m": 15,
 
3835
  "hf_private": true
3836
  },
3837
  {
3838
+ "name": "vertex/claude-sonnet-4-5",
3839
  "type": "vision",
3840
  "input_price_per_1m": 3,
3841
  "output_price_per_1m": 15,
 
3848
  "hf_private": true
3849
  },
3850
  {
3851
+ "name": "vertex/claude-3-5-sonnet",
3852
  "type": "vision",
3853
  "input_price_per_1m": 3,
3854
  "output_price_per_1m": 15,
3855
  "currency": "USD",
3856
  "capabilities": [
3857
+ "vision"
 
3858
  ],
3859
  "context_window": 200000,
3860
  "hf_private": true
3861
  },
3862
  {
3863
+ "name": "vertex/claude-sonnet-4",
3864
  "type": "vision",
3865
  "input_price_per_1m": 3,
3866
  "output_price_per_1m": 15,
 
3869
  "vision",
3870
  "reasoning"
3871
  ],
3872
+ "context_window": 200000,
3873
  "hf_private": true
3874
  },
3875
  {
3876
+ "name": "together/deepseek-ai/DeepSeek-R1",
3877
+ "type": "chat",
3878
  "input_price_per_1m": 3,
3879
+ "output_price_per_1m": 7,
3880
  "currency": "USD",
3881
+ "context_window": 64000,
3882
  "capabilities": [
3883
+ "tools",
3884
  "reasoning"
3885
  ],
3886
+ "hf_id": "deepseek-ai/DeepSeek-R1",
3887
+ "size_b": 671,
3888
+ "size_source": "manual",
3889
+ "hf_private": false
3890
  },
3891
  {
3892
+ "name": "perplexity/sonar-pro",
3893
+ "type": "chat",
3894
  "input_price_per_1m": 3,
3895
  "output_price_per_1m": 15,
3896
  "currency": "USD",
3897
+ "context_window": 204800,
3898
  "capabilities": [
3899
+ "vision"
 
3900
  ],
 
3901
  "hf_private": true
3902
  },
3903
  {
3904
+ "name": "anthropic/claude-sonnet-4-6",
3905
  "type": "vision",
3906
  "input_price_per_1m": 3,
3907
  "output_price_per_1m": 15,
 
3910
  "vision",
3911
  "reasoning"
3912
  ],
3913
+ "context_window": 1000000,
3914
  "hf_private": true
3915
  },
3916
  {
3917
+ "name": "anthropic/claude-sonnet-4-5",
3918
  "type": "vision",
3919
  "input_price_per_1m": 3,
3920
  "output_price_per_1m": 15,
3921
  "currency": "USD",
3922
  "capabilities": [
3923
+ "vision",
3924
+ "reasoning"
3925
  ],
3926
+ "context_window": 1000000,
3927
  "hf_private": true
3928
  },
3929
  {
3930
+ "name": "anthropic/claude-sonnet-4",
3931
  "type": "vision",
3932
  "input_price_per_1m": 3,
3933
  "output_price_per_1m": 15,
 
3936
  "vision",
3937
  "reasoning"
3938
  ],
3939
+ "context_window": 1000000,
3940
  "hf_private": true
3941
  },
3942
  {
3943
+ "name": "xai/grok-4",
3944
+ "type": "vision",
3945
  "input_price_per_1m": 3,
3946
+ "output_price_per_1m": 15,
3947
  "currency": "USD",
 
3948
  "capabilities": [
3949
+ "vision"
 
3950
  ],
3951
+ "context_window": 256000,
3952
+ "hf_private": true
 
 
3953
  },
3954
  {
3955
+ "name": "coding/claude-sonnet-4-20250514",
3956
+ "type": "vision",
3957
  "input_price_per_1m": 3,
3958
  "output_price_per_1m": 15,
3959
  "currency": "USD",
 
3960
  "capabilities": [
3961
+ "vision",
3962
+ "reasoning"
3963
  ],
3964
+ "context_window": 200000,
3965
  "hf_private": true
3966
  },
3967
  {
 
3981
  "hf_private": false
3982
  },
3983
  {
3984
+ "name": "bedrock/claude-opus-4-5",
3985
  "type": "vision",
3986
  "input_price_per_1m": 5,
3987
  "output_price_per_1m": 25,
 
3990
  "vision",
3991
  "reasoning"
3992
  ],
3993
+ "context_window": 200000,
3994
  "hf_private": true
3995
  },
3996
  {
3997
+ "name": "bedrock/claude-opus-4-6",
3998
  "type": "vision",
3999
  "input_price_per_1m": 5,
4000
  "output_price_per_1m": 25,
 
4003
  "vision",
4004
  "reasoning"
4005
  ],
4006
+ "context_window": 1000000,
4007
  "hf_private": true
4008
  },
4009
  {
4010
+ "name": "vertex/claude-opus-4-6",
4011
+ "type": "vision",
4012
  "input_price_per_1m": 5,
4013
  "output_price_per_1m": 25,
4014
  "currency": "USD",
 
4015
  "capabilities": [
4016
+ "vision",
4017
+ "reasoning"
4018
  ],
4019
+ "context_window": 1000000,
4020
  "hf_private": true
4021
  },
4022
  {
4023
+ "name": "vertex/claude-opus-4-5",
4024
  "type": "vision",
4025
  "input_price_per_1m": 5,
4026
  "output_price_per_1m": 25,
 
4033
  "hf_private": true
4034
  },
4035
  {
4036
+ "name": "openai/chatgpt-4o",
4037
  "type": "vision",
4038
  "input_price_per_1m": 5,
4039
+ "output_price_per_1m": 15,
4040
  "currency": "USD",
4041
  "capabilities": [
4042
+ "vision"
 
4043
  ],
4044
+ "context_window": 128000,
4045
  "hf_private": true
4046
  },
4047
  {
4048
+ "name": "anthropic/claude-opus-4-6",
4049
  "type": "vision",
4050
  "input_price_per_1m": 5,
4051
  "output_price_per_1m": 25,
 
4054
  "vision",
4055
  "reasoning"
4056
  ],
4057
+ "context_window": 1000000,
4058
  "hf_private": true
4059
  },
4060
  {
4061
+ "name": "anthropic/claude-opus-4-5",
4062
  "type": "vision",
4063
  "input_price_per_1m": 5,
4064
  "output_price_per_1m": 25,
 
4067
  "vision",
4068
  "reasoning"
4069
  ],
4070
+ "context_window": 200000,
4071
  "hf_private": true
4072
  },
4073
  {
4074
+ "name": "xai/grok-3",
4075
+ "type": "chat",
4076
  "input_price_per_1m": 5,
4077
+ "output_price_per_1m": 25,
4078
  "currency": "USD",
4079
+ "context_window": 131072,
4080
  "capabilities": [
4081
+ "tools"
4082
  ],
 
4083
  "hf_private": true
4084
  },
4085
  {
 
4096
  "hf_private": true
4097
  },
4098
  {
4099
+ "name": "bedrock/claude-opus-4",
4100
  "type": "vision",
4101
  "input_price_per_1m": 15,
4102
  "output_price_per_1m": 75,
 
4109
  "hf_private": true
4110
  },
4111
  {
4112
+ "name": "vertex/claude-opus-4-1",
4113
  "type": "vision",
4114
  "input_price_per_1m": 15,
4115
  "output_price_per_1m": 75,
 
4122
  "hf_private": true
4123
  },
4124
  {
4125
+ "name": "vertex/claude-opus-4",
4126
  "type": "vision",
4127
  "input_price_per_1m": 15,
4128
+ "output_price_per_1m": 75,
4129
  "currency": "USD",
4130
  "capabilities": [
4131
  "vision",
4132
  "reasoning"
4133
  ],
4134
+ "context_window": 200000,
4135
  "hf_private": true
4136
  },
4137
  {
4138
+ "name": "openai/o1",
4139
  "type": "vision",
4140
  "input_price_per_1m": 15,
4141
+ "output_price_per_1m": 60,
4142
  "currency": "USD",
4143
  "capabilities": [
4144
  "vision",
 
4148
  "hf_private": true
4149
  },
4150
  {
4151
+ "name": "anthropic/claude-opus-4",
4152
  "type": "vision",
4153
  "input_price_per_1m": 15,
4154
  "output_price_per_1m": 75,
 
4161
  "hf_private": true
4162
  },
4163
  {
4164
+ "name": "anthropic/claude-opus-4-1",
4165
  "type": "vision",
4166
  "input_price_per_1m": 15,
4167
  "output_price_per_1m": 75,
 
4174
  "hf_private": true
4175
  },
4176
  {
4177
+ "name": "openai-responses/gpt-5-pro",
4178
  "type": "vision",
4179
  "input_price_per_1m": 15,
4180
+ "output_price_per_1m": 120,
4181
  "currency": "USD",
4182
  "capabilities": [
4183
  "vision",
4184
  "reasoning"
4185
  ],
4186
+ "context_window": 400000,
4187
  "hf_private": true
4188
  },
4189
  {
4190
+ "name": "coding/claude-opus-4-20250514",
4191
  "type": "vision",
4192
  "input_price_per_1m": 15,
4193
+ "output_price_per_1m": 75,
4194
  "currency": "USD",
4195
  "capabilities": [
4196
  "vision",
 
4213
  "hf_private": true
4214
  },
4215
  {
4216
+ "name": "openai/gpt-5.4-pro",
4217
  "type": "vision",
4218
  "input_price_per_1m": 30,
4219
  "output_price_per_1m": 180,
 
4226
  "hf_private": true
4227
  },
4228
  {
4229
+ "name": "openai-responses/gpt-5.4-pro",
4230
  "type": "vision",
4231
  "input_price_per_1m": 30,
4232
  "output_price_per_1m": 180,
 
4239
  "hf_private": true
4240
  },
4241
  {
4242
+ "name": "azure/openai-responses/gpt-5.4-pro",
4243
  "type": "vision",
4244
  "input_price_per_1m": 30,
4245
  "output_price_per_1m": 180,
 
4987
  {
4988
  "name": "whisper-large-v3",
4989
  "type": "audio",
 
 
4990
  "currency": "EUR",
4991
  "hf_id": "openai/whisper-large-v3",
4992
+ "size_b": 1.55,
4993
+ "hf_private": false,
4994
+ "price_per_minute": 0.003,
4995
+ "size_source": "manual"
4996
  },
4997
  {
4998
  "name": "holo2-30b-a3b",
 
5068
  {
5069
  "name": "voxtral-small-24b-2507",
5070
  "type": "audio",
 
 
5071
  "currency": "EUR",
5072
  "size_b": 24,
5073
  "capabilities": [
 
5075
  "tools"
5076
  ],
5077
  "hf_id": "mistralai/Voxtral-Small-24B-2507",
5078
+ "hf_private": false,
5079
+ "price_per_minute": 0.15
5080
  },
5081
  {
5082
  "name": "gemma-3-27b-it",
 
5309
  },
5310
  {
5311
  "name": "Voxtral Mini Transcribe 2",
5312
+ "type": "audio",
 
 
5313
  "currency": "USD",
5314
  "api_endpoint": "voxtral-mini-latest",
5315
+ "hf_private": true,
5316
+ "price_per_minute": 0.003
5317
  },
5318
  {
5319
  "name": "Voxtral Realtime",
5320
+ "type": "audio",
 
 
5321
  "currency": "USD",
5322
  "api_endpoint": "voxtral-mini-latest",
5323
+ "hf_private": true,
5324
+ "price_per_minute": 0.006
5325
  },
5326
  {
5327
  "name": "Voxtral Small",
5328
+ "type": "audio",
5329
  "input_price_per_1m": 0.004,
5330
  "output_price_per_1m": 0.3,
5331
  "currency": "USD",
 
5340
  },
5341
  {
5342
  "name": "Voxtral Mini",
5343
+ "type": "audio",
5344
  "input_price_per_1m": 0.001,
5345
  "output_price_per_1m": 0.04,
5346
  "currency": "USD",
 
6050
  "tools",
6051
  "eu-endpoint"
6052
  ],
6053
+ "hf_private": true,
6054
+ "audio_price_per_1m": 0.075
6055
  },
6056
  {
6057
  "name": "qwen/qwen3-vl-8b-instruct",
 
6296
  "tools"
6297
  ],
6298
  "size_b": 24,
6299
+ "hf_private": false,
6300
+ "audio_price_per_1m": 100
6301
  },
6302
  {
6303
  "name": "nvidia/llama-3.3-nemotron-super-49b-v1.5",
 
6328
  "reasoning",
6329
  "eu-endpoint"
6330
  ],
6331
+ "hf_private": true,
6332
+ "audio_price_per_1m": 0.3
6333
  },
6334
  {
6335
  "name": "z-ai/glm-4-32b",
 
6371
  "reasoning",
6372
  "eu-endpoint"
6373
  ],
6374
+ "hf_private": true,
6375
+ "audio_price_per_1m": 0.3
6376
  },
6377
  {
6378
  "name": "mistralai/devstral-small",
 
6415
  "tools",
6416
  "eu-endpoint"
6417
  ],
6418
+ "hf_private": true,
6419
+ "audio_price_per_1m": 0.7
6420
  },
6421
  {
6422
  "name": "meta-llama/llama-3.3-70b-instruct",
 
7200
  "reasoning",
7201
  "eu-endpoint"
7202
  ],
7203
+ "hf_private": true,
7204
+ "audio_price_per_1m": 0.5
7205
  },
7206
  {
7207
  "name": "bytedance-seed/seed-1.6",
 
7535
  "image-gen",
7536
  "eu-endpoint"
7537
  ],
7538
+ "hf_private": true,
7539
+ "audio_price_per_1m": 1
7540
  },
7541
  {
7542
  "name": "thedrummer/cydonia-24b-v4.1",
 
7574
  "reasoning",
7575
  "eu-endpoint"
7576
  ],
7577
+ "hf_private": true,
7578
+ "audio_price_per_1m": 1
7579
  },
7580
  {
7581
  "name": "x-ai/grok-3-mini",
 
7925
  "reasoning",
7926
  "eu-endpoint"
7927
  ],
7928
+ "hf_private": true,
7929
+ "audio_price_per_1m": 1
7930
  },
7931
  {
7932
  "name": "mistralai/mistral-large-2512",
 
8038
  "audio",
8039
  "audio-out"
8040
  ],
8041
+ "hf_private": true,
8042
+ "audio_price_per_1m": 0.6
8043
  },
8044
  {
8045
  "name": "z-ai/glm-4.5v",
 
8681
  "reasoning",
8682
  "eu-endpoint"
8683
  ],
8684
+ "hf_private": true,
8685
+ "audio_price_per_1m": 1.25
8686
  },
8687
  {
8688
  "name": "google/gemini-2.5-pro-preview",
 
8698
  "reasoning",
8699
  "eu-endpoint"
8700
  ],
8701
+ "hf_private": true,
8702
+ "audio_price_per_1m": 1.25
8703
  },
8704
  {
8705
  "name": "google/gemini-2.5-pro-preview-05-06",
 
8716
  "reasoning",
8717
  "eu-endpoint"
8718
  ],
8719
+ "hf_private": true,
8720
+ "audio_price_per_1m": 1.25
8721
  },
8722
  {
8723
  "name": "sao10k/l3-euryale-70b",
 
8851
  "tools",
8852
  "reasoning"
8853
  ],
8854
+ "hf_private": true,
8855
+ "audio_price_per_1m": 2
8856
  },
8857
  {
8858
  "name": "google/gemini-3.1-pro-preview",
 
8869
  "reasoning",
8870
  "eu-endpoint"
8871
  ],
8872
+ "hf_private": true,
8873
+ "audio_price_per_1m": 2
8874
  },
8875
  {
8876
  "name": "google/gemini-3-pro-image-preview",
 
8884
  "reasoning",
8885
  "eu-endpoint"
8886
  ],
8887
+ "hf_private": true,
8888
+ "audio_price_per_1m": 2
8889
  },
8890
  {
8891
  "name": "google/gemini-3-pro-preview",
 
8902
  "reasoning",
8903
  "eu-endpoint"
8904
  ],
8905
+ "hf_private": true,
8906
+ "audio_price_per_1m": 2
8907
  },
8908
  {
8909
  "name": "openai/o4-mini-deep-research",
 
9068
  "audio",
9069
  "audio-out"
9070
  ],
9071
+ "hf_private": true,
9072
+ "audio_price_per_1m": 32
9073
  },
9074
  {
9075
  "name": "amazon/nova-premier-v1",
 
9110
  "audio-out",
9111
  "tools"
9112
  ],
9113
+ "hf_private": true,
9114
+ "audio_price_per_1m": 40
9115
  },
9116
  {
9117
  "name": "cohere/command-a",
 
10092
  {
10093
  "name": "Whisper V3 Large",
10094
  "type": "audio",
 
 
10095
  "currency": "USD",
10096
  "hf_id": "openai/whisper-large-v3",
10097
+ "size_b": 1.55,
10098
+ "hf_private": false,
10099
+ "price_per_minute": 0.00185,
10100
+ "size_source": "manual"
10101
  },
10102
  {
10103
  "name": "Whisper Large v3 Turbo",
10104
  "type": "audio",
 
 
10105
  "currency": "USD",
10106
  "hf_id": "openai/whisper-large-v3-turbo",
10107
+ "size_b": 0.81,
10108
+ "hf_private": false,
10109
+ "price_per_minute": 0.0006666666666666666,
10110
+ "size_source": "manual"
10111
  }
10112
  ]
10113
  },
 
10127
  "image-gen"
10128
  ],
10129
  "price_per_image": 0.014,
 
 
10130
  "currency": "USD",
10131
  "category": "FLUX.2",
10132
  "size_b": 4,
 
10142
  "image-gen"
10143
  ],
10144
  "price_per_image": 0.015,
 
 
10145
  "currency": "USD",
10146
  "category": "FLUX.2",
10147
  "size_b": 9,
 
10157
  "image-gen"
10158
  ],
10159
  "price_per_image": 0.025,
 
 
10160
  "currency": "USD",
10161
  "category": "FLUX.1",
10162
  "size_b": 12,
 
10172
  "image-gen"
10173
  ],
10174
  "price_per_image": 0.03,
 
 
10175
  "currency": "USD",
10176
  "category": "FLUX.2",
10177
  "size_b": 32,
 
10187
  "image-gen"
10188
  ],
10189
  "price_per_image": 0.04,
 
 
10190
  "currency": "USD",
10191
  "category": "FLUX.1",
10192
  "hf_id": "black-forest-labs/FLUX.1-pro",
 
10202
  "image-gen"
10203
  ],
10204
  "price_per_image": 0.04,
 
 
10205
  "currency": "USD",
10206
  "category": "FLUX.1",
10207
  "hf_id": "black-forest-labs/FLUX.1-pro",
 
10217
  "image-gen"
10218
  ],
10219
  "price_per_image": 0.05,
 
 
10220
  "currency": "USD",
10221
  "category": "FLUX.2",
10222
  "size_b": 32,
 
10232
  "image-gen"
10233
  ],
10234
  "price_per_image": 0.05,
 
 
10235
  "currency": "USD",
10236
  "category": "FLUX.1",
10237
  "hf_id": "black-forest-labs/FLUX.1-pro",
 
10247
  "image-gen"
10248
  ],
10249
  "price_per_image": 0.05,
 
 
10250
  "currency": "USD",
10251
  "category": "FLUX.1 Tools",
10252
  "hf_id": "black-forest-labs/FLUX.1-pro",
 
10262
  "image-gen"
10263
  ],
10264
  "price_per_image": 0.06,
 
 
10265
  "currency": "USD",
10266
  "category": "FLUX.1",
10267
  "hf_id": "black-forest-labs/FLUX.1-pro",
 
10277
  "image-gen"
10278
  ],
10279
  "price_per_image": 0.07,
 
 
10280
  "currency": "USD",
10281
  "category": "FLUX.2",
10282
  "size_b": 32,
 
10292
  "image-gen"
10293
  ],
10294
  "price_per_image": 0.08,
 
 
10295
  "currency": "USD",
10296
  "category": "FLUX.1",
10297
  "hf_id": "black-forest-labs/FLUX.1-pro",
scripts/fetch-providers.js CHANGED
@@ -48,7 +48,7 @@ function updateProviderModels(providers, providerName, models) {
48
  const existing = existingMap.get(newModel.name);
49
  if (!existing) return newModel;
50
 
51
- return {
52
  ...existing,
53
  ...newModel,
54
  size_b: newModel.size_b || existing.size_b,
@@ -56,10 +56,27 @@ function updateProviderModels(providers, providerName, models) {
56
  hf_id: newModel.hf_id || existing.hf_id,
57
  ollama_id: newModel.ollama_id || existing.ollama_id,
58
  hf_private: newModel.hf_private ?? existing.hf_private,
 
59
  capabilities: (newModel.capabilities && newModel.capabilities.length > 0)
60
  ? newModel.capabilities
61
  : existing.capabilities,
62
  };
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
63
  });
64
 
65
  return true;
@@ -72,16 +89,22 @@ const normName = (s) =>
72
  function estimateParams(config, hfId) {
73
  if (!config) return null;
74
  const h = config.hidden_size || config.d_model || config.n_embd;
75
- const l = config.num_hidden_layers || config.n_layer;
76
  const v = config.vocab_size;
77
- const i = config.intermediate_size || config.d_ff;
78
  const numExperts = config.num_local_experts || config.n_experts || config.num_experts || 1;
79
  const modelType = (config.model_type || '').toLowerCase();
 
 
 
 
 
 
80
 
81
  if (h && l && v) {
82
  const intermediate = i || (4 * h);
83
  const vocabParams = v * h;
84
- const posParams = (config.max_position_embeddings || 512) * h;
85
  const typeParams = (config.type_vocab_size || 0) * h;
86
  const embedParams = vocabParams + posParams + typeParams;
87
  const attentionParams = 4 * (h * h);
@@ -174,6 +197,16 @@ const MANUAL_HF_ID_MAP = {
174
  'mistral small 2501': 'mistralai/Mistral-Small-24B-Instruct-2501',
175
  'mistral small 2409': 'mistralai/Mistral-Small-Instruct-2409',
176
  'mistral small 24b': 'mistralai/Mistral-Small-24B-Instruct-2501',
 
 
 
 
 
 
 
 
 
 
177
  };
178
 
179
  const MANUAL_OLLAMA_ID_MAP = {
@@ -194,6 +227,17 @@ const MANUAL_SIZE_MAP = {
194
  'black-forest-labs/FLUX.2-max': 32,
195
  'black-forest-labs/FLUX.2-klein-4B': 4,
196
  'black-forest-labs/FLUX.2-klein-9B': 9,
 
 
 
 
 
 
 
 
 
 
 
197
  };
198
 
199
  const PROPRIETARY_KEYWORDS = [
 
48
  const existing = existingMap.get(newModel.name);
49
  if (!existing) return newModel;
50
 
51
+ const merged = {
52
  ...existing,
53
  ...newModel,
54
  size_b: newModel.size_b || existing.size_b,
 
56
  hf_id: newModel.hf_id || existing.hf_id,
57
  ollama_id: newModel.ollama_id || existing.ollama_id,
58
  hf_private: newModel.hf_private ?? existing.hf_private,
59
+ audio_price_per_1m: newModel.audio_price_per_1m || existing.audio_price_per_1m,
60
  capabilities: (newModel.capabilities && newModel.capabilities.length > 0)
61
  ? newModel.capabilities
62
  : existing.capabilities,
63
  };
64
+
65
+ // If new model uses a different pricing unit, clear the old ones
66
+ if (newModel.price_per_minute !== undefined) {
67
+ delete merged.input_price_per_1m;
68
+ delete merged.output_price_per_1m;
69
+ delete merged.price_per_image;
70
+ } else if (newModel.price_per_image !== undefined) {
71
+ delete merged.input_price_per_1m;
72
+ delete merged.output_price_per_1m;
73
+ delete merged.price_per_minute;
74
+ } else if (newModel.input_price_per_1m !== undefined) {
75
+ delete merged.price_per_image;
76
+ delete merged.price_per_minute;
77
+ }
78
+
79
+ return merged;
80
  });
81
 
82
  return true;
 
89
  function estimateParams(config, hfId) {
90
  if (!config) return null;
91
  const h = config.hidden_size || config.d_model || config.n_embd;
92
+ let l = config.num_hidden_layers || config.n_layer;
93
  const v = config.vocab_size;
94
+ const i = config.intermediate_size || config.d_ff || config.encoder_ffn_dim || config.decoder_ffn_dim;
95
  const numExperts = config.num_local_experts || config.n_experts || config.num_experts || 1;
96
  const modelType = (config.model_type || '').toLowerCase();
97
+ const isEncoderDecoder = config.is_encoder_decoder || !!(config.encoder_layers && config.decoder_layers);
98
+
99
+ if (isEncoderDecoder) {
100
+ // For encoder-decoder like Whisper/T5, we sum encoder and decoder layers
101
+ l = (config.encoder_layers || l) + (config.decoder_layers || 0);
102
+ }
103
 
104
  if (h && l && v) {
105
  const intermediate = i || (4 * h);
106
  const vocabParams = v * h;
107
+ const posParams = (config.max_position_embeddings || config.max_source_positions || 512) * h;
108
  const typeParams = (config.type_vocab_size || 0) * h;
109
  const embedParams = vocabParams + posParams + typeParams;
110
  const attentionParams = 4 * (h * h);
 
197
  'mistral small 2501': 'mistralai/Mistral-Small-24B-Instruct-2501',
198
  'mistral small 2409': 'mistralai/Mistral-Small-Instruct-2409',
199
  'mistral small 24b': 'mistralai/Mistral-Small-24B-Instruct-2501',
200
+ 'whisper large v3': 'openai/whisper-large-v3',
201
+ 'whisper large v3 turbo': 'openai/whisper-large-v3-turbo',
202
+ 'whisper large v2': 'openai/whisper-large-v2',
203
+ 'whisper medium': 'openai/whisper-medium',
204
+ 'whisper small': 'openai/whisper-small',
205
+ 'whisper base': 'openai/whisper-base',
206
+ 'whisper tiny': 'openai/whisper-tiny',
207
+ 'gemini 3.1 pro': 'google/gemini-3.1-pro-preview',
208
+ 'gemini 3.1 flash lite': 'google/gemini-3.1-flash-lite-preview',
209
+ 'gemini 3 flash': 'google/gemini-3-flash-preview',
210
  };
211
 
212
  const MANUAL_OLLAMA_ID_MAP = {
 
227
  'black-forest-labs/FLUX.2-max': 32,
228
  'black-forest-labs/FLUX.2-klein-4B': 4,
229
  'black-forest-labs/FLUX.2-klein-9B': 9,
230
+ 'openai/whisper-large-v3': 1.55,
231
+ 'openai/whisper-large-v3-turbo': 0.81,
232
+ 'openai/whisper-large-v2': 1.55,
233
+ 'openai/whisper-medium': 0.77,
234
+ 'openai/whisper-small': 0.24,
235
+ 'openai/whisper-base': 0.07,
236
+ 'openai/whisper-tiny': 0.04,
237
+ 'google/gemini-3.1-pro-preview': 292,
238
+ 'google/gemini-3.1-flash-lite-preview': 371,
239
+ 'google/gemini-3-flash-preview': 1000,
240
+ 'xiaomi/mimo-v2-omni': 186,
241
  };
242
 
243
  const PROPRIETARY_KEYWORDS = [
scripts/providers/groq.js CHANGED
@@ -118,10 +118,23 @@ async function fetchGroq() {
118
  const model = {
119
  name,
120
  type: tableType,
121
- input_price_per_1m: inputPrice,
122
- output_price_per_1m: outputPrice ?? 0,
123
  currency: 'USD',
124
  };
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
125
  if (size_b) model.size_b = size_b;
126
 
127
  models.push(model);
 
118
  const model = {
119
  name,
120
  type: tableType,
 
 
121
  currency: 'USD',
122
  };
123
+
124
+ if (tableType === 'audio') {
125
+ const headerText = headers[priceCol] || '';
126
+ if (headerText.includes('hour')) {
127
+ model.price_per_minute = inputPrice / 60;
128
+ } else {
129
+ // TTS: per M characters
130
+ model.input_price_per_1m = inputPrice;
131
+ model.output_price_per_1m = 0;
132
+ }
133
+ } else {
134
+ model.input_price_per_1m = inputPrice;
135
+ model.output_price_per_1m = outputPrice ?? 0;
136
+ }
137
+
138
  if (size_b) model.size_b = size_b;
139
 
140
  models.push(model);
scripts/providers/infomaniak.js CHANGED
@@ -106,10 +106,16 @@ async function fetchInfomaniak() {
106
  const model = {
107
  name,
108
  type,
109
- input_price_per_1m: inputPrice,
110
- output_price_per_1m: outputPrice ?? 0,
111
  currency,
112
  };
 
 
 
 
 
 
 
 
113
  if (size_b) model.size_b = size_b;
114
 
115
  models.push(model);
 
106
  const model = {
107
  name,
108
  type,
 
 
109
  currency,
110
  };
111
+
112
+ if (type === 'audio') {
113
+ model.price_per_minute = inputPrice;
114
+ } else {
115
+ model.input_price_per_1m = inputPrice;
116
+ model.output_price_per_1m = outputPrice ?? 0;
117
+ }
118
+
119
  if (size_b) model.size_b = size_b;
120
 
121
  models.push(model);
scripts/providers/mistral.js CHANGED
@@ -35,6 +35,13 @@ const MODEL_TYPE_MAP = {
35
  'other models': 'chat',
36
  };
37
 
 
 
 
 
 
 
 
38
  function extractApisArray(payload) {
39
  // Find the "apis":[...] block in the RSC payload string
40
  const start = payload.indexOf('"apis":[{');
@@ -117,31 +124,53 @@ async function fetchMistral() {
117
  // Find input and output prices from the price array
118
  let inputPrice = null;
119
  let outputPrice = null;
 
 
120
 
121
  for (const p of api.price) {
122
  const label = (p.value || '').toLowerCase();
123
  const priceHtml = p.price_dollar || p.price_euro || '';
124
  const val = parseUsd(priceHtml);
125
- if (label.includes('input') || label.includes('in ')) {
126
- if (inputPrice === null) inputPrice = val;
 
 
 
 
 
 
 
 
127
  } else if (label.includes('output') || label.includes('out ')) {
128
- if (outputPrice === null) outputPrice = val;
129
  }
130
  }
131
 
132
  // Skip if we couldn't get any price
133
- if (inputPrice === null && outputPrice === null) continue;
134
 
135
- const type = MODEL_TYPE_MAP[rawType] || 'chat';
136
  const size_b = getSizeB(name);
137
 
138
  const model = {
139
  name,
140
  type,
141
- input_price_per_1m: inputPrice ?? 0,
142
- output_price_per_1m: outputPrice ?? 0,
143
  currency: 'USD',
144
  };
 
 
 
 
 
 
 
 
 
 
 
 
 
 
145
  if (size_b) model.size_b = size_b;
146
  if (endpoint) model.api_endpoint = endpoint;
147
 
@@ -162,9 +191,15 @@ if (require.main === module) {
162
  models.forEach((m) => { (byType[m.type] = byType[m.type] || []).push(m); });
163
  for (const [type, ms] of Object.entries(byType)) {
164
  console.log(` [${type}]`);
165
- ms.forEach((m) =>
166
- console.log(` ${m.name.padEnd(40)} $${m.input_price_per_1m} / $${m.output_price_per_1m}`)
167
- );
 
 
 
 
 
 
168
  }
169
  })
170
  .catch((err) => {
 
35
  'other models': 'chat',
36
  };
37
 
38
+ const getModelType = (name, rawType) => {
39
+ const n = (name || '').toLowerCase();
40
+ if (n.includes('voxtral')) return 'audio';
41
+ if (n.includes('embed')) return 'embedding';
42
+ return MODEL_TYPE_MAP[rawType] || 'chat';
43
+ };
44
+
45
  function extractApisArray(payload) {
46
  // Find the "apis":[...] block in the RSC payload string
47
  const start = payload.indexOf('"apis":[{');
 
124
  // Find input and output prices from the price array
125
  let inputPrice = null;
126
  let outputPrice = null;
127
+ let audioPrice = null;
128
+ let audioPriceMin = null;
129
 
130
  for (const p of api.price) {
131
  const label = (p.value || '').toLowerCase();
132
  const priceHtml = p.price_dollar || p.price_euro || '';
133
  const val = parseUsd(priceHtml);
134
+ if (val === null) continue;
135
+
136
+ if (label.includes('audio input') || label.includes('audio entrant')) {
137
+ // Check if it's per minute or per token
138
+ if (label.includes('min')) audioPriceMin = val;
139
+ else audioPrice = val;
140
+ } else if (label.includes('transcribe') || label.includes('reconnaissance')) {
141
+ audioPriceMin = val;
142
+ } else if (label.includes('input') || label.includes('in ')) {
143
+ inputPrice = val;
144
  } else if (label.includes('output') || label.includes('out ')) {
145
+ outputPrice = val;
146
  }
147
  }
148
 
149
  // Skip if we couldn't get any price
150
+ if (inputPrice === null && outputPrice === null && audioPriceMin === null) continue;
151
 
152
+ const type = getModelType(name, rawType);
153
  const size_b = getSizeB(name);
154
 
155
  const model = {
156
  name,
157
  type,
 
 
158
  currency: 'USD',
159
  };
160
+
161
+ if (audioPriceMin !== null) {
162
+ model.price_per_minute = audioPriceMin;
163
+ }
164
+ if (audioPrice !== null) {
165
+ model.audio_price_per_1m = audioPrice;
166
+ }
167
+ if (inputPrice !== null) {
168
+ model.input_price_per_1m = inputPrice;
169
+ }
170
+ if (outputPrice !== null) {
171
+ model.output_price_per_1m = outputPrice ?? 0;
172
+ }
173
+
174
  if (size_b) model.size_b = size_b;
175
  if (endpoint) model.api_endpoint = endpoint;
176
 
 
191
  models.forEach((m) => { (byType[m.type] = byType[m.type] || []).push(m); });
192
  for (const [type, ms] of Object.entries(byType)) {
193
  console.log(` [${type}]`);
194
+ ms.forEach((m) => {
195
+ let priceStr = '';
196
+ if (m.price_per_minute !== undefined) priceStr += `$${m.price_per_minute}/min `;
197
+ if (m.audio_price_per_1m !== undefined) priceStr += `(Audio: $${m.audio_price_per_1m}/M) `;
198
+ if (m.input_price_per_1m !== undefined || m.output_price_per_1m !== undefined) {
199
+ priceStr += `$${m.input_price_per_1m ?? 0} / $${m.output_price_per_1m ?? 0}`;
200
+ }
201
+ console.log(` ${m.name.padEnd(40)} ${priceStr.trim()}`);
202
+ });
203
  }
204
  })
205
  .catch((err) => {
scripts/providers/openrouter.js CHANGED
@@ -93,6 +93,7 @@ async function fetchOpenRouter() {
93
  const pricing = model.pricing || {};
94
  const inputPrice = toPerMillion(pricing.prompt);
95
  const outputPrice = toPerMillion(pricing.completion);
 
96
  // pricing.image: per-image cost for image-gen models (e.g. FLUX) — in USD per image
97
  // (NOT the same as per-pixel input cost on vision models like Gemini, which also have prompt price set)
98
  const imagePrice = parseFloat(pricing.image || '0');
@@ -103,7 +104,7 @@ async function fetchOpenRouter() {
103
  if (model.id === 'openrouter/free') continue;
104
  // Skip models with genuinely zero pricing across all fields (unpriced/placeholder entries).
105
  // Exception: models with a :free suffix are real free models and should be kept.
106
- if (inputPrice === 0 && outputPrice === 0 && imagePrice === 0 && !model.id.endsWith(':free')) continue;
107
 
108
  const type = getModelType(model.architecture);
109
  const capabilities = getCapabilities(model.architecture, model.supported_parameters);
@@ -123,6 +124,10 @@ async function fetchOpenRouter() {
123
 
124
  if (model.hugging_face_id) modelEntry.hf_id = model.hugging_face_id;
125
 
 
 
 
 
126
  // For pure image-gen models (no per-token pricing), store the per-image price
127
  if (imagePrice > 0 && inputPrice === 0 && outputPrice === 0) {
128
  modelEntry.price_per_image = Math.round(imagePrice * 100000) / 100000;
@@ -176,6 +181,15 @@ if (require.main === module) {
176
  const eu = models.filter(m => m.capabilities?.includes('eu-endpoint'));
177
  console.log(`Fetched ${models.length} models from OpenRouter API ${apiKey ? '(authenticated)' : '(public – set OPENROUTER_API_KEY for more models)'}`);
178
  console.log(` Free: ${free.length}, Vision: ${vision.length}, Image-gen: ${imageGen.length}, EU-Endpoint: ${eu.length}`);
 
 
 
 
 
 
 
 
 
179
  console.log('\nFirst 5 EU-available:');
180
  eu.slice(0, 5).forEach((m) =>
181
  console.log(` ${m.name.padEnd(55)} $${m.input_price_per_1m} / $${m.output_price_per_1m} [${m.type}]`)
 
93
  const pricing = model.pricing || {};
94
  const inputPrice = toPerMillion(pricing.prompt);
95
  const outputPrice = toPerMillion(pricing.completion);
96
+ const audioPrice = toPerMillion(pricing.audio);
97
  // pricing.image: per-image cost for image-gen models (e.g. FLUX) — in USD per image
98
  // (NOT the same as per-pixel input cost on vision models like Gemini, which also have prompt price set)
99
  const imagePrice = parseFloat(pricing.image || '0');
 
104
  if (model.id === 'openrouter/free') continue;
105
  // Skip models with genuinely zero pricing across all fields (unpriced/placeholder entries).
106
  // Exception: models with a :free suffix are real free models and should be kept.
107
+ if (inputPrice === 0 && outputPrice === 0 && imagePrice === 0 && audioPrice === 0 && !model.id.endsWith(':free')) continue;
108
 
109
  const type = getModelType(model.architecture);
110
  const capabilities = getCapabilities(model.architecture, model.supported_parameters);
 
124
 
125
  if (model.hugging_face_id) modelEntry.hf_id = model.hugging_face_id;
126
 
127
+ if (audioPrice > 0) {
128
+ modelEntry.audio_price_per_1m = Math.round(audioPrice * 10000) / 10000;
129
+ }
130
+
131
  // For pure image-gen models (no per-token pricing), store the per-image price
132
  if (imagePrice > 0 && inputPrice === 0 && outputPrice === 0) {
133
  modelEntry.price_per_image = Math.round(imagePrice * 100000) / 100000;
 
181
  const eu = models.filter(m => m.capabilities?.includes('eu-endpoint'));
182
  console.log(`Fetched ${models.length} models from OpenRouter API ${apiKey ? '(authenticated)' : '(public – set OPENROUTER_API_KEY for more models)'}`);
183
  console.log(` Free: ${free.length}, Vision: ${vision.length}, Image-gen: ${imageGen.length}, EU-Endpoint: ${eu.length}`);
184
+
185
+ const audioModels = models.filter(m => m.audio_price_per_1m > 0);
186
+ console.log(` Audio-priced models: ${audioModels.length}`);
187
+
188
+ console.log('\nSample Audio-priced models:');
189
+ audioModels.slice(0, 5).forEach((m) =>
190
+ console.log(` ${m.name.padEnd(55)} Audio: $${m.audio_price_per_1m}/M [${m.type}]`)
191
+ );
192
+
193
  console.log('\nFirst 5 EU-available:');
194
  eu.slice(0, 5).forEach((m) =>
195
  console.log(` ${m.name.padEnd(55)} $${m.input_price_per_1m} / $${m.output_price_per_1m} [${m.type}]`)
scripts/providers/scaleway.js CHANGED
@@ -97,10 +97,16 @@ async function fetchScaleway() {
97
  const model = {
98
  name,
99
  type,
100
- input_price_per_1m: inputPrice,
101
- output_price_per_1m: outputPrice ?? 0,
102
  currency: 'EUR',
103
  };
 
 
 
 
 
 
 
 
104
  if (size_b) model.size_b = size_b;
105
 
106
  models.push(model);
 
97
  const model = {
98
  name,
99
  type,
 
 
100
  currency: 'EUR',
101
  };
102
+
103
+ if (type === 'audio') {
104
+ model.price_per_minute = inputPrice;
105
+ } else {
106
+ model.input_price_per_1m = inputPrice;
107
+ model.output_price_per_1m = outputPrice ?? 0;
108
+ }
109
+
110
  if (size_b) model.size_b = size_b;
111
 
112
  models.push(model);
src/App.css CHANGED
@@ -146,6 +146,19 @@ tr.group-divider {
146
  color: var(--primary-color);
147
  }
148
 
 
 
 
 
 
 
 
 
 
 
 
 
 
149
  .model-name {
150
  font-weight: 600;
151
  font-family: 'JetBrains Mono', monospace;
 
146
  color: var(--primary-color);
147
  }
148
 
149
+ .price-stack {
150
+ display: flex;
151
+ flex-direction: column;
152
+ gap: 0.15rem;
153
+ }
154
+
155
+ .price-subtext {
156
+ font-size: 0.75rem;
157
+ color: #64748b;
158
+ font-weight: 500;
159
+ white-space: nowrap;
160
+ }
161
+
162
  .model-name {
163
  font-weight: 600;
164
  font-family: 'JetBrains Mono', monospace;
src/App.tsx CHANGED
@@ -12,6 +12,7 @@ interface Model {
12
  output_price_per_1m?: number
13
  price_per_image?: number
14
  price_per_minute?: number
 
15
  price_per_1m_tokens_30d?: number
16
  currency: string
17
  capabilities?: string[]
@@ -577,12 +578,23 @@ function App() {
577
  </td>
578
  <td className="size-cell">{model.size_b ? `${model.size_b}B` : '-'}</td>
579
  <td>
580
- {model.price_per_image !== undefined && !model.input_price_per_1m
581
- ? `$${model.price_per_image}/MP`
582
- : formatPrice(model.input_price_per_1m, model.currency)}
 
 
 
 
 
 
 
 
 
583
  </td>
584
  <td>
585
  {model.price_per_image !== undefined && !model.output_price_per_1m
 
 
586
  ? '–'
587
  : formatPrice(model.output_price_per_1m, model.currency)}
588
  </td>
 
12
  output_price_per_1m?: number
13
  price_per_image?: number
14
  price_per_minute?: number
15
+ audio_price_per_1m?: number
16
  price_per_1m_tokens_30d?: number
17
  currency: string
18
  capabilities?: string[]
 
578
  </td>
579
  <td className="size-cell">{model.size_b ? `${model.size_b}B` : '-'}</td>
580
  <td>
581
+ <div className="price-stack">
582
+ {model.price_per_image !== undefined && !model.input_price_per_1m
583
+ ? `$${model.price_per_image}/MP`
584
+ : model.price_per_minute !== undefined
585
+ ? `${formatPrice(model.price_per_minute, model.currency)}/min`
586
+ : formatPrice(model.input_price_per_1m, model.currency)}
587
+ {model.audio_price_per_1m !== undefined && (
588
+ <div className="price-subtext" title="Audio token price">
589
+ {CAP_ICON.audio} {formatPrice(model.audio_price_per_1m, model.currency)}/M
590
+ </div>
591
+ )}
592
+ </div>
593
  </td>
594
  <td>
595
  {model.price_per_image !== undefined && !model.output_price_per_1m
596
+ ? '–'
597
+ : model.price_per_minute !== undefined
598
  ? '–'
599
  : formatPrice(model.output_price_per_1m, model.currency)}
600
  </td>