zai-org/GLM-4.6
|
novita |
live |
0.6 |
2.2 |
204800 |
0.58 |
41 |
Yes |
No |
zai-org/GLM-4.6
|
zai-org |
live |
- |
- |
- |
1.72 |
61 |
Yes |
No |
deepseek-ai/DeepSeek-V3.2-Exp
|
novita |
live |
0.27 |
0.41 |
163840 |
0.68 |
37 |
Yes |
No |
openai/gpt-oss-120b
|
fireworks-ai |
live |
0.15 |
0.6 |
131072 |
0.98 |
148 |
Yes |
No |
openai/gpt-oss-120b
|
cerebras |
live |
0.25 |
0.69 |
- |
0.29 |
775 |
Yes |
No |
openai/gpt-oss-120b
|
nebius |
live |
0.15 |
0.6 |
131072 |
0.49 |
102 |
Yes |
Yes |
openai/gpt-oss-120b
|
novita |
offline |
0.1 |
0.5 |
131072 |
0.39 |
122 |
Yes |
Yes |
openai/gpt-oss-120b
|
together |
live |
0.15 |
0.6 |
131072 |
0.51 |
74 |
Yes |
Yes |
openai/gpt-oss-120b
|
nscale |
live |
0.1 |
0.4 |
131072 |
0.41 |
94 |
Yes |
Yes |
openai/gpt-oss-120b
|
groq |
live |
0.15 |
0.75 |
131072 |
0.13 |
442 |
Yes |
No |
openai/gpt-oss-120b
|
hyperbolic |
live |
0.3 |
0.3 |
131072 |
0.71 |
272 |
Yes |
No |
openai/gpt-oss-120b
|
sambanova |
live |
0.22 |
0.59 |
131072 |
1.73 |
346 |
Yes |
Yes |
openai/gpt-oss-120b
|
scaleway |
live |
- |
- |
- |
0.35 |
140 |
Yes |
Yes |
Qwen/Qwen3-VL-235B-A22B-Thinking
|
novita |
live |
0.98 |
3.95 |
131072 |
0.90 |
47 |
No |
No |
Qwen/Qwen3-VL-235B-A22B-Instruct
|
novita |
live |
0.3 |
1.5 |
131072 |
0.71 |
42 |
Yes |
Yes |
zai-org/GLM-4.6-FP8
|
zai-org |
live |
- |
- |
- |
1.30 |
53 |
Yes |
No |
openai/gpt-oss-20b
|
fireworks-ai |
live |
0.05 |
0.2 |
131072 |
0.61 |
246 |
Yes |
No |
openai/gpt-oss-20b
|
nebius |
live |
0.05 |
0.2 |
131072 |
0.47 |
61 |
Yes |
Yes |
openai/gpt-oss-20b
|
novita |
live |
0.05 |
0.2 |
131072 |
4.87 |
69 |
No |
Yes |
openai/gpt-oss-20b
|
together |
live |
0.05 |
0.2 |
131072 |
0.79 |
101 |
Yes |
No |
openai/gpt-oss-20b
|
nscale |
live |
0.05 |
0.2 |
131072 |
0.29 |
144 |
Yes |
Yes |
openai/gpt-oss-20b
|
groq |
live |
0.1 |
0.5 |
131072 |
0.13 |
881 |
Yes |
No |
openai/gpt-oss-20b
|
hyperbolic |
live |
0.1 |
0.1 |
131072 |
0.46 |
103 |
No |
No |
meta-llama/Llama-3.1-8B-Instruct
|
fireworks-ai |
live |
0.2 |
0.2 |
131072 |
0.39 |
178 |
No |
No |
meta-llama/Llama-3.1-8B-Instruct
|
cerebras |
live |
0.1 |
0.1 |
- |
0.21 |
1401 |
No |
No |
meta-llama/Llama-3.1-8B-Instruct
|
nebius |
live |
0.03 |
0.09 |
131072 |
0.43 |
160 |
Yes |
No |
meta-llama/Llama-3.1-8B-Instruct
|
novita |
live |
0.02 |
0.05 |
16384 |
0.72 |
68 |
No |
No |
meta-llama/Llama-3.1-8B-Instruct
|
nscale |
live |
0.06 |
0.06 |
131072 |
0.54 |
60 |
No |
Yes |
meta-llama/Llama-3.1-8B-Instruct
|
sambanova |
live |
0.1 |
0.2 |
16384 |
0.94 |
438 |
Yes |
Yes |
meta-llama/Llama-3.1-8B-Instruct
|
scaleway |
live |
- |
- |
- |
0.40 |
77 |
Yes |
Yes |
Kwaipilot/KAT-Dev
|
novita |
live |
0.15 |
0.4 |
65536 |
1.74 |
37 |
Yes |
Yes |
Qwen/Qwen3-Next-80B-A3B-Instruct
|
novita |
live |
0.15 |
1.5 |
131072 |
0.77 |
116 |
Yes |
No |
Qwen/Qwen3-Next-80B-A3B-Instruct
|
together |
live |
0.15 |
1.5 |
262144 |
0.74 |
127 |
Yes |
Yes |
Qwen/Qwen3-Next-80B-A3B-Instruct
|
hyperbolic |
live |
0.3 |
0.3 |
262144 |
0.43 |
140 |
Yes |
No |
Qwen/Qwen3-4B-Instruct-2507
|
nscale |
live |
0.01 |
0.03 |
262144 |
0.41 |
60 |
Yes |
No |
moonshotai/Kimi-K2-Instruct-0905
|
novita |
live |
0.6 |
2.5 |
262144 |
2.23 |
14 |
Yes |
Yes |
moonshotai/Kimi-K2-Instruct-0905
|
together |
live |
1 |
3 |
262144 |
0.57 |
30 |
Yes |
Yes |
moonshotai/Kimi-K2-Instruct-0905
|
groq |
live |
- |
- |
262144 |
0.44 |
162 |
Yes |
No |
zai-org/GLM-4.5-Air
|
fireworks-ai |
live |
0.22 |
0.88 |
131072 |
0.71 |
108 |
Yes |
No |
zai-org/GLM-4.5-Air
|
nebius |
live |
0.2 |
1.2 |
131072 |
0.60 |
70 |
Yes |
Yes |
zai-org/GLM-4.5-Air
|
zai-org |
live |
- |
- |
- |
1.14 |
47 |
Yes |
No |
mistralai/Mistral-7B-Instruct-v0.3
|
novita |
live |
0.029 |
0.059 |
32768 |
0.78 |
113 |
No |
No |
mistralai/Mistral-7B-Instruct-v0.3
|
together |
live |
0.2 |
0.2 |
32768 |
0.21 |
186 |
No |
Yes |
swiss-ai/Apertus-8B-Instruct-2509
|
publicai |
live |
- |
- |
- |
1.26 |
31 |
No |
Yes |
deepseek-ai/DeepSeek-R1
|
fireworks-ai |
live |
3 |
8 |
163840 |
1.73 |
30 |
No |
No |
deepseek-ai/DeepSeek-R1
|
novita |
live |
0.7 |
2.5 |
64000 |
0.66 |
33 |
Yes |
No |
deepseek-ai/DeepSeek-R1
|
together |
live |
3 |
7 |
163840 |
0.60 |
55 |
No |
Yes |
deepseek-ai/DeepSeek-R1
|
hyperbolic |
live |
2 |
2 |
163840 |
1.20 |
46 |
No |
No |
deepseek-ai/DeepSeek-R1
|
sambanova |
live |
- |
- |
- |
0.96 |
130 |
Yes |
Yes |
meta-llama/Llama-3.2-1B-Instruct
|
novita |
live |
- |
- |
131000 |
0.81 |
204 |
No |
No |
meta-llama/Llama-3.2-1B-Instruct
|
sambanova |
offline |
- |
- |
- |
0.44 |
- |
- |
- |
deepseek-ai/DeepSeek-V3.1-Terminus
|
novita |
live |
0.27 |
1 |
98304 |
0.95 |
55 |
No |
Yes |
Qwen/Qwen2.5-VL-7B-Instruct
|
hyperbolic |
live |
0.2 |
0.2 |
32768 |
0.38 |
40 |
No |
No |
meta-llama/Meta-Llama-3-8B-Instruct
|
novita |
live |
0.04 |
0.04 |
8192 |
0.79 |
69 |
No |
No |
meta-llama/Meta-Llama-3-8B-Instruct
|
together |
offline |
- |
- |
- |
- |
- |
- |
- |
meta-llama/Meta-Llama-3-8B-Instruct
|
groq |
offline |
0.05 |
0.08 |
8192 |
0.19 |
1056 |
Yes |
No |
meta-llama/Llama-3.2-3B-Instruct
|
novita |
live |
0.03 |
0.05 |
32768 |
0.71 |
116 |
Yes |
No |
meta-llama/Llama-3.2-3B-Instruct
|
together |
live |
0.06 |
0.06 |
131072 |
0.29 |
153 |
Yes |
Yes |
meta-llama/Llama-3.2-3B-Instruct
|
hyperbolic |
live |
0.1 |
0.1 |
131072 |
0.50 |
144 |
No |
No |
meta-llama/Llama-3.2-3B-Instruct
|
sambanova |
offline |
- |
- |
- |
0.38 |
- |
- |
- |
Qwen/Qwen3-4B-Thinking-2507
|
nscale |
live |
0.01 |
0.03 |
262144 |
0.56 |
35 |
Yes |
No |
meta-llama/Llama-3.3-70B-Instruct
|
fireworks-ai |
live |
0.9 |
0.9 |
131072 |
0.54 |
93 |
No |
No |
meta-llama/Llama-3.3-70B-Instruct
|
cerebras |
live |
0.85 |
1.2 |
- |
0.26 |
1118 |
Yes |
No |
meta-llama/Llama-3.3-70B-Instruct
|
nebius |
live |
0.25 |
0.75 |
131072 |
0.31 |
128 |
Yes |
Yes |
meta-llama/Llama-3.3-70B-Instruct
|
novita |
live |
0.13 |
0.39 |
131072 |
0.56 |
32 |
Yes |
No |
meta-llama/Llama-3.3-70B-Instruct
|
together |
live |
0.88 |
0.88 |
131072 |
0.59 |
121 |
Yes |
Yes |
meta-llama/Llama-3.3-70B-Instruct
|
nscale |
live |
0.4 |
0.4 |
131072 |
0.70 |
17 |
No |
Yes |
meta-llama/Llama-3.3-70B-Instruct
|
groq |
live |
0.59 |
0.79 |
131072 |
0.14 |
373 |
Yes |
No |
meta-llama/Llama-3.3-70B-Instruct
|
hyperbolic |
live |
0.4 |
0.4 |
131072 |
0.89 |
81 |
No |
No |
meta-llama/Llama-3.3-70B-Instruct
|
sambanova |
live |
0.6 |
1.2 |
131072 |
0.32 |
320 |
Yes |
Yes |
meta-llama/Llama-3.3-70B-Instruct
|
scaleway |
live |
- |
- |
- |
0.60 |
25 |
Yes |
Yes |
zai-org/GLM-4.5
|
fireworks-ai |
live |
0.55 |
2.19 |
131072 |
1.14 |
62 |
Yes |
No |
zai-org/GLM-4.5
|
nebius |
live |
0.6 |
2.2 |
131072 |
0.37 |
33 |
Yes |
Yes |
zai-org/GLM-4.5
|
novita |
live |
0.6 |
2.2 |
131072 |
1.23 |
84 |
Yes |
No |
zai-org/GLM-4.5
|
zai-org |
live |
- |
- |
- |
1.17 |
77 |
Yes |
No |
Qwen/Qwen3-30B-A3B-Instruct-2507
|
nebius |
live |
0.1 |
0.3 |
262144 |
0.46 |
52 |
Yes |
Yes |
Qwen/Qwen2.5-7B-Instruct
|
together |
live |
0.3 |
0.3 |
32768 |
0.24 |
134 |
Yes |
Yes |
Qwen/Qwen3-8B
|
nscale |
live |
0.07 |
0.18 |
40960 |
0.47 |
53 |
Yes |
No |
Qwen/Qwen3-Next-80B-A3B-Thinking
|
novita |
live |
0.15 |
1.5 |
131072 |
0.83 |
143 |
Yes |
No |
Qwen/Qwen3-Next-80B-A3B-Thinking
|
together |
live |
0.15 |
1.5 |
262144 |
0.89 |
163 |
Yes |
Yes |
Qwen/Qwen3-Next-80B-A3B-Thinking
|
hyperbolic |
live |
0.3 |
0.3 |
262144 |
0.48 |
179 |
Yes |
No |
Qwen/Qwen3-Coder-30B-A3B-Instruct
|
fireworks-ai |
live |
0.15 |
0.6 |
262144 |
0.90 |
97 |
Yes |
No |
Qwen/Qwen3-Coder-30B-A3B-Instruct
|
nebius |
live |
0.1 |
0.3 |
262144 |
0.36 |
64 |
Yes |
Yes |
Qwen/Qwen3-Coder-30B-A3B-Instruct
|
scaleway |
live |
- |
- |
- |
0.49 |
105 |
Yes |
Yes |
google/gemma-3-27b-it
|
nebius |
live |
0.2 |
0.6 |
110000 |
0.40 |
77 |
No |
Yes |
google/gemma-3-27b-it
|
scaleway |
live |
- |
- |
- |
0.51 |
43 |
Yes |
Yes |
zai-org/GLM-4.5V
|
novita |
live |
0.6 |
1.8 |
65536 |
1.34 |
73 |
Yes |
No |
meta-llama/Llama-4-Scout-17B-16E-Instruct
|
fireworks-ai |
live |
0.15 |
0.6 |
1048576 |
0.49 |
68 |
Yes |
No |
meta-llama/Llama-4-Scout-17B-16E-Instruct
|
cerebras |
live |
0.65 |
0.85 |
- |
0.20 |
1139 |
Yes |
No |
meta-llama/Llama-4-Scout-17B-16E-Instruct
|
novita |
live |
0.1 |
0.5 |
131072 |
0.75 |
30 |
Yes |
No |
meta-llama/Llama-4-Scout-17B-16E-Instruct
|
together |
live |
0.18 |
0.59 |
1048576 |
0.25 |
40 |
Yes |
Yes |
meta-llama/Llama-4-Scout-17B-16E-Instruct
|
nscale |
live |
0.09 |
0.29 |
890000 |
0.43 |
34 |
Yes |
Yes |
meta-llama/Llama-4-Scout-17B-16E-Instruct
|
groq |
live |
0.11 |
0.34 |
131072 |
0.32 |
327 |
No |
No |
meta-llama/Llama-4-Scout-17B-16E-Instruct
|
sambanova |
offline |
- |
- |
- |
0.86 |
- |
- |
- |
moonshotai/Kimi-K2-Instruct
|
fireworks-ai |
live |
0.6 |
2.5 |
131072 |
1.86 |
34 |
Yes |
No |
moonshotai/Kimi-K2-Instruct
|
nebius |
live |
0.5 |
2.4 |
131072 |
0.44 |
62 |
Yes |
Yes |
moonshotai/Kimi-K2-Instruct
|
novita |
live |
0.57 |
2.3 |
131072 |
1.42 |
74 |
Yes |
Yes |
moonshotai/Kimi-K2-Instruct
|
together |
live |
1 |
3 |
131072 |
0.78 |
50 |
Yes |
Yes |
deepseek-ai/DeepSeek-V3.1
|
fireworks-ai |
live |
- |
- |
163840 |
1.36 |
68 |
Yes |
No |
deepseek-ai/DeepSeek-V3.1
|
novita |
live |
0.27 |
1 |
131072 |
1.10 |
57 |
Yes |
Yes |
deepseek-ai/DeepSeek-V3.1
|
together |
live |
0.6 |
1.7 |
131072 |
1.04 |
102 |
Yes |
No |
NousResearch/Hermes-4-70B
|
nebius |
live |
0.13 |
0.4 |
131072 |
0.33 |
66 |
No |
No |
deepseek-ai/DeepSeek-R1-Distill-Llama-8B
|
novita |
live |
0.04 |
0.04 |
32000 |
1.03 |
51 |
No |
Yes |
deepseek-ai/DeepSeek-R1-Distill-Llama-8B
|
nscale |
live |
0.05 |
0.05 |
131072 |
0.43 |
56 |
No |
Yes |
deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B
|
nscale |
live |
0.1 |
0.1 |
131072 |
0.43 |
131 |
No |
No |
swiss-ai/Apertus-70B-Instruct-2509
|
publicai |
live |
- |
- |
- |
0.91 |
45 |
No |
No |
google/gemma-2-2b-it
|
nebius |
live |
0.02 |
0.06 |
8192 |
0.46 |
115 |
No |
Yes |
Qwen/Qwen3-Coder-480B-A35B-Instruct
|
fireworks-ai |
live |
0.45 |
1.8 |
262144 |
0.64 |
30 |
Yes |
No |
Qwen/Qwen3-Coder-480B-A35B-Instruct
|
cerebras |
live |
2 |
2 |
- |
0.22 |
617 |
Yes |
No |
Qwen/Qwen3-Coder-480B-A35B-Instruct
|
nebius |
live |
0.4 |
1.8 |
262144 |
0.49 |
66 |
Yes |
Yes |
Qwen/Qwen3-Coder-480B-A35B-Instruct
|
novita |
live |
0.29 |
1.2 |
262144 |
0.78 |
53 |
Yes |
Yes |
Qwen/Qwen3-Coder-480B-A35B-Instruct
|
together |
live |
2 |
2 |
262144 |
0.73 |
46 |
Yes |
Yes |
Qwen/Qwen3-Coder-480B-A35B-Instruct
|
hyperbolic |
live |
2 |
2 |
262144 |
1.14 |
54 |
Yes |
No |
Qwen/Qwen3-14B
|
nebius |
live |
0.08 |
0.24 |
40960 |
0.45 |
78 |
Yes |
Yes |
Qwen/Qwen3-14B
|
nscale |
live |
0.07 |
0.2 |
40960 |
0.53 |
36 |
Yes |
Yes |
deepseek-ai/DeepSeek-R1-0528
|
fireworks-ai |
live |
3 |
8 |
163840 |
1.12 |
64 |
Yes |
No |
deepseek-ai/DeepSeek-R1-0528
|
nebius |
live |
0.8 |
2.4 |
163840 |
0.58 |
30 |
Yes |
Yes |
deepseek-ai/DeepSeek-R1-0528
|
novita |
live |
0.7 |
2.5 |
163840 |
0.87 |
22 |
Yes |
No |
deepseek-ai/DeepSeek-R1-0528
|
together |
live |
3 |
7 |
163840 |
0.52 |
67 |
No |
Yes |
deepseek-ai/DeepSeek-R1-0528
|
hyperbolic |
live |
3 |
3 |
163840 |
0.62 |
50 |
No |
No |
deepseek-ai/DeepSeek-R1-0528
|
sambanova |
live |
5 |
7 |
32768 |
1.69 |
128 |
Yes |
Yes |
HuggingFaceTB/SmolLM3-3B
|
hf-inference |
live |
- |
- |
- |
0.21 |
83 |
Yes |
Yes |
deepseek-ai/DeepSeek-V3-0324
|
fireworks-ai |
live |
0.9 |
0.9 |
163840 |
1.57 |
61 |
Yes |
No |
deepseek-ai/DeepSeek-V3-0324
|
nebius |
live |
0.75 |
2.25 |
32768 |
1.27 |
113 |
No |
No |
deepseek-ai/DeepSeek-V3-0324
|
novita |
live |
0.27 |
1.12 |
163840 |
1.09 |
30 |
Yes |
Yes |
deepseek-ai/DeepSeek-V3-0324
|
together |
live |
1.25 |
1.25 |
131072 |
0.79 |
44 |
Yes |
Yes |
deepseek-ai/DeepSeek-V3-0324
|
hyperbolic |
live |
1.25 |
1.25 |
163840 |
1.58 |
30 |
Yes |
No |
deepseek-ai/DeepSeek-V3-0324
|
sambanova |
live |
3 |
4.5 |
32768 |
0.55 |
190 |
Yes |
Yes |
Qwen/Qwen3-32B
|
cerebras |
live |
0.4 |
0.8 |
- |
0.24 |
790 |
No |
No |
Qwen/Qwen3-32B
|
nebius |
live |
0.1 |
0.3 |
40960 |
0.40 |
45 |
Yes |
Yes |
Qwen/Qwen3-32B
|
novita |
live |
0.1 |
0.45 |
40960 |
1.01 |
37 |
No |
No |
Qwen/Qwen3-32B
|
nscale |
live |
0.08 |
0.25 |
40960 |
0.64 |
26 |
Yes |
Yes |
Qwen/Qwen3-32B
|
groq |
live |
0.29 |
0.59 |
131072 |
0.16 |
247 |
Yes |
No |
Qwen/Qwen3-32B
|
sambanova |
live |
0.4 |
0.8 |
32768 |
1.24 |
234 |
Yes |
Yes |
Qwen/Qwen3-30B-A3B
|
fireworks-ai |
live |
0.15 |
0.6 |
131072 |
0.77 |
140 |
Yes |
No |
Qwen/Qwen3-30B-A3B
|
nebius |
live |
0.1 |
0.3 |
40960 |
0.43 |
87 |
Yes |
Yes |
Qwen/Qwen3-30B-A3B
|
novita |
live |
0.09 |
0.45 |
40960 |
0.81 |
91 |
No |
No |
mistralai/Mixtral-8x7B-Instruct-v0.1
|
together |
live |
0.6 |
0.6 |
32768 |
0.44 |
51 |
No |
Yes |
deepseek-ai/DeepSeek-R1-0528-Qwen3-8B
|
novita |
live |
0.06 |
0.09 |
128000 |
0.72 |
54 |
No |
No |
NousResearch/Hermes-3-Llama-3.1-405B
|
nebius |
live |
1 |
3 |
131072 |
0.51 |
30 |
No |
Yes |
Qwen/Qwen3-30B-A3B-Thinking-2507
|
nebius |
live |
0.1 |
0.3 |
262144 |
0.43 |
107 |
Yes |
Yes |
meta-llama/Llama-3.1-70B-Instruct
|
fireworks-ai |
live |
0.9 |
0.9 |
131072 |
1.04 |
105 |
No |
No |
Sao10K/L3-8B-Stheno-v3.2
|
novita |
live |
0.05 |
0.05 |
8192 |
0.95 |
98 |
No |
No |
deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
|
nscale |
live |
0.15 |
0.15 |
131072 |
0.37 |
69 |
No |
No |
deepseek-ai/DeepSeek-Prover-V2-671B
|
novita |
live |
0.7 |
2.5 |
160000 |
0.83 |
55 |
No |
No |
zai-org/GLM-4.5-Air-FP8
|
together |
live |
0.2 |
1.1 |
131072 |
0.36 |
117 |
Yes |
Yes |
baidu/ERNIE-4.5-VL-28B-A3B-PT
|
novita |
live |
0.14 |
0.56 |
30000 |
1.06 |
76 |
No |
No |
CohereLabs/aya-expanse-8b
|
cohere |
live |
- |
- |
- |
0.21 |
72 |
No |
No |
CohereLabs/c4ai-command-r7b-12-2024
|
cohere |
live |
- |
- |
- |
0.24 |
122 |
Yes |
No |
deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
|
novita |
live |
0.15 |
0.15 |
32768 |
1.12 |
53 |
No |
No |
deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
|
nscale |
live |
0.2 |
0.2 |
131072 |
0.44 |
36 |
No |
Yes |
Qwen/Qwen2.5-72B-Instruct
|
fireworks-ai |
offline |
- |
- |
- |
0.40 |
- |
Yes |
No |
Qwen/Qwen2.5-72B-Instruct
|
nebius |
live |
0.13 |
0.4 |
131072 |
0.48 |
26 |
Yes |
No |
Qwen/Qwen2.5-72B-Instruct
|
novita |
live |
0.38 |
0.4 |
32000 |
1.89 |
19 |
Yes |
No |
Qwen/Qwen2.5-72B-Instruct
|
together |
live |
1.2 |
1.2 |
131072 |
0.36 |
85 |
Yes |
Yes |
Qwen/Qwen2.5-72B-Instruct
|
hyperbolic |
live |
0.4 |
0.4 |
131072 |
1.22 |
25 |
No |
No |
Qwen/Qwen2.5-VL-72B-Instruct
|
nebius |
live |
0.25 |
0.75 |
32000 |
0.39 |
31 |
No |
Yes |
Qwen/Qwen2.5-VL-72B-Instruct
|
hyperbolic |
live |
0.6 |
0.6 |
32768 |
0.41 |
34 |
No |
No |
meta-llama/Llama-4-Maverick-17B-128E-Instruct
|
fireworks-ai |
live |
0.22 |
0.88 |
1048576 |
1.50 |
66 |
Yes |
No |
meta-llama/Llama-4-Maverick-17B-128E-Instruct
|
cerebras |
live |
0.2 |
0.6 |
- |
0.24 |
805 |
Yes |
No |
meta-llama/Llama-4-Maverick-17B-128E-Instruct
|
groq |
live |
0.2 |
0.6 |
131072 |
0.14 |
523 |
Yes |
No |
meta-llama/Llama-4-Maverick-17B-128E-Instruct
|
sambanova |
live |
0.63 |
1.8 |
131072 |
1.37 |
363 |
Yes |
Yes |
aisingapore/Gemma-SEA-LION-v4-27B-IT
|
publicai |
live |
- |
- |
- |
1.70 |
46 |
No |
Yes |
CohereLabs/command-a-reasoning-08-2025
|
cohere |
live |
- |
- |
- |
0.19 |
93 |
Yes |
No |
Qwen/Qwen3-235B-A22B-Instruct-2507
|
fireworks-ai |
live |
0.22 |
0.88 |
262144 |
0.81 |
36 |
Yes |
No |
Qwen/Qwen3-235B-A22B-Instruct-2507
|
cerebras |
live |
0.6 |
1.2 |
- |
0.24 |
465 |
Yes |
No |
Qwen/Qwen3-235B-A22B-Instruct-2507
|
nebius |
live |
0.2 |
0.6 |
262144 |
0.36 |
25 |
Yes |
Yes |
Qwen/Qwen3-235B-A22B-Instruct-2507
|
novita |
live |
0.15 |
0.8 |
131072 |
0.71 |
48 |
Yes |
Yes |
Qwen/Qwen3-235B-A22B-Instruct-2507
|
together |
live |
0.2 |
0.6 |
262144 |
0.43 |
45 |
Yes |
Yes |
Qwen/Qwen3-235B-A22B-Instruct-2507
|
nscale |
live |
0.2 |
0.6 |
32768 |
0.61 |
24 |
Yes |
Yes |
Qwen/Qwen3-235B-A22B-Instruct-2507
|
hyperbolic |
live |
2 |
2 |
262144 |
0.92 |
45 |
Yes |
No |
Qwen/Qwen3-235B-A22B-Instruct-2507
|
scaleway |
live |
- |
- |
- |
0.39 |
65 |
Yes |
Yes |
deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
|
novita |
live |
0.3 |
0.3 |
64000 |
0.83 |
21 |
No |
Yes |
deepseek-ai/DeepSeek-R1-Distill-Qwen-32B
|
nscale |
live |
0.3 |
0.3 |
131072 |
0.57 |
26 |
No |
Yes |
Qwen/Qwen2.5-Coder-32B-Instruct
|
together |
live |
0.8 |
0.8 |
16384 |
0.39 |
89 |
Yes |
Yes |
Qwen/Qwen2.5-Coder-32B-Instruct
|
nscale |
live |
0.06 |
0.2 |
131072 |
0.48 |
28 |
No |
Yes |
Qwen/Qwen2.5-Coder-32B-Instruct
|
hyperbolic |
live |
0.2 |
0.2 |
32768 |
1.66 |
82 |
No |
No |
Qwen/Qwen2.5-Coder-32B-Instruct
|
scaleway |
live |
- |
- |
- |
0.51 |
31 |
Yes |
No |
Qwen/Qwen3-235B-A22B-Thinking-2507
|
fireworks-ai |
live |
0.22 |
0.88 |
262144 |
0.95 |
51 |
Yes |
No |
Qwen/Qwen3-235B-A22B-Thinking-2507
|
cerebras |
live |
0.6 |
1.2 |
- |
0.23 |
605 |
No |
No |
Qwen/Qwen3-235B-A22B-Thinking-2507
|
novita |
live |
0.3 |
3 |
131072 |
0.93 |
41 |
Yes |
No |
meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8
|
novita |
live |
0.17 |
0.85 |
1048576 |
1.54 |
53 |
No |
No |
meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8
|
together |
live |
0.27 |
0.85 |
1048576 |
1.04 |
63 |
Yes |
Yes |
mistralai/Mistral-Small-24B-Instruct-2501
|
together |
live |
0.8 |
0.8 |
32768 |
0.28 |
61 |
Yes |
Yes |
CohereLabs/aya-expanse-32b
|
cohere |
live |
- |
- |
- |
0.15 |
64 |
No |
No |
Qwen/Qwen2.5-VL-32B-Instruct
|
fireworks-ai |
live |
0.22 |
0.88 |
128000 |
1.44 |
40 |
No |
No |
zai-org/GLM-4-32B-0414
|
novita |
live |
0.55 |
1.66 |
32000 |
1.06 |
36 |
No |
No |
NousResearch/Hermes-4-405B
|
nebius |
live |
1 |
3 |
131072 |
0.32 |
37 |
No |
No |
MiniMaxAI/MiniMax-M1-80k
|
novita |
live |
0.55 |
2.2 |
1000000 |
1.19 |
40 |
No |
No |
zai-org/GLM-4.1V-9B-Thinking
|
novita |
live |
0.035 |
0.138 |
65536 |
0.75 |
104 |
No |
No |
Qwen/Qwen2.5-Coder-7B-Instruct
|
nscale |
live |
0.01 |
0.03 |
131072 |
0.49 |
60 |
No |
Yes |
baidu/ERNIE-4.5-0.3B-PT
|
novita |
live |
- |
- |
120000 |
0.98 |
103 |
No |
No |
Qwen/Qwen3-235B-A22B
|
fireworks-ai |
live |
0.22 |
0.88 |
131072 |
0.79 |
59 |
Yes |
No |
Qwen/Qwen3-235B-A22B
|
novita |
live |
0.2 |
0.8 |
40960 |
1.73 |
9 |
No |
No |
Qwen/Qwen3-235B-A22B
|
together |
live |
0.2 |
0.6 |
40960 |
1.07 |
45 |
Yes |
Yes |
Qwen/Qwen3-235B-A22B
|
nscale |
live |
0.2 |
0.6 |
32000 |
0.79 |
24 |
Yes |
Yes |
Qwen/QwQ-32B
|
fireworks-ai |
offline |
- |
- |
- |
0.56 |
- |
No |
No |
Qwen/QwQ-32B
|
nebius |
live |
0.5 |
1.5 |
131072 |
0.43 |
87 |
No |
No |
Qwen/QwQ-32B
|
nscale |
live |
0.18 |
0.2 |
131072 |
0.83 |
24 |
Yes |
Yes |
Qwen/QwQ-32B
|
groq |
offline |
- |
- |
- |
- |
- |
- |
- |
Qwen/QwQ-32B
|
hyperbolic |
live |
0.4 |
0.4 |
131072 |
2.18 |
78 |
No |
No |
Qwen/QwQ-32B
|
sambanova |
offline |
- |
- |
- |
0.41 |
- |
- |
- |
nvidia/Llama-3_1-Nemotron-Ultra-253B-v1
|
nebius |
live |
0.6 |
1.8 |
131072 |
0.42 |
38 |
No |
Yes |
marin-community/marin-8b-instruct
|
together |
live |
0.18 |
0.18 |
4096 |
1.50 |
137 |
No |
Yes |
Qwen/Qwen3-235B-A22B-FP8
|
together |
live |
0.2 |
0.6 |
40960 |
0.60 |
56 |
Yes |
Yes |
baidu/ERNIE-4.5-300B-A47B-Base-PT
|
novita |
live |
0.28 |
1.1 |
123000 |
1.23 |
28 |
No |
Yes |
baidu/ERNIE-4.5-21B-A3B-PT
|
novita |
live |
0.07 |
0.28 |
120000 |
1.24 |
77 |
No |
No |
baidu/ERNIE-4.5-VL-424B-A47B-Base-PT
|
novita |
live |
0.42 |
1.25 |
123000 |
2.01 |
37 |
No |
No |
SentientAGI/Dobby-Unhinged-Llama-3.3-70B
|
fireworks-ai |
live |
0.9 |
0.9 |
131072 |
0.44 |
49 |
No |
No |
deepseek-ai/DeepSeek-V3
|
fireworks-ai |
live |
0.9 |
0.9 |
131072 |
1.04 |
79 |
Yes |
No |
deepseek-ai/DeepSeek-V3
|
nebius |
live |
0.5 |
1.5 |
163840 |
0.53 |
21 |
No |
Yes |
deepseek-ai/DeepSeek-V3
|
novita |
live |
0.4 |
1.3 |
64000 |
1.12 |
26 |
Yes |
No |
deepseek-ai/DeepSeek-V3
|
together |
live |
1.25 |
1.25 |
131072 |
0.65 |
56 |
Yes |
Yes |
Qwen/QwQ-32B-Preview
|
fireworks-ai |
offline |
- |
- |
- |
- |
- |
- |
- |
Qwen/QwQ-32B-Preview
|
together |
live |
- |
- |
- |
0.63 |
87 |
Yes |
Yes |
Qwen/QwQ-32B-Preview
|
hyperbolic |
offline |
- |
- |
- |
- |
- |
- |
- |
Qwen/QwQ-32B-Preview
|
sambanova |
offline |
- |
- |
- |
0.35 |
- |
- |
- |
deepseek-ai/DeepSeek-R1-Distill-Llama-70B
|
novita |
live |
0.8 |
0.8 |
32000 |
2.16 |
30 |
No |
Yes |
deepseek-ai/DeepSeek-R1-Distill-Llama-70B
|
nscale |
live |
0.75 |
0.75 |
131072 |
0.63 |
17 |
No |
Yes |
deepseek-ai/DeepSeek-R1-Distill-Llama-70B
|
groq |
live |
0.75 |
0.99 |
131072 |
0.15 |
207 |
Yes |
No |
deepseek-ai/DeepSeek-R1-Distill-Llama-70B
|
sambanova |
live |
0.7 |
1.4 |
131072 |
1.28 |
178 |
No |
No |
deepseek-ai/DeepSeek-R1-Distill-Llama-70B
|
scaleway |
live |
- |
- |
- |
1.01 |
23 |
No |
Yes |
Sao10K/L3-8B-Lunaris-v1
|
novita |
live |
0.05 |
0.05 |
8192 |
0.77 |
70 |
No |
No |
Sao10K/L3-70B-Euryale-v2.1
|
novita |
live |
1.48 |
1.48 |
8192 |
1.00 |
57 |
No |
No |
CohereLabs/c4ai-command-r-08-2024
|
cohere |
live |
- |
- |
- |
0.27 |
52 |
Yes |
No |
google/gemma-2-9b-it
|
nebius |
live |
0.03 |
0.09 |
8192 |
0.35 |
142 |
No |
Yes |
google/gemma-2-9b-it
|
groq |
live |
0.2 |
0.2 |
8192 |
0.31 |
457 |
Yes |
No |
deepcogito/cogito-v2-preview-llama-70B
|
together |
live |
0.88 |
0.88 |
32768 |
0.76 |
53 |
Yes |
Yes |
deepcogito/cogito-v2-preview-llama-109B-MoE
|
together |
live |
0.18 |
0.59 |
32767 |
0.65 |
71 |
Yes |
Yes |
deepcogito/cogito-v2-preview-llama-405B
|
together |
live |
3.5 |
3.5 |
32768 |
0.84 |
26 |
Yes |
Yes |
deepcogito/cogito-v2-preview-deepseek-671B-MoE
|
together |
live |
1.25 |
1.25 |
163840 |
0.27 |
48 |
No |
Yes |
Qwen/Qwen2.5-Coder-7B
|
nebius |
live |
0.03 |
0.09 |
32768 |
0.55 |
191 |
No |
Yes |
arcee-ai/AFM-4.5B
|
together |
live |
0.1 |
0.4 |
65536 |
0.63 |
181 |
No |
Yes |
CohereLabs/c4ai-command-a-03-2025
|
cohere |
live |
- |
- |
- |
0.25 |
57 |
Yes |
No |
mistralai/Mixtral-8x22B-Instruct-v0.1
|
fireworks-ai |
live |
1.2 |
1.2 |
65536 |
0.45 |
68 |
No |
No |
mistralai/Mixtral-8x22B-Instruct-v0.1
|
together |
offline |
- |
- |
- |
- |
- |
- |
- |
mistralai/Mixtral-8x22B-Instruct-v0.1
|
nscale |
live |
1.2 |
1.2 |
65536 |
0.57 |
21 |
No |
Yes |
Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8
|
together |
live |
2 |
2 |
262144 |
1.35 |
46 |
Yes |
Yes |
meta-llama/Llama-3.1-405B-Instruct
|
fireworks-ai |
live |
3 |
3 |
131072 |
0.49 |
64 |
Yes |
No |
meta-llama/Llama-3.1-405B-Instruct
|
nebius |
live |
1 |
3 |
131072 |
0.52 |
32 |
Yes |
Yes |
meta-llama/Llama-3.1-405B-Instruct
|
sambanova |
offline |
- |
- |
- |
0.47 |
112 |
Yes |
Yes |
Qwen/Qwen2.5-Coder-3B-Instruct
|
nscale |
live |
0.01 |
0.03 |
32768 |
0.38 |
78 |
No |
Yes |
tokyotech-llm/Llama-3.3-Swallow-70B-Instruct-v0.4
|
sambanova |
live |
0.6 |
1.2 |
131072 |
2.77 |
134 |
No |
Yes |
CohereLabs/aya-vision-8b
|
cohere |
live |
- |
- |
- |
0.26 |
70 |
No |
No |
CohereLabs/c4ai-command-r7b-arabic-02-2025
|
cohere |
live |
- |
- |
- |
0.27 |
74 |
Yes |
No |
katanemo/Arch-Router-1.5B
|
hf-inference |
live |
- |
- |
- |
0.13 |
75 |
No |
Yes |
CohereLabs/command-a-vision-07-2025
|
cohere |
live |
- |
- |
- |
0.19 |
40 |
No |
No |
alpindale/WizardLM-2-8x22B
|
novita |
live |
0.62 |
0.62 |
65535 |
0.85 |
32 |
No |
No |
CohereLabs/command-a-translate-08-2025
|
cohere |
live |
- |
- |
- |
0.28 |
54 |
Yes |
No |
meta-llama/Meta-Llama-3-70B-Instruct
|
novita |
live |
0.51 |
0.74 |
8192 |
0.88 |
19 |
No |
Yes |
meta-llama/Meta-Llama-3-70B-Instruct
|
together |
offline |
0.88 |
0.88 |
8192 |
0.44 |
95 |
No |
Yes |
meta-llama/Meta-Llama-3-70B-Instruct
|
groq |
offline |
0.59 |
0.79 |
8192 |
0.17 |
296 |
Yes |
No |
meta-llama/Meta-Llama-3-70B-Instruct
|
hyperbolic |
live |
0.4 |
0.4 |
8192 |
0.79 |
95 |
No |
No |
meta-llama/Llama-Guard-4-12B
|
groq |
live |
0.2 |
0.2 |
131072 |
0.23 |
8 |
No |
No |
NousResearch/Hermes-2-Pro-Llama-3-8B
|
novita |
live |
0.14 |
0.14 |
8192 |
0.74 |
92 |
No |
No |
baichuan-inc/Baichuan-M2-32B
|
novita |
live |
0.07 |
0.07 |
131072 |
2.14 |
40 |
No |
Yes |
NousResearch/Hermes-3-Llama-3.1-70B
|
hyperbolic |
live |
0.4 |
0.4 |
12288 |
0.56 |
30 |
No |
No |
CohereLabs/aya-vision-32b
|
cohere |
live |
- |
- |
- |
0.24 |
57 |
No |
No |