| DeepSeek R1 05/28 |
deepseek-r1-0528
|
3.00 |
8.00 |
Provider: Fireworks AI, Context: 160000, Output Limit: 16384
|
|
| DeepSeek V3.1 |
deepseek-v3p1
|
0.56 |
1.68 |
Provider: Fireworks AI, Context: 163840, Output Limit: 163840
|
|
| DeepSeek V3.2 |
deepseek-v3p2
|
0.56 |
1.68 |
Provider: Fireworks AI, Context: 160000, Output Limit: 160000
|
|
| MiniMax-M2 |
minimax-m2
|
0.30 |
1.20 |
Provider: Fireworks AI, Context: 192000, Output Limit: 192000
|
|
| MiniMax-M2.1 |
minimax-m2p1
|
0.30 |
1.20 |
Provider: Fireworks AI, Context: 200000, Output Limit: 200000
|
|
| GLM 4.7 |
glm-4p7
|
0.60 |
2.20 |
Provider: Fireworks AI, Context: 198000, Output Limit: 198000
|
|
| DeepSeek V3 03-24 |
deepseek-v3-0324
|
0.90 |
0.90 |
Provider: Fireworks AI, Context: 160000, Output Limit: 16384
|
|
| GLM 4.6 |
glm-4p6
|
0.55 |
2.19 |
Provider: Fireworks AI, Context: 198000, Output Limit: 198000
|
|
| Kimi K2 Thinking |
kimi-k2-thinking
|
0.60 |
2.50 |
Provider: Fireworks AI, Context: 256000, Output Limit: 256000
|
|
| Kimi K2 Instruct |
kimi-k2-instruct
|
1.00 |
3.00 |
Provider: Fireworks AI, Context: 128000, Output Limit: 16384
|
|
| Qwen3 235B-A22B |
qwen3-235b-a22b
|
0.22 |
0.88 |
Provider: Fireworks AI, Context: 128000, Output Limit: 16384
|
|
| GPT OSS 20B |
gpt-oss-20b
|
0.05 |
0.20 |
Provider: Fireworks AI, Context: 131072, Output Limit: 32768
|
|
| GPT OSS 120B |
gpt-oss-120b
|
0.15 |
0.60 |
Provider: Fireworks AI, Context: 131072, Output Limit: 32768
|
|
| GLM 4.5 Air |
glm-4p5-air
|
0.22 |
0.88 |
Provider: Fireworks AI, Context: 131072, Output Limit: 131072
|
|
| Qwen3 Coder 480B A35B Instruct |
qwen3-coder-480b-a35b-instruct
|
0.45 |
1.80 |
Provider: Fireworks AI, Context: 256000, Output Limit: 32768
|
|
| GLM 4.5 |
glm-4p5
|
0.55 |
2.19 |
Provider: Fireworks AI, Context: 131072, Output Limit: 131072
|
|
| fireworks-ai-4.1b-to-16b |
fireworks-ai-4.1b-to-16b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: N/A
|
|
| fireworks-ai-56b-to-176b |
fireworks-ai-56b-to-176b
|
1.20 |
1.20 |
Source: fireworks_ai, Context: N/A
|
|
| fireworks-ai-above-16b |
fireworks-ai-above-16b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: N/A
|
|
| fireworks-ai-default |
fireworks-ai-default
|
0.00 |
0.00 |
Source: fireworks_ai, Context: N/A
|
|
| fireworks-ai-moe-up-to-56b |
fireworks-ai-moe-up-to-56b
|
0.50 |
0.50 |
Source: fireworks_ai, Context: N/A
|
|
| fireworks-ai-up-to-4b |
fireworks-ai-up-to-4b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: N/A
|
|
| deepseek-coder-v2-instruct |
deepseek-coder-v2-instruct
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 65536
|
|
| deepseek-r1 |
deepseek-r1
|
3.00 |
8.00 |
Source: fireworks_ai, Context: 128000
|
|
| deepseek-r1-basic |
deepseek-r1-basic
|
0.55 |
2.19 |
Source: fireworks_ai, Context: 128000
|
|
| deepseek-v3 |
deepseek-v3
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 128000
|
|
| deepseek-v3p1-terminus |
deepseek-v3p1-terminus
|
0.56 |
1.68 |
Source: fireworks_ai, Context: 128000
|
|
| firefunction-v2 |
firefunction-v2
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 8192
|
|
| kimi-k2-instruct-0905 |
kimi-k2-instruct-0905
|
0.60 |
2.50 |
Source: fireworks_ai, Context: 262144
|
|
| llama-v3p1-405b-instruct |
llama-v3p1-405b-instruct
|
3.00 |
3.00 |
Source: fireworks_ai, Context: 128000
|
|
| llama-v3p1-8b-instruct |
llama-v3p1-8b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 16384
|
|
| llama-v3p2-11b-vision-instruct |
llama-v3p2-11b-vision-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| llama-v3p2-1b-instruct |
llama-v3p2-1b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 16384
|
|
| llama-v3p2-3b-instruct |
llama-v3p2-3b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 16384
|
|
| llama-v3p2-90b-vision-instruct |
llama-v3p2-90b-vision-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| llama4-maverick-instruct-basic |
llama4-maverick-instruct-basic
|
0.22 |
0.88 |
Source: fireworks_ai, Context: 131072
|
|
| llama4-scout-instruct-basic |
llama4-scout-instruct-basic
|
0.15 |
0.60 |
Source: fireworks_ai, Context: 131072
|
|
| mixtral-8x22b-instruct-hf |
mixtral-8x22b-instruct-hf
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 65536
|
|
| qwen2-72b-instruct |
qwen2-72b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-32b-instruct |
qwen2p5-coder-32b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| yi-large |
yi-large
|
3.00 |
3.00 |
Source: fireworks_ai, Context: 32768
|
|
| flux-kontext-pro |
flux-kontext-pro
|
0.04 |
0.04 |
Source: fireworks_ai, Context: 4096
|
|
| SSD-1B |
ssd-1b
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| chronos-hermes-13b-v2 |
chronos-hermes-13b-v2
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| code-llama-13b |
code-llama-13b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| code-llama-13b-instruct |
code-llama-13b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| code-llama-13b-python |
code-llama-13b-python
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| code-llama-34b |
code-llama-34b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| code-llama-34b-instruct |
code-llama-34b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| code-llama-34b-python |
code-llama-34b-python
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| code-llama-70b |
code-llama-70b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| code-llama-70b-instruct |
code-llama-70b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| code-llama-70b-python |
code-llama-70b-python
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| code-llama-7b |
code-llama-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| code-llama-7b-instruct |
code-llama-7b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| code-llama-7b-python |
code-llama-7b-python
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| code-qwen-1p5-7b |
code-qwen-1p5-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 65536
|
|
| codegemma-2b |
codegemma-2b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 8192
|
|
| codegemma-7b |
codegemma-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| cogito-671b-v2-p1 |
cogito-671b-v2-p1
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 163840
|
|
| cogito-v1-preview-llama-3b |
cogito-v1-preview-llama-3b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 131072
|
|
| cogito-v1-preview-llama-70b |
cogito-v1-preview-llama-70b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| cogito-v1-preview-llama-8b |
cogito-v1-preview-llama-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| cogito-v1-preview-qwen-14b |
cogito-v1-preview-qwen-14b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| cogito-v1-preview-qwen-32b |
cogito-v1-preview-qwen-32b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| flux-kontext-max |
flux-kontext-max
|
0.08 |
0.08 |
Source: fireworks_ai, Context: 4096
|
|
| dbrx-instruct |
dbrx-instruct
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 32768
|
|
| deepseek-coder-1b-base |
deepseek-coder-1b-base
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 16384
|
|
| deepseek-coder-33b-instruct |
deepseek-coder-33b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| deepseek-coder-7b-base |
deepseek-coder-7b-base
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| deepseek-coder-7b-base-v1p5 |
deepseek-coder-7b-base-v1p5
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| deepseek-coder-7b-instruct-v1p5 |
deepseek-coder-7b-instruct-v1p5
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| deepseek-coder-v2-lite-base |
deepseek-coder-v2-lite-base
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 163840
|
|
| deepseek-coder-v2-lite-instruct |
deepseek-coder-v2-lite-instruct
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 163840
|
|
| deepseek-prover-v2 |
deepseek-prover-v2
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 163840
|
|
| deepseek-r1-0528-distill-qwen3-8b |
deepseek-r1-0528-distill-qwen3-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| deepseek-r1-distill-llama-70b |
deepseek-r1-distill-llama-70b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| deepseek-r1-distill-llama-8b |
deepseek-r1-distill-llama-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| deepseek-r1-distill-qwen-14b |
deepseek-r1-distill-qwen-14b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| deepseek-r1-distill-qwen-1p5b |
deepseek-r1-distill-qwen-1p5b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 131072
|
|
| deepseek-r1-distill-qwen-32b |
deepseek-r1-distill-qwen-32b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| deepseek-r1-distill-qwen-7b |
deepseek-r1-distill-qwen-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| deepseek-v2-lite-chat |
deepseek-v2-lite-chat
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 163840
|
|
| deepseek-v2p5 |
deepseek-v2p5
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 32768
|
|
| devstral-small-2505 |
devstral-small-2505
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| dobby-mini-unhinged-plus-llama-3-1-8b |
dobby-mini-unhinged-plus-llama-3-1-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| dobby-unhinged-llama-3-3-70b-new |
dobby-unhinged-llama-3-3-70b-new
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| dolphin-2-9-2-qwen2-72b |
dolphin-2-9-2-qwen2-72b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| dolphin-2p6-mixtral-8x7b |
dolphin-2p6-mixtral-8x7b
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 32768
|
|
| ernie-4p5-21b-a3b-pt |
ernie-4p5-21b-a3b-pt
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| ernie-4p5-300b-a47b-pt |
ernie-4p5-300b-a47b-pt
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| fare-20b |
fare-20b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| firefunction-v1 |
firefunction-v1
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 32768
|
|
| firellava-13b |
firellava-13b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| firesearch-ocr-v6 |
firesearch-ocr-v6
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| fireworks-asr-large |
fireworks-asr-large
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| fireworks-asr-v2 |
fireworks-asr-v2
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| flux-1-dev |
flux-1-dev
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| flux-1-dev-controlnet-union |
flux-1-dev-controlnet-union
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| flux-1-dev-fp8 |
flux-1-dev-fp8
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| flux-1-schnell |
flux-1-schnell
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| flux-1-schnell-fp8 |
flux-1-schnell-fp8
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| gemma-2b-it |
gemma-2b-it
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 8192
|
|
| gemma-3-27b-it |
gemma-3-27b-it
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| gemma-7b |
gemma-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| gemma-7b-it |
gemma-7b-it
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| gemma2-9b-it |
gemma2-9b-it
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| glm-4p5v |
glm-4p5v
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 131072
|
|
| gpt-oss-safeguard-120b |
gpt-oss-safeguard-120b
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 131072
|
|
| gpt-oss-safeguard-20b |
gpt-oss-safeguard-20b
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 131072
|
|
| hermes-2-pro-mistral-7b |
hermes-2-pro-mistral-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| internvl3-38b |
internvl3-38b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| internvl3-78b |
internvl3-78b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| internvl3-8b |
internvl3-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| japanese-stable-diffusion-xl |
japanese-stable-diffusion-xl
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| kat-coder |
kat-coder
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 262144
|
|
| kat-dev-32b |
kat-dev-32b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| kat-dev-72b-exp |
kat-dev-72b-exp
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| llama-guard-2-8b |
llama-guard-2-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| llama-guard-3-1b |
llama-guard-3-1b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 131072
|
|
| llama-guard-3-8b |
llama-guard-3-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| llama-v2-13b |
llama-v2-13b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| llama-v2-13b-chat |
llama-v2-13b-chat
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| llama-v2-70b |
llama-v2-70b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| llama-v2-70b-chat |
llama-v2-70b-chat
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 2048
|
|
| llama-v2-7b |
llama-v2-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| llama-v2-7b-chat |
llama-v2-7b-chat
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| llama-v3-70b-instruct |
llama-v3-70b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 8192
|
|
| llama-v3-70b-instruct-hf |
llama-v3-70b-instruct-hf
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 8192
|
|
| llama-v3-8b |
llama-v3-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| llama-v3-8b-instruct-hf |
llama-v3-8b-instruct-hf
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| llama-v3p1-405b-instruct-long |
llama-v3p1-405b-instruct-long
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| llama-v3p1-70b-instruct |
llama-v3p1-70b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| llama-v3p1-70b-instruct-1b |
llama-v3p1-70b-instruct-1b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| llama-v3p1-nemotron-70b-instruct |
llama-v3p1-nemotron-70b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| llama-v3p2-1b |
llama-v3p2-1b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 131072
|
|
| llama-v3p2-3b |
llama-v3p2-3b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 131072
|
|
| llama-v3p3-70b-instruct |
llama-v3p3-70b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| llamaguard-7b |
llamaguard-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| llava-yi-34b |
llava-yi-34b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| minimax-m1-80k |
minimax-m1-80k
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| ministral-3-14b-instruct-2512 |
ministral-3-14b-instruct-2512
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 256000
|
|
| ministral-3-3b-instruct-2512 |
ministral-3-3b-instruct-2512
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 256000
|
|
| ministral-3-8b-instruct-2512 |
ministral-3-8b-instruct-2512
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 256000
|
|
| mistral-7b |
mistral-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| mistral-7b-instruct-4k |
mistral-7b-instruct-4k
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| mistral-7b-instruct-v0p2 |
mistral-7b-instruct-v0p2
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| mistral-7b-instruct-v3 |
mistral-7b-instruct-v3
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| mistral-7b-v0p2 |
mistral-7b-v0p2
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| mistral-large-3-fp8 |
mistral-large-3-fp8
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 256000
|
|
| mistral-nemo-base-2407 |
mistral-nemo-base-2407
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 128000
|
|
| mistral-nemo-instruct-2407 |
mistral-nemo-instruct-2407
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 128000
|
|
| mistral-small-24b-instruct-2501 |
mistral-small-24b-instruct-2501
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| mixtral-8x22b |
mixtral-8x22b
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 65536
|
|
| mixtral-8x22b-instruct |
mixtral-8x22b-instruct
|
1.20 |
1.20 |
Source: fireworks_ai, Context: 65536
|
|
| mixtral-8x7b |
mixtral-8x7b
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 32768
|
|
| mixtral-8x7b-instruct |
mixtral-8x7b-instruct
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 32768
|
|
| mixtral-8x7b-instruct-hf |
mixtral-8x7b-instruct-hf
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 32768
|
|
| mythomax-l2-13b |
mythomax-l2-13b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| nemotron-nano-v2-12b-vl |
nemotron-nano-v2-12b-vl
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| nous-capybara-7b-v1p9 |
nous-capybara-7b-v1p9
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| nous-hermes-2-mixtral-8x7b-dpo |
nous-hermes-2-mixtral-8x7b-dpo
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 32768
|
|
| nous-hermes-2-yi-34b |
nous-hermes-2-yi-34b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| nous-hermes-llama2-13b |
nous-hermes-llama2-13b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| nous-hermes-llama2-70b |
nous-hermes-llama2-70b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| nous-hermes-llama2-7b |
nous-hermes-llama2-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| nvidia-nemotron-nano-12b-v2 |
nvidia-nemotron-nano-12b-v2
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| nvidia-nemotron-nano-9b-v2 |
nvidia-nemotron-nano-9b-v2
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| openchat-3p5-0106-7b |
openchat-3p5-0106-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| openhermes-2-mistral-7b |
openhermes-2-mistral-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| openhermes-2p5-mistral-7b |
openhermes-2p5-mistral-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| openorca-7b |
openorca-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| phi-2-3b |
phi-2-3b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 2048
|
|
| phi-3-mini-128k-instruct |
phi-3-mini-128k-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 131072
|
|
| phi-3-vision-128k-instruct |
phi-3-vision-128k-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32064
|
|
| phind-code-llama-34b-python-v1 |
phind-code-llama-34b-python-v1
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| phind-code-llama-34b-v1 |
phind-code-llama-34b-v1
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| phind-code-llama-34b-v2 |
phind-code-llama-34b-v2
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 16384
|
|
| playground-v2-1024px-aesthetic |
playground-v2-1024px-aesthetic
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| playground-v2-5-1024px-aesthetic |
playground-v2-5-1024px-aesthetic
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| pythia-12b |
pythia-12b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 2048
|
|
| qwen-qwq-32b-preview |
qwen-qwq-32b-preview
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| qwen-v2p5-14b-instruct |
qwen-v2p5-14b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| qwen-v2p5-7b |
qwen-v2p5-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| qwen1p5-72b-chat |
qwen1p5-72b-chat
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2-7b-instruct |
qwen2-7b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2-vl-2b-instruct |
qwen2-vl-2b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2-vl-72b-instruct |
qwen2-vl-72b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2-vl-7b-instruct |
qwen2-vl-7b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-0p5b-instruct |
qwen2p5-0p5b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-14b |
qwen2p5-14b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 131072
|
|
| qwen2p5-1p5b-instruct |
qwen2p5-1p5b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-32b |
qwen2p5-32b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| qwen2p5-32b-instruct |
qwen2p5-32b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-72b |
qwen2p5-72b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| qwen2p5-72b-instruct |
qwen2p5-72b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-7b-instruct |
qwen2p5-7b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-0p5b |
qwen2p5-coder-0p5b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-0p5b-instruct |
qwen2p5-coder-0p5b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-14b |
qwen2p5-coder-14b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-14b-instruct |
qwen2p5-coder-14b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-1p5b |
qwen2p5-coder-1p5b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-1p5b-instruct |
qwen2p5-coder-1p5b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-32b |
qwen2p5-coder-32b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-32b-instruct-128k |
qwen2p5-coder-32b-instruct-128k
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| qwen2p5-coder-32b-instruct-32k-rope |
qwen2p5-coder-32b-instruct-32k-rope
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-32b-instruct-64k |
qwen2p5-coder-32b-instruct-64k
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 65536
|
|
| qwen2p5-coder-3b |
qwen2p5-coder-3b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-3b-instruct |
qwen2p5-coder-3b-instruct
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-7b |
qwen2p5-coder-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-coder-7b-instruct |
qwen2p5-coder-7b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| qwen2p5-math-72b-instruct |
qwen2p5-math-72b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| qwen2p5-vl-32b-instruct |
qwen2p5-vl-32b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 128000
|
|
| qwen2p5-vl-3b-instruct |
qwen2p5-vl-3b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 128000
|
|
| qwen2p5-vl-72b-instruct |
qwen2p5-vl-72b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 128000
|
|
| qwen2p5-vl-7b-instruct |
qwen2p5-vl-7b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 128000
|
|
| qwen3-0p6b |
qwen3-0p6b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-14b |
qwen3-14b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-1p7b |
qwen3-1p7b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 131072
|
|
| qwen3-1p7b-fp8-draft |
qwen3-1p7b-fp8-draft
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-1p7b-fp8-draft-131072 |
qwen3-1p7b-fp8-draft-131072
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 131072
|
|
| qwen3-1p7b-fp8-draft-40960 |
qwen3-1p7b-fp8-draft-40960
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-235b-a22b-instruct-2507 |
qwen3-235b-a22b-instruct-2507
|
0.22 |
0.88 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-235b-a22b-thinking-2507 |
qwen3-235b-a22b-thinking-2507
|
0.22 |
0.88 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-30b-a3b |
qwen3-30b-a3b
|
0.15 |
0.60 |
Source: fireworks_ai, Context: 131072
|
|
| qwen3-30b-a3b-instruct-2507 |
qwen3-30b-a3b-instruct-2507
|
0.50 |
0.50 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-30b-a3b-thinking-2507 |
qwen3-30b-a3b-thinking-2507
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-32b |
qwen3-32b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| qwen3-4b |
qwen3-4b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-4b-instruct-2507 |
qwen3-4b-instruct-2507
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-8b |
qwen3-8b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-coder-30b-a3b-instruct |
qwen3-coder-30b-a3b-instruct
|
0.15 |
0.60 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-coder-480b-instruct-bf16 |
qwen3-coder-480b-instruct-bf16
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| qwen3-embedding-0p6b |
qwen3-embedding-0p6b
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 32768
|
|
| qwen3-embedding-4b |
qwen3-embedding-4b
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-embedding-8b |
qwen3-embedding-8b
|
0.10 |
0.00 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-next-80b-a3b-instruct |
qwen3-next-80b-a3b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| qwen3-next-80b-a3b-thinking |
qwen3-next-80b-a3b-thinking
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| qwen3-reranker-0p6b |
qwen3-reranker-0p6b
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-reranker-4b |
qwen3-reranker-4b
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-reranker-8b |
qwen3-reranker-8b
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 40960
|
|
| qwen3-vl-235b-a22b-instruct |
qwen3-vl-235b-a22b-instruct
|
0.22 |
0.88 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-vl-235b-a22b-thinking |
qwen3-vl-235b-a22b-thinking
|
0.22 |
0.88 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-vl-30b-a3b-instruct |
qwen3-vl-30b-a3b-instruct
|
0.15 |
0.60 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-vl-30b-a3b-thinking |
qwen3-vl-30b-a3b-thinking
|
0.15 |
0.60 |
Source: fireworks_ai, Context: 262144
|
|
| qwen3-vl-32b-instruct |
qwen3-vl-32b-instruct
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| qwen3-vl-8b-instruct |
qwen3-vl-8b-instruct
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| qwq-32b |
qwq-32b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 131072
|
|
| rolm-ocr |
rolm-ocr
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 128000
|
|
| snorkel-mistral-7b-pairrm-dpo |
snorkel-mistral-7b-pairrm-dpo
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| stable-diffusion-xl-1024-v1-0 |
stable-diffusion-xl-1024-v1-0
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| stablecode-3b |
stablecode-3b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 4096
|
|
| starcoder-16b |
starcoder-16b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| starcoder-7b |
starcoder-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 8192
|
|
| starcoder2-15b |
starcoder2-15b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| starcoder2-3b |
starcoder2-3b
|
0.10 |
0.10 |
Source: fireworks_ai, Context: 16384
|
|
| starcoder2-7b |
starcoder2-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 16384
|
|
| toppy-m-7b |
toppy-m-7b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|
| whisper-v3 |
whisper-v3
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| whisper-v3-turbo |
whisper-v3-turbo
|
0.00 |
0.00 |
Source: fireworks_ai, Context: 4096
|
|
| yi-34b |
yi-34b
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| yi-34b-200k-capybara |
yi-34b-200k-capybara
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 200000
|
|
| yi-34b-chat |
yi-34b-chat
|
0.90 |
0.90 |
Source: fireworks_ai, Context: 4096
|
|
| yi-6b |
yi-6b
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 4096
|
|
| zephyr-7b-beta |
zephyr-7b-beta
|
0.20 |
0.20 |
Source: fireworks_ai, Context: 32768
|
|