Discover and compare the latest prices for Large Language Model (LLM) APIs from top providers like OpenAI GPT-4, Anthropic Claude, Google Gemini, Meta Llama 3, and others.
Model | Provider | Context | Input | Output | Date |
---|---|---|---|---|---|
claude-2.0 | Anthropic | 100K | $8 | $24 | 01/06/2024 |
claude-2.0/2.1 | AWS | | $8.00 | $24.00 | 01/06/2024 |
claude-2.1 | Anthropic | 200K | $8 | $24 | 01/06/2024 |
claude-3.5-sonnet | AWS | | $3.00 | $15.00 | 01/06/2024 |
claude-3.5-sonnet | | | $3.00 | $15.00 | 01/06/2024 |
claude-3-haiku | Anthropic | 200K | $0.25 | $1.25 | 01/06/2024 |
claude-3-haiku | AWS | 32K | $0.25 | $1.25 | 01/06/2024 |
claude-3-haiku | | | $0.25 | $1.25 | 01/06/2024 |
claude-3-opus | Anthropic | 200K | $15 | $75 | 01/08/2023 |
claude-3-opus | AWS | | $15.00 | $75.00 | 01/08/2023 |
claude-3-opus | | | $15.00 | $75.00 | 01/06/2024 |
claude-3-sonnet | Anthropic | 200K | $3 | $15 | 01/06/2024 |
claude-3-sonnet | AWS | 32K | $3 | $15 | 01/06/2024 |
claude-3-sonnet | | | $3.00 | $15.00 | 01/06/2024 |
claude-instant | AWS | 32K | $0.80 | $2.40 | 01/06/2024 |
claude-instant-1.2 | Anthropic | 100K | $0.80 | $2.40 | 01/06/2024 |
codestral | Mistral | | $0.20 | $0.60 | 01/06/2024 |
codestral-2405 | Mistral | | $0.90 | $2.80 | 01/06/2024 |
codestral-mamba-latest | Mistral | | $0.20 | $0.20 | 01/06/2024 |
codey-for-code-chat | | | $0.25 | $0.50 | 01/06/2024 |
codey-for-code-chat-32k | | | $0.25 | $0.50 | 01/06/2024 |
codey-for-code-generation-32k | | | $0.25 | $0.50 | 01/06/2024 |
command | AWS | 32K | $1.50 | $2 | 01/06/2024 |
command | Cohere | 4K | $0.30 | $0.60 | 01/06/2024 |
command-light | AWS | 32K | $0.30 | $0.60 | 01/06/2024 |
command-light | Cohere | | $0.30 | $0.60 | 01/06/2024 |
command-light-fine-tuned | Cohere | | $0.30 | $0.60 | 01/06/2024 |
command-r | AWS | | $0.50 | $1.50 | 01/06/2024 |
command-r | Cohere | 4K | $0.50 | $1.50 | 01/03/2024 |
command-r+ | AWS | | $3.00 | $15.00 | 01/03/2024 |
command-r-fine-tuned-model | Cohere | | $0.30 | $1.20 | 01/06/2024 |
command-r-new | Cohere | | $0.15 | $0.60 | 01/06/2024 |
command-r-plus | Cohere | 128K | $3 | $15 | 01/06/2024 |
deepseek-v2 | DeepSeek | 32K | $0.14 | $0.28 | 01/06/2024 |
embed-3 | Cohere | | $0.10 | $0.00 | 01/06/2024 |
fine-tuned-command-light | Cohere | | $0.30 | $0.60 | 01/06/2024 |
gemini-1.5-pro | | 1M | $3.50 | $10.50 | 01/06/2024 |
gemini-flash-1.5 | | 2.8M | $0.08 | $0.30 | 01/06/2024 |
gemini-pro | | 32K | $0.50 | $1.50 | 01/04/2023 |
gemma-7b | Groq | 8K | $0.10 | $0.10 | 01/04/2023 |
gemma-7b-it | Deepinfra | 8K | $0.07 | $0.07 | 01/04/2023 |
gpt-3.5-turbo-0125 | OpenAI | 16K | $0.50 | $1.50 | 01/06/2024 |
gpt-3.5-turbo-0301 | OpenAI | 4K | $1.50 | $2 | 01/02/2024 |
gpt-3.5-turbo-0613 | Azure | | $30.00 | $40.00 | 01/09/2021 |
gpt-3.5-turbo-0613 | OpenAI | 4K | $1.50 | $2 | 01/09/2021 |
gpt-3.5-turbo-1106 | OpenAI | 4K | $1 | $2 | 01/09/2021 |
gpt-3.5-turbo-16k-0613 | OpenAI | 4K | $3 | $4 | 01/09/2021 |
gpt-3.5-turbo-instruct | OpenAI | 4K | $1.50 | $2 | 01/09/2021 |
gpt-4 | OpenAI | 8K | $30 | $60 | 01/09/2021 |
gpt-4-0125-preview | OpenAI | 128K | $10 | $30 | 01/09/2021 |
gpt-4-1106-preview | OpenAI | 128K | $10 | $30 | 01/12/2023 |
gpt-4-1106-vision-preview | OpenAI | | $1.00 | $3.00 | 01/04/2023 |
gpt-4-32k | OpenAI | 32K | $60 | $120 | 01/09/2021 |
gpt-4o | OpenAI | 128K | $5 | $15 | 01/12/2023 |
gpt-4o-2024-05-13 | OpenAI | 128K | $5 | $15 | 01/04/2023 |
gpt-4o-2024-08-06 | OpenAI | 128K | $2.50 | $10 | 01/10/2023 |
gpt-4o-mini | OpenAI | 128K | $0.15 | $0.60 | 01/10/2023 |
gpt-4-turbo-1106-preview | Azure | | $10.00 | $30.00 | 01/10/2023 |
gpt-4-turbo-2024-04-09 | OpenAI | | $10.00 | $30.00 | 01/10/2023 |
gpt-4-turbo-2024-04-09 | OpenAI | 128K | $10 | $30 | 01/06/2024 |
gpt-4-vision-preview | OpenAI | 128K | $10 | $30 | 01/06/2024 |
imagen | | | $20.00 | $20.00 | 01/06/2024 |
imagen-image-editing | | | $20.00 | $20.00 | 01/06/2024 |
imagen-image-generation | | | $20.00 | $20.00 | 01/06/2024 |
imagen-upscaling | | | $3.00 | $3.00 | 01/06/2024 |
imagen-visual-captioning | | | $1.50 | $1.50 | 01/06/2024 |
imagen-visual-q&a | | | $1.50 | $1.50 | 01/06/2024 |
jamba-1.5-large | AWS | | $2.00 | $8.00 | 01/06/2024 |
jamba-1.5-mini | AWS | | $0.20 | $0.40 | 01/06/2024 |
jamba-instruct | AWS | | $0.50 | $0.70 | 01/06/2024 |
jurassic-2-mid | AWS | | $12.50 | $12.50 | 01/06/2024 |
jurassic-2-mid | AWS | 32K | $12.50 | $12.50 | 01/06/2024 |
jurassic-2-ultra | AWS | | $18.80 | $18.80 | 01/12/2023 |
jurassic-2-ultra | AWS | 32K | $18.80 | $18.80 | 01/06/2024 |
llama-2-13b | Replicate | 4K | $0.10 | $0.50 | 01/12/2023 |
llama-2-70b | Groq | 4K | $0.64 | $0.80 | 01/06/2024 |
llama-2-70b | Replicate | 4K | $0.65 | $2.75 | 01/06/2024 |
llama-2-7b | Groq | 2K | $0.10 | $0.10 | 01/06/2024 |
llama-2-7b | Replicate | 4K | $0.05 | $0.25 | 01/06/2024 |
llama-2-7b-chat-fp16 | Cloudflare | 3K | $0.56 | $6.66 | 01/06/2024 |
llama-2-7b-chat-int8 | Cloudflare | 2K | $0.16 | $0.24 | 01/06/2024 |
llama-2-chat-13b | AWS | 32K | $0.75 | $1 | 01/12/2023 |
llama-2-chat-70b | AWS | 32K | $1.95 | $2.56 | 01/06/2024 |
llama-3.1-405b-instruct | Fireworks | 128K | $3 | $3 | 01/06/2024 |
llama-3.1-70b-instruct | Deepinfra | 128K | $0.52 | $0.75 | 01/06/2024 |
llama-3.1-8b-instruct | Deepinfra | 128K | $0.09 | $0.09 | 01/06/2024 |
llama-3-70b | Groq | 8K | $0.59 | $0.79 | 01/06/2024 |
llama-3-70b-instruct | Deepinfra | 8K | $0.59 | $0.79 | 01/06/2024 |
llama-3-8b | Groq | 8K | $0.05 | $0.10 | 01/06/2024 |
llama-3-8b-instruct | Deepinfra | 8K | $0.08 | $0.08 | 01/06/2024 |
llama-3-instruct-70b | AWS | | $2.65 | $3.50 | 01/12/2023 |
llama-3-instruct-8b | AWS | | $0.40 | $0.60 | 01/06/2024 |
llama-3-soliloquy-8b | Lynn | 24K | $0.10 | $0.10 | 01/06/2024 |
meta-llama-3-70b-instruct | Replicate | 8K | $0.65 | $2.75 | 01/06/2024 |
meta-llama-3-8b-instruct | Replicate | 8K | $0.05 | $0.25 | 01/06/2024 |
ministral-3b-24.10 | Mistral | | $0.04 | $0.04 | 01/06/2024 |
ministral-8b-24.10 | Mistral | | $0.10 | $0.10 | 01/06/2024 |
mistral-7b | AWS | 32K | $0.15 | $0.20 | 01/06/2024 |
mistral-7b | Mistral | 32K | $0.25 | $0.25 | 01/06/2024 |
mistral-7b-instruct | Cloudflare | 32K | $0.11 | $0.19 | 01/06/2024 |
mistral-7b-instruct-v0.2 | Replicate | 32K | $0.05 | $0.25 | 01/06/2024 |
mistral-7b-v0.1 | Replicate | 32K | $0.05 | $0.25 | 01/06/2024 |
mistral-8x7b | AWS | 32K | $0.45 | $0.70 | 01/06/2024 |
mistral-large | AWS | | $8.00 | $24.00 | 01/06/2024 |
mistral-large | Mistral | 32K | $8 | $24 | 01/06/2024 |
mistral-large-2 | Mistral | | $2.00 | $6.00 | 01/06/2024 |
mistral-large-2402 | Mistral | | $3.80 | $11.30 | 01/06/2024 |
mistral-medium | Mistral | 32K | $2.00 | $8.00 | 01/06/2024 |
mistral-medium-2312 | Mistral | | $2.50 | $7.50 | 01/06/2024 |
mistral-small | Mistral | 32K | $1 | $3 | 01/06/2024 |
mistral-small-24.09 | Mistral | | $0.20 | $0.60 | 01/06/2024 |
mistral-small-2402 | Mistral | | $0.90 | $2.80 | 01/06/2024 |
mixtral-8x7b | AWS | | $0.45 | $0.70 | 01/06/2024 |
mixtral-8x7b | Groq | 32K | $0.27 | $0.27 | 01/06/2024 |
mixtral-8x7b | Mistral | 32K | $0.70 | $0.70 | 01/06/2024 |
mixtral-8x7b-instruct-v0.1 | Replicate | 32K | $0.30 | $1 | 01/06/2024 |
openchat-7b | OpenChat | 8K | $0.13 | $0.13 | 01/06/2024 |
open-mistral-7b | Mistral | | $0.20 | $0.20 | 01/06/2024 |
open-mistral-nemo-2407 | Mistral | | $0.27 | $0.27 | 01/06/2024 |
open-mixtral-8x22b | Mistral | | $1.90 | $5.60 | 01/06/2024 |
open-mixtral-8x7b | Mistral | | $0.65 | $0.65 | 01/06/2024 |
palm-2-for-chat-32k-chat-bison-32k | | | $0.25 | $0.50 | 01/06/2024 |
palm-2-for-chat-chat-bison | | | $0.25 | $0.50 | 01/06/2024 |
palm-2-for-text-32k-text-bison-32k | | | $0.25 | $0.50 | 01/06/2024 |
palm-2-for-text-text-bison | | | $0.25 | $0.50 | 01/06/2024 |
palm-2-for-text-text-unicorn | | | $2.50 | $7.50 | 01/06/2024 |
pplx-70b-online | Perplexity | 4K | $1 | $1 | 01/06/2024 |
pplx-7b-online | Perplexity | 4K | $0.20 | $0.20 | 01/06/2024 |
rerank-3 | Cohere | | $2.00 | $2.00 | 01/06/2024 |
titan-text-express | AWS | 32K | $0.80 | $1.60 | 01/06/2024 |
titan-text-lite | AWS | 32K | $0.30 | $0.40 | 01/06/2024 |
visual-captioning | | | $1.50 | $1.50 | 01/06/2024 |
visual-q&a | | | $1.50 | $1.50 | 01/06/2024 |