diff --git a/README.md b/README.md index 5261f6c..4939572 100644 --- a/README.md +++ b/README.md @@ -117,7 +117,489 @@ Units denominated in USD. All prices can be located in `model_prices.json`. * Prices last updated Jan 30, 2024 from [LiteLLM's cost dictionary](https://github.com/BerriAI/litellm/blob/main/model_prices_and_context_window.json) -| Model Name | Prompt Cost (USD) per 1M tokens | Completion Cost (USD) per 1M tokens | Max Prompt Tokens | Max Output Tokens | +| Model Name | Prompt Cost (USD) per 1M tokens | Completion Cost (USD) per 1M tokens | Max Prompt Tokens | Max Output Tokens | +|:----------------------------------------------------------------------|:----------------------------------|:--------------------------------------|:--------------------|--------------------:| +| gpt-4 | $30.00 | $60.00 | 8,192 | 4096 | +| gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | +| gpt-4o-mini | $0.15 | $0.6 | 128,000 | 4096 | +| gpt-4o-mini-2024-07-18 | $0.15 | $0.6 | 128,000 | 4096 | +| gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | +| gpt-4-turbo-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-0314 | $30.00 | $60.00 | 8,192 | 4096 | +| gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | +| gpt-4-32k | $60.00 | $120.00 | 32,768 | 4096 | +| gpt-4-32k-0314 | $60.00 | $120.00 | 32,768 | 4096 | +| gpt-4-32k-0613 | $60.00 | $120.00 | 32,768 | 4096 | +| gpt-4-turbo | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-turbo-2024-04-09 | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-1106-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-0125-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-1106-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-3.5-turbo | $1.5 | $ 2.00 | 16,385 | 4096 | +| gpt-3.5-turbo-0301 | $1.5 | $ 2.00 | 4,097 | 4096 | +| gpt-3.5-turbo-0613 | $1.5 | $ 2.00 | 4,097 | 4096 | +| gpt-3.5-turbo-1106 | $ 1.00 | $ 2.00 | 16,385 | 4096 | +| gpt-3.5-turbo-0125 | $0.5 | $1.5 | 16,385 | 4096 | +| gpt-3.5-turbo-16k | $ 3.00 | $ 4.00 | 16,385 | 4096 | +| gpt-3.5-turbo-16k-0613 | $ 3.00 | $ 4.00 | 16,385 | 4096 | +| ft:gpt-3.5-turbo | $ 3.00 | $ 6.00 | 4,097 | 4096 | +| ft:gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | +| ft:gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | +| ft:davinci-002 | $ 2.00 | $ 2.00 | 16,384 | 4096 | +| ft:babbage-002 | $0.4 | $0.4 | 16,384 | 4096 | +| text-embedding-3-large | $0.13 | $ 0.00 | 8,191 | nan | +| text-embedding-3-small | $0.02 | $ 0.00 | 8,191 | nan | +| text-embedding-ada-002 | $0.1 | $ 0.00 | 8,191 | nan | +| text-embedding-ada-002-v2 | $0.1 | $ 0.00 | 8,191 | nan | +| text-moderation-stable | $ 0.00 | $ 0.00 | 32,768 | 0 | +| text-moderation-007 | $ 0.00 | $ 0.00 | 32,768 | 0 | +| text-moderation-latest | $ 0.00 | $ 0.00 | 32,768 | 0 | +| 256-x-256/dall-e-2 | -- | -- | nan | nan | +| 512-x-512/dall-e-2 | -- | -- | nan | nan | +| 1024-x-1024/dall-e-2 | -- | -- | nan | nan | +| hd/1024-x-1792/dall-e-3 | -- | -- | nan | nan | +| hd/1792-x-1024/dall-e-3 | -- | -- | nan | nan | +| hd/1024-x-1024/dall-e-3 | -- | -- | nan | nan | +| standard/1024-x-1792/dall-e-3 | -- | -- | nan | nan | +| standard/1792-x-1024/dall-e-3 | -- | -- | nan | nan | +| standard/1024-x-1024/dall-e-3 | -- | -- | nan | nan | +| whisper-1 | -- | -- | nan | nan | +| tts-1 | -- | -- | nan | nan | +| tts-1-hd | -- | -- | nan | nan | +| azure/tts-1 | -- | -- | nan | nan | +| azure/tts-1-hd | -- | -- | nan | nan | +| azure/whisper-1 | -- | -- | nan | nan | +| azure/gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | +| azure/gpt-4-turbo-2024-04-09 | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-4-0125-preview | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-4-1106-preview | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | +| azure/gpt-4-32k-0613 | $60.00 | $120.00 | 32,768 | 4096 | +| azure/gpt-4-32k | $60.00 | $120.00 | 32,768 | 4096 | +| azure/gpt-4 | $30.00 | $60.00 | 8,192 | 4096 | +| azure/gpt-4-turbo | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-4-turbo-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-35-turbo-16k-0613 | $ 3.00 | $ 4.00 | 16,385 | 4096 | +| azure/gpt-35-turbo-1106 | $ 1.00 | $ 2.00 | 16,384 | 4096 | +| azure/gpt-35-turbo-0125 | $0.5 | $1.5 | 16,384 | 4096 | +| azure/gpt-35-turbo-16k | $ 3.00 | $ 4.00 | 16,385 | 4096 | +| azure/gpt-35-turbo | $0.5 | $1.5 | 4,097 | 4096 | +| azure/gpt-3.5-turbo-instruct-0914 | $1.5 | $ 2.00 | 4,097 | nan | +| azure/gpt-35-turbo-instruct | $1.5 | $ 2.00 | 4,097 | nan | +| azure/mistral-large-latest | $ 8.00 | $24.00 | 32,000 | nan | +| azure/mistral-large-2402 | $ 8.00 | $24.00 | 32,000 | nan | +| azure/command-r-plus | $ 3.00 | $15.00 | 128,000 | 4096 | +| azure/ada | $0.1 | $ 0.00 | 8,191 | nan | +| azure/text-embedding-ada-002 | $0.1 | $ 0.00 | 8,191 | nan | +| azure/text-embedding-3-large | $0.13 | $ 0.00 | 8,191 | nan | +| azure/text-embedding-3-small | $0.02 | $ 0.00 | 8,191 | nan | +| azure/standard/1024-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/hd/1024-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/standard/1024-x-1792/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/standard/1792-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/hd/1024-x-1792/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/hd/1792-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/standard/1024-x-1024/dall-e-2 | -- | $ 0.00 | nan | nan | +| azure_ai/jamba-instruct | $0.5 | $0.7 | 70,000 | 4096 | +| azure_ai/mistral-large | $ 4.00 | $12.00 | 32,000 | 8191 | +| azure_ai/mistral-small | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| azure_ai/Meta-Llama-3-70B-Instruct | $1.1 | $0.37 | 8,192 | 8192 | +| azure_ai/Meta-Llama-31-8B-Instruct | $0.3 | $0.61 | 128,000 | 128000 | +| azure_ai/Meta-Llama-31-70B-Instruct | $2.68 | $3.54 | 128,000 | 128000 | +| azure_ai/Meta-Llama-31-405B-Instruct | $5.33 | $16.00 | 128,000 | 128000 | +| babbage-002 | $0.4 | $0.4 | 16,384 | 4096 | +| davinci-002 | $ 2.00 | $ 2.00 | 16,384 | 4096 | +| gpt-3.5-turbo-instruct | $1.5 | $ 2.00 | 8,192 | 4096 | +| gpt-3.5-turbo-instruct-0914 | $1.5 | $ 2.00 | 8,192 | 4097 | +| claude-instant-1 | $1.63 | $5.51 | 100,000 | 8191 | +| mistral/mistral-tiny | $0.25 | $0.25 | 32,000 | 8191 | +| mistral/mistral-small | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| mistral/mistral-small-latest | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| mistral/mistral-medium | $2.7 | $8.1 | 32,000 | 8191 | +| mistral/mistral-medium-latest | $2.7 | $8.1 | 32,000 | 8191 | +| mistral/mistral-medium-2312 | $2.7 | $8.1 | 32,000 | 8191 | +| mistral/mistral-large-latest | $ 3.00 | $ 9.00 | 128,000 | 128000 | +| mistral/mistral-large-2402 | $ 4.00 | $12.00 | 32,000 | 8191 | +| mistral/mistral-large-2407 | $ 3.00 | $ 9.00 | 128,000 | 128000 | +| mistral/open-mistral-7b | $0.25 | $0.25 | 32,000 | 8191 | +| mistral/open-mixtral-8x7b | $0.7 | $0.7 | 32,000 | 8191 | +| mistral/open-mixtral-8x22b | $ 2.00 | $ 6.00 | 64,000 | 8191 | +| mistral/codestral-latest | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| mistral/codestral-2405 | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| mistral/open-mistral-nemo | $0.3 | $0.3 | 128,000 | 128000 | +| mistral/open-mistral-nemo-2407 | $0.3 | $0.3 | 128,000 | 128000 | +| mistral/open-codestral-mamba | $0.25 | $0.25 | 256,000 | 256000 | +| mistral/codestral-mamba-latest | $0.25 | $0.25 | 256,000 | 256000 | +| mistral/mistral-embed | $0.1 | -- | 8,192 | nan | +| deepseek-chat | $0.14 | $0.28 | 32,000 | 4096 | +| codestral/codestral-latest | $ 0.00 | $ 0.00 | 32,000 | 8191 | +| codestral/codestral-2405 | $ 0.00 | $ 0.00 | 32,000 | 8191 | +| text-completion-codestral/codestral-latest | $ 0.00 | $ 0.00 | 32,000 | 8191 | +| text-completion-codestral/codestral-2405 | $ 0.00 | $ 0.00 | 32,000 | 8191 | +| deepseek-coder | $0.14 | $0.28 | 128,000 | 4096 | +| groq/llama2-70b-4096 | $0.7 | $0.8 | 4,096 | 4096 | +| groq/llama3-8b-8192 | $0.05 | $0.08 | 8,192 | 8192 | +| groq/llama3-70b-8192 | $0.59 | $0.79 | 8,192 | 8192 | +| groq/llama-3.1-8b-instant | $0.59 | $0.79 | 8,192 | 8192 | +| groq/llama-3.1-70b-versatile | $0.59 | $0.79 | 8,192 | 8192 | +| groq/llama-3.1-405b-reasoning | $0.59 | $0.79 | 8,192 | 8192 | +| groq/mixtral-8x7b-32768 | $0.24 | $0.24 | 32,768 | 32768 | +| groq/gemma-7b-it | $0.07 | $0.07 | 8,192 | 8192 | +| groq/llama3-groq-70b-8192-tool-use-preview | $0.89 | $0.89 | 8,192 | 8192 | +| groq/llama3-groq-8b-8192-tool-use-preview | $0.19 | $0.19 | 8,192 | 8192 | +| friendliai/mixtral-8x7b-instruct-v0-1 | $0.4 | $0.4 | 32,768 | 32768 | +| friendliai/meta-llama-3-8b-instruct | $0.1 | $0.1 | 8,192 | 8192 | +| friendliai/meta-llama-3-70b-instruct | $0.8 | $0.8 | 8,192 | 8192 | +| claude-instant-1.2 | $0.163 | $0.551 | 100,000 | 8191 | +| claude-2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| claude-2.1 | $ 8.00 | $24.00 | 200,000 | 8191 | +| claude-3-haiku-20240307 | $0.25 | $1.25 | 200,000 | 4096 | +| claude-3-opus-20240229 | $15.00 | $75.00 | 200,000 | 4096 | +| claude-3-sonnet-20240229 | $ 3.00 | $15.00 | 200,000 | 4096 | +| claude-3-5-sonnet-20240620 | $ 3.00 | $15.00 | 200,000 | 4096 | +| text-bison | -- | -- | 8,192 | 2048 | +| text-bison@001 | -- | -- | 8,192 | 1024 | +| text-bison@002 | -- | -- | 8,192 | 1024 | +| text-bison32k | $0.125 | $0.125 | 8,192 | 1024 | +| text-bison32k@002 | $0.125 | $0.125 | 8,192 | 1024 | +| text-unicorn | $10.00 | $28.00 | 8,192 | 1024 | +| text-unicorn@001 | $10.00 | $28.00 | 8,192 | 1024 | +| chat-bison | $0.125 | $0.125 | 8,192 | 4096 | +| chat-bison@001 | $0.125 | $0.125 | 8,192 | 4096 | +| chat-bison@002 | $0.125 | $0.125 | 8,192 | 4096 | +| chat-bison-32k | $0.125 | $0.125 | 32,000 | 8192 | +| chat-bison-32k@002 | $0.125 | $0.125 | 32,000 | 8192 | +| code-bison | $0.125 | $0.125 | 6,144 | 1024 | +| code-bison@001 | $0.125 | $0.125 | 6,144 | 1024 | +| code-bison@002 | $0.125 | $0.125 | 6,144 | 1024 | +| code-bison32k | $0.125 | $0.125 | 6,144 | 1024 | +| code-bison-32k@002 | $0.125 | $0.125 | 6,144 | 1024 | +| code-gecko@001 | $0.125 | $0.125 | 2,048 | 64 | +| code-gecko@002 | $0.125 | $0.125 | 2,048 | 64 | +| code-gecko | $0.125 | $0.125 | 2,048 | 64 | +| code-gecko-latest | $0.125 | $0.125 | 2,048 | 64 | +| codechat-bison@latest | $0.125 | $0.125 | 6,144 | 1024 | +| codechat-bison | $0.125 | $0.125 | 6,144 | 1024 | +| codechat-bison@001 | $0.125 | $0.125 | 6,144 | 1024 | +| codechat-bison@002 | $0.125 | $0.125 | 6,144 | 1024 | +| codechat-bison-32k | $0.125 | $0.125 | 32,000 | 8192 | +| codechat-bison-32k@002 | $0.125 | $0.125 | 32,000 | 8192 | +| gemini-pro | $0.5 | $1.5 | 32,760 | 8192 | +| gemini-1.0-pro | $0.5 | $1.5 | 32,760 | 8192 | +| gemini-1.0-pro-001 | $0.5 | $1.5 | 32,760 | 8192 | +| gemini-1.0-ultra | $0.5 | $1.5 | 8,192 | 2048 | +| gemini-1.0-ultra-001 | $0.5 | $1.5 | 8,192 | 2048 | +| gemini-1.0-pro-002 | $0.5 | $1.5 | 32,760 | 8192 | +| gemini-1.5-pro | $ 5.00 | $15.00 | 2,097,152 | 8192 | +| gemini-1.5-pro-001 | $ 5.00 | $15.00 | 1,000,000 | 8192 | +| gemini-1.5-pro-preview-0514 | $ 5.00 | $15.00 | 1,000,000 | 8192 | +| gemini-1.5-pro-preview-0215 | $ 5.00 | $15.00 | 1,000,000 | 8192 | +| gemini-1.5-pro-preview-0409 | $ 5.00 | $15.00 | 1,000,000 | 8192 | +| gemini-1.5-flash | $0.5 | $1.5 | 1,000,000 | 8192 | +| gemini-1.5-flash-001 | $0.5 | $1.5 | 1,000,000 | 8192 | +| gemini-1.5-flash-preview-0514 | $0.5 | $1.5 | 1,000,000 | 8192 | +| gemini-experimental | $ 0.00 | $ 0.00 | 1,000,000 | 8192 | +| gemini-pro-vision | $0.25 | $0.5 | 16,384 | 2048 | +| gemini-1.0-pro-vision | $0.25 | $0.5 | 16,384 | 2048 | +| gemini-1.0-pro-vision-001 | $0.25 | $0.5 | 16,384 | 2048 | +| medlm-medium | -- | -- | 32,768 | 8192 | +| medlm-large | -- | -- | 8,192 | 1024 | +| vertex_ai/claude-3-sonnet@20240229 | $ 3.00 | $15.00 | 200,000 | 4096 | +| vertex_ai/claude-3-5-sonnet@20240620 | $ 3.00 | $15.00 | 200,000 | 4096 | +| vertex_ai/claude-3-haiku@20240307 | $0.25 | $1.25 | 200,000 | 4096 | +| vertex_ai/claude-3-opus@20240229 | $15.00 | $75.00 | 200,000 | 4096 | +| vertex_ai/meta/llama3-405b-instruct-maas | $ 0.00 | $ 0.00 | 32,000 | 32000 | +| vertex_ai/imagegeneration@006 | -- | -- | nan | nan | +| text-embedding-004 | $0.00625 | $ 0.00 | 3,072 | nan | +| text-multilingual-embedding-002 | $0.00625 | $ 0.00 | 2,048 | nan | +| textembedding-gecko | $0.00625 | $ 0.00 | 3,072 | nan | +| textembedding-gecko-multilingual | $0.00625 | $ 0.00 | 3,072 | nan | +| textembedding-gecko-multilingual@001 | $0.00625 | $ 0.00 | 3,072 | nan | +| textembedding-gecko@001 | $0.00625 | $ 0.00 | 3,072 | nan | +| textembedding-gecko@003 | $0.00625 | $ 0.00 | 3,072 | nan | +| text-embedding-preview-0409 | $0.00625 | $ 0.00 | 3,072 | nan | +| text-multilingual-embedding-preview-0409 | $0.00625 | $ 0.00 | 3,072 | nan | +| palm/chat-bison | $0.125 | $0.125 | 8,192 | 4096 | +| palm/chat-bison-001 | $0.125 | $0.125 | 8,192 | 4096 | +| palm/text-bison | $0.125 | $0.125 | 8,192 | 1024 | +| palm/text-bison-001 | $0.125 | $0.125 | 8,192 | 1024 | +| palm/text-bison-safety-off | $0.125 | $0.125 | 8,192 | 1024 | +| palm/text-bison-safety-recitation-off | $0.125 | $0.125 | 8,192 | 1024 | +| gemini/gemini-1.5-flash | $0.35 | $1.05 | 1,000,000 | 8192 | +| gemini/gemini-1.5-flash-latest | $0.35 | $1.05 | 1,000,000 | 8192 | +| gemini/gemini-pro | $0.35 | $1.05 | 32,760 | 8192 | +| gemini/gemini-1.5-pro | $3.5 | $10.5 | 2,097,152 | 8192 | +| gemini/gemini-1.5-pro-latest | $3.5 | $1.05 | 1,048,576 | 8192 | +| gemini/gemini-pro-vision | $0.35 | $1.05 | 30,720 | 2048 | +| gemini/gemini-gemma-2-27b-it | $0.35 | $1.05 | nan | 8192 | +| gemini/gemini-gemma-2-9b-it | $0.35 | $1.05 | nan | 8192 | +| command-r | $0.5 | $1.5 | 128,000 | 4096 | +| command-light | $15.00 | $15.00 | 4,096 | 4096 | +| command-r-plus | $ 3.00 | $15.00 | 128,000 | 4096 | +| command-nightly | $15.00 | $15.00 | 4,096 | 4096 | +| command | $15.00 | $15.00 | 4,096 | 4096 | +| command-medium-beta | $15.00 | $15.00 | 4,096 | 4096 | +| command-xlarge-beta | $15.00 | $15.00 | 4,096 | 4096 | +| replicate/meta/llama-2-13b | $0.1 | $0.5 | 4,096 | 4096 | +| replicate/meta/llama-2-13b-chat | $0.1 | $0.5 | 4,096 | 4096 | +| replicate/meta/llama-2-70b | $0.65 | $2.75 | 4,096 | 4096 | +| replicate/meta/llama-2-70b-chat | $0.65 | $2.75 | 4,096 | 4096 | +| replicate/meta/llama-2-7b | $0.05 | $0.25 | 4,096 | 4096 | +| replicate/meta/llama-2-7b-chat | $0.05 | $0.25 | 4,096 | 4096 | +| replicate/meta/llama-3-70b | $0.65 | $2.75 | 8,192 | 8192 | +| replicate/meta/llama-3-70b-instruct | $0.65 | $2.75 | 8,192 | 8192 | +| replicate/meta/llama-3-8b | $0.05 | $0.25 | 8,086 | 8086 | +| replicate/meta/llama-3-8b-instruct | $0.05 | $0.25 | 8,086 | 8086 | +| replicate/mistralai/mistral-7b-v0.1 | $0.05 | $0.25 | 4,096 | 4096 | +| replicate/mistralai/mistral-7b-instruct-v0.2 | $0.05 | $0.25 | 4,096 | 4096 | +| replicate/mistralai/mixtral-8x7b-instruct-v0.1 | $0.3 | $ 1.00 | 4,096 | 4096 | +| openrouter/deepseek/deepseek-coder | $0.14 | $0.28 | 32,000 | 4096 | +| openrouter/microsoft/wizardlm-2-8x22b:nitro | $ 1.00 | $ 1.00 | nan | nan | +| openrouter/google/gemini-pro-1.5 | $2.5 | $7.5 | 1,000,000 | 8192 | +| openrouter/mistralai/mixtral-8x22b-instruct | $0.65 | $0.65 | nan | nan | +| openrouter/cohere/command-r-plus | $ 3.00 | $15.00 | nan | nan | +| openrouter/databricks/dbrx-instruct | $0.6 | $0.6 | nan | nan | +| openrouter/anthropic/claude-3-haiku | $0.25 | $1.25 | nan | nan | +| openrouter/anthropic/claude-3-haiku-20240307 | $0.25 | $1.25 | 200,000 | 4096 | +| openrouter/anthropic/claude-3.5-sonnet | $ 3.00 | $15.00 | 200,000 | 4096 | +| openrouter/anthropic/claude-3-sonnet | $ 3.00 | $15.00 | nan | nan | +| openrouter/mistralai/mistral-large | $ 8.00 | $24.00 | nan | nan | +| openrouter/cognitivecomputations/dolphin-mixtral-8x7b | $0.5 | $0.5 | nan | nan | +| openrouter/google/gemini-pro-vision | $0.125 | $0.375 | nan | nan | +| openrouter/fireworks/firellava-13b | $0.2 | $0.2 | nan | nan | +| openrouter/meta-llama/llama-3-8b-instruct:free | $ 0.00 | $ 0.00 | nan | nan | +| openrouter/meta-llama/llama-3-8b-instruct:extended | $0.225 | $2.25 | nan | nan | +| openrouter/meta-llama/llama-3-70b-instruct:nitro | $0.9 | $0.9 | nan | nan | +| openrouter/meta-llama/llama-3-70b-instruct | $0.59 | $0.79 | nan | nan | +| openrouter/openai/gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | +| openrouter/openai/gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | +| openrouter/openai/gpt-4-vision-preview | $10.00 | $30.00 | nan | nan | +| openrouter/openai/gpt-3.5-turbo | $1.5 | $ 2.00 | nan | nan | +| openrouter/openai/gpt-3.5-turbo-16k | $ 3.00 | $ 4.00 | nan | nan | +| openrouter/openai/gpt-4 | $30.00 | $60.00 | nan | nan | +| openrouter/anthropic/claude-instant-v1 | $1.63 | $5.51 | nan | 8191 | +| openrouter/anthropic/claude-2 | $11.02 | $32.68 | nan | 8191 | +| openrouter/anthropic/claude-3-opus | $15.00 | $75.00 | 200,000 | 4096 | +| openrouter/google/palm-2-chat-bison | $0.5 | $0.5 | nan | nan | +| openrouter/google/palm-2-codechat-bison | $0.5 | $0.5 | nan | nan | +| openrouter/meta-llama/llama-2-13b-chat | $0.2 | $0.2 | nan | nan | +| openrouter/meta-llama/llama-2-70b-chat | $1.5 | $1.5 | nan | nan | +| openrouter/meta-llama/codellama-34b-instruct | $0.5 | $0.5 | nan | nan | +| openrouter/nousresearch/nous-hermes-llama2-13b | $0.2 | $0.2 | nan | nan | +| openrouter/mancer/weaver | $5.625 | $5.625 | nan | nan | +| openrouter/gryphe/mythomax-l2-13b | $1.875 | $1.875 | nan | nan | +| openrouter/jondurbin/airoboros-l2-70b-2.1 | $13.875 | $13.875 | nan | nan | +| openrouter/undi95/remm-slerp-l2-13b | $1.875 | $1.875 | nan | nan | +| openrouter/pygmalionai/mythalion-13b | $1.875 | $1.875 | nan | nan | +| openrouter/mistralai/mistral-7b-instruct | $0.13 | $0.13 | nan | nan | +| openrouter/mistralai/mistral-7b-instruct:free | $ 0.00 | $ 0.00 | nan | nan | +| j2-ultra | $15.00 | $15.00 | 8,192 | 8192 | +| j2-mid | $10.00 | $10.00 | 8,192 | 8192 | +| j2-light | $ 3.00 | $ 3.00 | 8,192 | 8192 | +| dolphin | $0.5 | $0.5 | 16,384 | 16384 | +| chatdolphin | $0.5 | $0.5 | 16,384 | 16384 | +| luminous-base | $30.00 | $33.00 | nan | nan | +| luminous-base-control | $37.5 | $41.25 | nan | nan | +| luminous-extended | $45.00 | $49.5 | nan | nan | +| luminous-extended-control | $56.25 | $61.875 | nan | nan | +| luminous-supreme | $175.00 | $192.5 | nan | nan | +| luminous-supreme-control | $218.75 | $240.625 | nan | nan | +| ai21.j2-mid-v1 | $12.5 | $12.5 | 8,191 | 8191 | +| ai21.j2-ultra-v1 | $18.8 | $18.8 | 8,191 | 8191 | +| ai21.jamba-instruct-v1:0 | $0.5 | $0.7 | 70,000 | 4096 | +| amazon.titan-text-lite-v1 | $0.3 | $0.4 | 42,000 | 4000 | +| amazon.titan-text-express-v1 | $1.3 | $1.7 | 42,000 | 8000 | +| amazon.titan-embed-text-v1 | $0.1 | $ 0.00 | 8,192 | nan | +| amazon.titan-embed-text-v2:0 | $0.2 | $ 0.00 | 8,192 | nan | +| mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | +| mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | +| mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | +| bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | +| bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | +| bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 | $0.59 | $0.91 | 32,000 | 8191 | +| bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | +| bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | +| bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 | $0.2 | $0.26 | 32,000 | 8191 | +| bedrock/us-east-1/mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | +| bedrock/us-west-2/mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | +| bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 | $10.4 | $31.2 | 32,000 | 8191 | +| anthropic.claude-3-sonnet-20240229-v1:0 | $ 3.00 | $15.00 | 200,000 | 4096 | +| anthropic.claude-3-5-sonnet-20240620-v1:0 | $ 3.00 | $15.00 | 200,000 | 4096 | +| anthropic.claude-3-haiku-20240307-v1:0 | $0.25 | $1.25 | 200,000 | 4096 | +| anthropic.claude-3-opus-20240229-v1:0 | $15.00 | $75.00 | 200,000 | 4096 | +| anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-east-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-west-2/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-east-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-west-2/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-east-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-west-2/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| anthropic.claude-instant-v1 | $1.63 | $5.51 | 100,000 | 8191 | +| bedrock/us-east-1/anthropic.claude-instant-v1 | $0.8 | $2.4 | 100,000 | 8191 | +| bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/anthropic.claude-instant-v1 | $0.8 | $2.4 | 100,000 | 8191 | +| bedrock/ap-northeast-1/anthropic.claude-instant-v1 | $2.23 | $7.55 | 100,000 | 8191 | +| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/anthropic.claude-instant-v1 | $2.48 | $8.38 | 100,000 | 8191 | +| bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| cohere.command-text-v14 | $1.5 | $ 2.00 | 4,096 | 4096 | +| bedrock/*/1-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 | +| bedrock/*/6-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 | +| cohere.command-light-text-v14 | $0.3 | $0.6 | 4,096 | 4096 | +| bedrock/*/1-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 | +| bedrock/*/6-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 | +| cohere.command-r-plus-v1:0 | $ 3.00 | $15.00 | 128,000 | 4096 | +| cohere.command-r-v1:0 | $0.5 | $1.5 | 128,000 | 4096 | +| cohere.embed-english-v3 | $0.1 | $ 0.00 | 512 | nan | +| cohere.embed-multilingual-v3 | $0.1 | $ 0.00 | 512 | nan | +| meta.llama2-13b-chat-v1 | $0.75 | $ 1.00 | 4,096 | 4096 | +| meta.llama2-70b-chat-v1 | $1.95 | $2.56 | 4,096 | 4096 | +| meta.llama3-8b-instruct-v1:0 | $0.4 | $0.6 | 8,192 | 8192 | +| meta.llama3-70b-instruct-v1:0 | $2.65 | $3.5 | 8,192 | 8192 | +| meta.llama3-1-8b-instruct-v1:0 | $0.4 | $0.6 | 128,000 | 2048 | +| meta.llama3-1-70b-instruct-v1:0 | $2.65 | $3.5 | 128,000 | 2048 | +| 512-x-512/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | +| 512-x-512/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | +| max-x-max/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | +| max-x-max/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | +| 1024-x-1024/50-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan | +| 1024-x-1024/max-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan | +| sagemaker/meta-textgeneration-llama-2-7b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-7b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-13b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-13b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-70b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-70b-b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| together-ai-up-to-4b | $0.1 | $0.1 | nan | nan | +| together-ai-4.1b-8b | $0.2 | $0.2 | nan | nan | +| together-ai-8.1b-21b | $0.3 | $0.3 | nan | nan | +| together-ai-21.1b-41b | $0.8 | $0.8 | nan | nan | +| together-ai-41.1b-80b | $0.9 | $0.9 | nan | nan | +| together-ai-81.1b-110b | $1.8 | $1.8 | nan | nan | +| together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.6 | $0.6 | nan | nan | +| together_ai/mistralai/Mistral-7B-Instruct-v0.1 | -- | -- | nan | nan | +| together_ai/togethercomputer/CodeLlama-34b-Instruct | -- | -- | nan | nan | +| ollama/codegemma | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/llama2 | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/llama2:13b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/llama2:70b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/llama2-uncensored | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/llama3 | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/llama3:70b | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/mistral | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/mistral-7B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/mistral-7B-Instruct-v0.2 | $ 0.00 | $ 0.00 | 32,768 | 32768 | +| ollama/mixtral-8x7B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 32,768 | 32768 | +| ollama/mixtral-8x22B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 65,536 | 65536 | +| ollama/codellama | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/orca-mini | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/vicuna | $ 0.00 | $ 0.00 | 2,048 | 2048 | +| deepinfra/lizpreciatior/lzlv_70b_fp16_hf | $0.7 | $0.9 | 4,096 | 4096 | +| deepinfra/Gryphe/MythoMax-L2-13b | $0.22 | $0.22 | 4,096 | 4096 | +| deepinfra/mistralai/Mistral-7B-Instruct-v0.1 | $0.13 | $0.13 | 32,768 | 8191 | +| deepinfra/meta-llama/Llama-2-70b-chat-hf | $0.7 | $0.9 | 4,096 | 4096 | +| deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b | $0.27 | $0.27 | 32,768 | 8191 | +| deepinfra/codellama/CodeLlama-34b-Instruct-hf | $0.6 | $0.6 | 4,096 | 4096 | +| deepinfra/deepinfra/mixtral | $0.27 | $0.27 | 32,000 | 4096 | +| deepinfra/Phind/Phind-CodeLlama-34B-v2 | $0.6 | $0.6 | 16,384 | 4096 | +| deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.27 | $0.27 | 32,768 | 8191 | +| deepinfra/deepinfra/airoboros-70b | $0.7 | $0.9 | 4,096 | 4096 | +| deepinfra/01-ai/Yi-34B-Chat | $0.6 | $0.6 | 4,096 | 4096 | +| deepinfra/01-ai/Yi-6B-200K | $0.13 | $0.13 | 200,000 | 4096 | +| deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1 | $0.7 | $0.9 | 4,096 | 4096 | +| deepinfra/meta-llama/Llama-2-13b-chat-hf | $0.22 | $0.22 | 4,096 | 4096 | +| deepinfra/amazon/MistralLite | $0.2 | $0.2 | 32,768 | 8191 | +| deepinfra/meta-llama/Llama-2-7b-chat-hf | $0.13 | $0.13 | 4,096 | 4096 | +| deepinfra/meta-llama/Meta-Llama-3-8B-Instruct | $0.08 | $0.08 | 8,191 | 4096 | +| deepinfra/meta-llama/Meta-Llama-3-70B-Instruct | $0.59 | $0.79 | 8,191 | 4096 | +| deepinfra/01-ai/Yi-34B-200K | $0.6 | $0.6 | 200,000 | 4096 | +| deepinfra/openchat/openchat_3.5 | $0.13 | $0.13 | 4,096 | 4096 | +| perplexity/codellama-34b-instruct | $0.35 | $1.4 | 16,384 | 16384 | +| perplexity/codellama-70b-instruct | $0.7 | $2.8 | 16,384 | 16384 | +| perplexity/pplx-7b-chat | $0.07 | $0.28 | 8,192 | 8192 | +| perplexity/pplx-70b-chat | $0.7 | $2.8 | 4,096 | 4096 | +| perplexity/pplx-7b-online | $ 0.00 | $0.28 | 4,096 | 4096 | +| perplexity/pplx-70b-online | $ 0.00 | $2.8 | 4,096 | 4096 | +| perplexity/llama-2-70b-chat | $0.7 | $2.8 | 4,096 | 4096 | +| perplexity/mistral-7b-instruct | $0.07 | $0.28 | 4,096 | 4096 | +| perplexity/mixtral-8x7b-instruct | $0.07 | $0.28 | 4,096 | 4096 | +| perplexity/sonar-small-chat | $0.07 | $0.28 | 16,384 | 16384 | +| perplexity/sonar-small-online | $ 0.00 | $0.28 | 12,000 | 12000 | +| perplexity/sonar-medium-chat | $0.6 | $1.8 | 16,384 | 16384 | +| perplexity/sonar-medium-online | $ 0.00 | $1.8 | 12,000 | 12000 | +| fireworks_ai/firefunction-v2 | $0.9 | $0.9 | 8,192 | 8192 | +| fireworks_ai/mixtral-8x22b-instruct-hf | $1.2 | $1.2 | 65,536 | 65536 | +| fireworks_ai/qwen2-72b-instruct | $0.9 | $0.9 | 32,768 | 32768 | +| fireworks_ai/yi-large | $ 3.00 | $ 3.00 | 32,768 | 32768 | +| fireworks_ai/deepseek-coder-v2-instruct | $1.2 | $1.2 | 65,536 | 8192 | +| anyscale/mistralai/Mistral-7B-Instruct-v0.1 | $0.15 | $0.15 | 16,384 | 16384 | +| anyscale/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.15 | $0.15 | 16,384 | 16384 | +| anyscale/mistralai/Mixtral-8x22B-Instruct-v0.1 | $0.9 | $0.9 | 65,536 | 65536 | +| anyscale/HuggingFaceH4/zephyr-7b-beta | $0.15 | $0.15 | 16,384 | 16384 | +| anyscale/google/gemma-7b-it | $0.15 | $0.15 | 8,192 | 8192 | +| anyscale/meta-llama/Llama-2-7b-chat-hf | $0.15 | $0.15 | 4,096 | 4096 | +| anyscale/meta-llama/Llama-2-13b-chat-hf | $0.25 | $0.25 | 4,096 | 4096 | +| anyscale/meta-llama/Llama-2-70b-chat-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | +| anyscale/codellama/CodeLlama-34b-Instruct-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | +| anyscale/codellama/CodeLlama-70b-Instruct-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | +| anyscale/meta-llama/Meta-Llama-3-8B-Instruct | $0.15 | $0.15 | 8,192 | 8192 | +| anyscale/meta-llama/Meta-Llama-3-70B-Instruct | $ 1.00 | $ 1.00 | 8,192 | 8192 | +| cloudflare/@cf/meta/llama-2-7b-chat-fp16 | $1.923 | $1.923 | 3,072 | 3072 | +| cloudflare/@cf/meta/llama-2-7b-chat-int8 | $1.923 | $1.923 | 2,048 | 2048 | +| cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 | $1.923 | $1.923 | 8,192 | 8192 | +| cloudflare/@hf/thebloke/codellama-7b-instruct-awq | $1.923 | $1.923 | 4,096 | 4096 | +| voyage/voyage-01 | $0.1 | $ 0.00 | 4,096 | nan | +| voyage/voyage-lite-01 | $0.1 | $ 0.00 | 4,096 | nan | +| voyage/voyage-large-2 | $0.12 | $ 0.00 | 16,000 | nan | +| voyage/voyage-law-2 | $0.12 | $ 0.00 | 16,000 | nan | +| voyage/voyage-code-2 | $0.12 | $ 0.00 | 16,000 | nan | +| voyage/voyage-2 | $0.1 | $ 0.00 | 4,000 | nan | +| voyage/voyage-lite-02-instruct | $0.1 | $ 0.00 | 4,000 | nan | +| databricks/databricks-dbrx-instruct | $0.75 | $2.25 | 32,768 | 32768 | +| databricks/databricks-meta-llama-3-70b-instruct | $ 1.00 | $ 3.00 | 8,192 | 8192 | +| databricks/databricks-llama-2-70b-chat | $0.5 | $1.5 | 4,096 | 4096 | +| databricks/databricks-mixtral-8x7b-instruct | $0.5 | $ 1.00 | 4,096 | 4096 | +| databricks/databricks-mpt-30b-instruct | $ 1.00 | $ 1.00 | 8,192 | 8192 | +| databricks/databricks-mpt-7b-instruct | $0.5 | $0.5 | 8,192 | 8192 | +| databricks/databricks-bge-large-en | $0.1 | $ 0.00 | 512 | nan | |:--------------------------------------------------------------------------------------------|:----------------------------------|:--------------------------------------|:--------------------|--------------------:| | gpt-4 | $30.00 | $60.00 | 8,192 | 4096 | | gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | @@ -1029,6 +1511,7 @@ Units denominated in USD. All prices can be located in `model_prices.json`. | databricks/databricks-mpt-30b-instruct | $ 1.00 | $ 1.00 | 8,192 | 8192 | | databricks/databricks-mpt-7b-instruct | $0.5 | $0.5 | 8,192 | 8192 | | databricks/databricks-bge-large-en | $0.1 | $ 0.00 | 512 | nan | + ### Callback handlers You may also calculate token costs in LLM wrapper/framework libraries using callbacks. diff --git a/pricing_table.md b/pricing_table.md index 150269a..f185e4e 100644 --- a/pricing_table.md +++ b/pricing_table.md @@ -1,466 +1,483 @@ -| Model Name | Prompt Cost (USD) per 1M tokens | Completion Cost (USD) per 1M tokens | Max Prompt Tokens | Max Output Tokens | -|:--------------------------------------------------------------------------------------------|:----------------------------------|:--------------------------------------|:--------------------|--------------------:| -| gpt-4 | $30.00 | $60.00 | 8,192 | 4096 | -| gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | -| gpt-4o-mini | $0.15 | $0.6 | 128,000 | 4096 | -| gpt-4o-mini-2024-07-18 | $0.15 | $0.6 | 128,000 | 4096 | -| gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | -| gpt-4-turbo-preview | $10.00 | $30.00 | 128,000 | 4096 | -| gpt-4-0314 | $30.00 | $60.00 | 8,192 | 4096 | -| gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | -| gpt-4-32k | $60.00 | $120.00 | 32,768 | 4096 | -| gpt-4-32k-0314 | $60.00 | $120.00 | 32,768 | 4096 | -| gpt-4-32k-0613 | $60.00 | $120.00 | 32,768 | 4096 | -| gpt-4-turbo | $10.00 | $30.00 | 128,000 | 4096 | -| gpt-4-turbo-2024-04-09 | $10.00 | $30.00 | 128,000 | 4096 | -| gpt-4-1106-preview | $10.00 | $30.00 | 128,000 | 4096 | -| gpt-4-0125-preview | $10.00 | $30.00 | 128,000 | 4096 | -| gpt-4-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | -| gpt-4-1106-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | -| gpt-3.5-turbo | $1.5 | $ 2.00 | 16,385 | 4096 | -| gpt-3.5-turbo-0301 | $1.5 | $ 2.00 | 4,097 | 4096 | -| gpt-3.5-turbo-0613 | $1.5 | $ 2.00 | 4,097 | 4096 | -| gpt-3.5-turbo-1106 | $ 1.00 | $ 2.00 | 16,385 | 4096 | -| gpt-3.5-turbo-0125 | $0.5 | $1.5 | 16,385 | 4096 | -| gpt-3.5-turbo-16k | $ 3.00 | $ 4.00 | 16,385 | 4096 | -| gpt-3.5-turbo-16k-0613 | $ 3.00 | $ 4.00 | 16,385 | 4096 | -| ft:gpt-3.5-turbo | $ 3.00 | $ 6.00 | 4,097 | 4096 | -| ft:gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | -| ft:gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | -| ft:davinci-002 | $ 2.00 | $ 2.00 | 16,384 | 4096 | -| ft:babbage-002 | $0.4 | $0.4 | 16,384 | 4096 | -| text-embedding-3-large | $0.13 | $ 0.00 | 8,191 | nan | -| text-embedding-3-small | $0.02 | $ 0.00 | 8,191 | nan | -| text-embedding-ada-002 | $0.1 | $ 0.00 | 8,191 | nan | -| text-embedding-ada-002-v2 | $0.1 | $ 0.00 | 8,191 | nan | -| text-moderation-stable | $ 0.00 | $ 0.00 | 32,768 | 0 | -| text-moderation-007 | $ 0.00 | $ 0.00 | 32,768 | 0 | -| text-moderation-latest | $ 0.00 | $ 0.00 | 32,768 | 0 | -| 256-x-256/dall-e-2 | -- | -- | nan | nan | -| 512-x-512/dall-e-2 | -- | -- | nan | nan | -| 1024-x-1024/dall-e-2 | -- | -- | nan | nan | -| hd/1024-x-1792/dall-e-3 | -- | -- | nan | nan | -| hd/1792-x-1024/dall-e-3 | -- | -- | nan | nan | -| hd/1024-x-1024/dall-e-3 | -- | -- | nan | nan | -| standard/1024-x-1792/dall-e-3 | -- | -- | nan | nan | -| standard/1792-x-1024/dall-e-3 | -- | -- | nan | nan | -| standard/1024-x-1024/dall-e-3 | -- | -- | nan | nan | -| whisper-1 | -- | -- | nan | nan | -| tts-1 | -- | -- | nan | nan | -| tts-1-hd | -- | -- | nan | nan | -| azure/tts-1 | -- | -- | nan | nan | -| azure/tts-1-hd | -- | -- | nan | nan | -| azure/whisper-1 | -- | -- | nan | nan | -| azure/gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | -| azure/gpt-4-turbo-2024-04-09 | $10.00 | $30.00 | 128,000 | 4096 | -| azure/gpt-4-0125-preview | $10.00 | $30.00 | 128,000 | 4096 | -| azure/gpt-4-1106-preview | $10.00 | $30.00 | 128,000 | 4096 | -| azure/gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | -| azure/gpt-4-32k-0613 | $60.00 | $120.00 | 32,768 | 4096 | -| azure/gpt-4-32k | $60.00 | $120.00 | 32,768 | 4096 | -| azure/gpt-4 | $30.00 | $60.00 | 8,192 | 4096 | -| azure/gpt-4-turbo | $10.00 | $30.00 | 128,000 | 4096 | -| azure/gpt-4-turbo-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | -| azure/gpt-35-turbo-16k-0613 | $ 3.00 | $ 4.00 | 16,385 | 4096 | -| azure/gpt-35-turbo-1106 | $ 1.00 | $ 2.00 | 16,384 | 4096 | -| azure/gpt-35-turbo-0125 | $0.5 | $1.5 | 16,384 | 4096 | -| azure/gpt-35-turbo-16k | $ 3.00 | $ 4.00 | 16,385 | 4096 | -| azure/gpt-35-turbo | $0.5 | $1.5 | 4,097 | 4096 | -| azure/gpt-3.5-turbo-instruct-0914 | $1.5 | $ 2.00 | 4,097 | nan | -| azure/gpt-35-turbo-instruct | $1.5 | $ 2.00 | 4,097 | nan | -| azure/mistral-large-latest | $ 8.00 | $24.00 | 32,000 | nan | -| azure/mistral-large-2402 | $ 8.00 | $24.00 | 32,000 | nan | -| azure/command-r-plus | $ 3.00 | $15.00 | 128,000 | 4096 | -| azure/ada | $0.1 | $ 0.00 | 8,191 | nan | -| azure/text-embedding-ada-002 | $0.1 | $ 0.00 | 8,191 | nan | -| azure/text-embedding-3-large | $0.13 | $ 0.00 | 8,191 | nan | -| azure/text-embedding-3-small | $0.02 | $ 0.00 | 8,191 | nan | -| azure/standard/1024-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | -| azure/hd/1024-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | -| azure/standard/1024-x-1792/dall-e-3 | -- | $ 0.00 | nan | nan | -| azure/standard/1792-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | -| azure/hd/1024-x-1792/dall-e-3 | -- | $ 0.00 | nan | nan | -| azure/hd/1792-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | -| azure/standard/1024-x-1024/dall-e-2 | -- | $ 0.00 | nan | nan | -| azure_ai/jamba-instruct | $0.5 | $0.7 | 70,000 | 4096 | -| azure_ai/mistral-large | $ 4.00 | $12.00 | 32,000 | 8191 | -| azure_ai/mistral-small | $ 1.00 | $ 3.00 | 32,000 | 8191 | -| azure_ai/Meta-Llama-3-70B-Instruct | $1.1 | $0.37 | 8,192 | 8192 | -| babbage-002 | $0.4 | $0.4 | 16,384 | 4096 | -| davinci-002 | $ 2.00 | $ 2.00 | 16,384 | 4096 | -| gpt-3.5-turbo-instruct | $1.5 | $ 2.00 | 8,192 | 4096 | -| gpt-3.5-turbo-instruct-0914 | $1.5 | $ 2.00 | 8,192 | 4097 | -| claude-instant-1 | $1.63 | $5.51 | 100,000 | 8191 | -| mistral/mistral-tiny | $0.25 | $0.25 | 32,000 | 8191 | -| mistral/mistral-small | $ 1.00 | $ 3.00 | 32,000 | 8191 | -| mistral/mistral-small-latest | $ 1.00 | $ 3.00 | 32,000 | 8191 | -| mistral/mistral-medium | $2.7 | $8.1 | 32,000 | 8191 | -| mistral/mistral-medium-latest | $2.7 | $8.1 | 32,000 | 8191 | -| mistral/mistral-medium-2312 | $2.7 | $8.1 | 32,000 | 8191 | -| mistral/mistral-large-latest | $ 4.00 | $12.00 | 32,000 | 8191 | -| mistral/mistral-large-2402 | $ 4.00 | $12.00 | 32,000 | 8191 | -| mistral/open-mistral-7b | $0.25 | $0.25 | 32,000 | 8191 | -| mistral/open-mixtral-8x7b | $0.7 | $0.7 | 32,000 | 8191 | -| mistral/open-mixtral-8x22b | $ 2.00 | $ 6.00 | 64,000 | 8191 | -| mistral/codestral-latest | $ 1.00 | $ 3.00 | 32,000 | 8191 | -| mistral/codestral-2405 | $ 1.00 | $ 3.00 | 32,000 | 8191 | -| mistral/mistral-embed | $0.1 | -- | 8,192 | nan | -| deepseek-chat | $0.14 | $0.28 | 32,000 | 4096 | -| codestral/codestral-latest | $ 0.00 | $ 0.00 | 32,000 | 8191 | -| codestral/codestral-2405 | $ 0.00 | $ 0.00 | 32,000 | 8191 | -| text-completion-codestral/codestral-latest | $ 0.00 | $ 0.00 | 32,000 | 8191 | -| text-completion-codestral/codestral-2405 | $ 0.00 | $ 0.00 | 32,000 | 8191 | -| deepseek-coder | $0.14 | $0.28 | 128,000 | 4096 | -| groq/llama2-70b-4096 | $0.7 | $0.8 | 4,096 | 4096 | -| groq/llama3-8b-8192 | $0.05 | $0.08 | 8,192 | 8192 | -| groq/llama3-70b-8192 | $0.59 | $0.79 | 8,192 | 8192 | -| groq/mixtral-8x7b-32768 | $0.24 | $0.24 | 32,768 | 32768 | -| groq/gemma-7b-it | $0.07 | $0.07 | 8,192 | 8192 | -| groq/llama3-groq-70b-8192-tool-use-preview | $0.89 | $0.89 | 8,192 | 8192 | -| groq/llama3-groq-8b-8192-tool-use-preview | $0.19 | $0.19 | 8,192 | 8192 | -| friendliai/mixtral-8x7b-instruct-v0-1 | $0.4 | $0.4 | 32,768 | 32768 | -| friendliai/meta-llama-3-8b-instruct | $0.1 | $0.1 | 8,192 | 8192 | -| friendliai/meta-llama-3-70b-instruct | $0.8 | $0.8 | 8,192 | 8192 | -| claude-instant-1.2 | $0.163 | $0.551 | 100,000 | 8191 | -| claude-2 | $ 8.00 | $24.00 | 100,000 | 8191 | -| claude-2.1 | $ 8.00 | $24.00 | 200,000 | 8191 | -| claude-3-haiku-20240307 | $0.25 | $1.25 | 200,000 | 4096 | -| claude-3-opus-20240229 | $15.00 | $75.00 | 200,000 | 4096 | -| claude-3-sonnet-20240229 | $ 3.00 | $15.00 | 200,000 | 4096 | -| claude-3-5-sonnet-20240620 | $ 3.00 | $15.00 | 200,000 | 4096 | -| text-bison | -- | -- | 8,192 | 2048 | -| text-bison@001 | -- | -- | 8,192 | 1024 | -| text-bison@002 | -- | -- | 8,192 | 1024 | -| text-bison32k | $0.125 | $0.125 | 8,192 | 1024 | -| text-bison32k@002 | $0.125 | $0.125 | 8,192 | 1024 | -| text-unicorn | $10.00 | $28.00 | 8,192 | 1024 | -| text-unicorn@001 | $10.00 | $28.00 | 8,192 | 1024 | -| chat-bison | $0.125 | $0.125 | 8,192 | 4096 | -| chat-bison@001 | $0.125 | $0.125 | 8,192 | 4096 | -| chat-bison@002 | $0.125 | $0.125 | 8,192 | 4096 | -| chat-bison-32k | $0.125 | $0.125 | 32,000 | 8192 | -| chat-bison-32k@002 | $0.125 | $0.125 | 32,000 | 8192 | -| code-bison | $0.125 | $0.125 | 6,144 | 1024 | -| code-bison@001 | $0.125 | $0.125 | 6,144 | 1024 | -| code-bison@002 | $0.125 | $0.125 | 6,144 | 1024 | -| code-bison32k | $0.125 | $0.125 | 6,144 | 1024 | -| code-bison-32k@002 | $0.125 | $0.125 | 6,144 | 1024 | -| code-gecko@001 | $0.125 | $0.125 | 2,048 | 64 | -| code-gecko@002 | $0.125 | $0.125 | 2,048 | 64 | -| code-gecko | $0.125 | $0.125 | 2,048 | 64 | -| code-gecko-latest | $0.125 | $0.125 | 2,048 | 64 | -| codechat-bison@latest | $0.125 | $0.125 | 6,144 | 1024 | -| codechat-bison | $0.125 | $0.125 | 6,144 | 1024 | -| codechat-bison@001 | $0.125 | $0.125 | 6,144 | 1024 | -| codechat-bison@002 | $0.125 | $0.125 | 6,144 | 1024 | -| codechat-bison-32k | $0.125 | $0.125 | 32,000 | 8192 | -| codechat-bison-32k@002 | $0.125 | $0.125 | 32,000 | 8192 | -| gemini-pro | $0.5 | $1.5 | 32,760 | 8192 | -| gemini-1.0-pro | $0.5 | $1.5 | 32,760 | 8192 | -| gemini-1.0-pro-001 | $0.5 | $1.5 | 32,760 | 8192 | -| gemini-1.0-ultra | $0.5 | $1.5 | 8,192 | 2048 | -| gemini-1.0-ultra-001 | $0.5 | $1.5 | 8,192 | 2048 | -| gemini-1.0-pro-002 | $0.5 | $1.5 | 32,760 | 8192 | -| gemini-1.5-pro | $ 5.00 | $15.00 | 2,097,152 | 8192 | -| gemini-1.5-pro-001 | $ 5.00 | $15.00 | 1,000,000 | 8192 | -| gemini-1.5-pro-preview-0514 | $ 5.00 | $15.00 | 1,000,000 | 8192 | -| gemini-1.5-pro-preview-0215 | $ 5.00 | $15.00 | 1,000,000 | 8192 | -| gemini-1.5-pro-preview-0409 | $ 5.00 | $15.00 | 1,000,000 | 8192 | -| gemini-1.5-flash | $0.5 | $1.5 | 1,000,000 | 8192 | -| gemini-1.5-flash-001 | $0.5 | $1.5 | 1,000,000 | 8192 | -| gemini-1.5-flash-preview-0514 | $0.5 | $1.5 | 1,000,000 | 8192 | -| gemini-experimental | $ 0.00 | $ 0.00 | 1,000,000 | 8192 | -| gemini-pro-vision | $0.25 | $0.5 | 16,384 | 2048 | -| gemini-1.0-pro-vision | $0.25 | $0.5 | 16,384 | 2048 | -| gemini-1.0-pro-vision-001 | $0.25 | $0.5 | 16,384 | 2048 | -| medlm-medium | -- | -- | 32,768 | 8192 | -| medlm-large | -- | -- | 8,192 | 1024 | -| vertex_ai/claude-3-sonnet@20240229 | $ 3.00 | $15.00 | 200,000 | 4096 | -| vertex_ai/claude-3-5-sonnet@20240620 | $ 3.00 | $15.00 | 200,000 | 4096 | -| vertex_ai/claude-3-haiku@20240307 | $0.25 | $1.25 | 200,000 | 4096 | -| vertex_ai/claude-3-opus@20240229 | $15.00 | $75.00 | 200,000 | 4096 | -| vertex_ai/imagegeneration@006 | -- | -- | nan | nan | -| text-embedding-004 | $0.00625 | $ 0.00 | 3,072 | nan | -| text-multilingual-embedding-002 | $0.00625 | $ 0.00 | 2,048 | nan | -| textembedding-gecko | $0.00625 | $ 0.00 | 3,072 | nan | -| textembedding-gecko-multilingual | $0.00625 | $ 0.00 | 3,072 | nan | -| textembedding-gecko-multilingual@001 | $0.00625 | $ 0.00 | 3,072 | nan | -| textembedding-gecko@001 | $0.00625 | $ 0.00 | 3,072 | nan | -| textembedding-gecko@003 | $0.00625 | $ 0.00 | 3,072 | nan | -| text-embedding-preview-0409 | $0.00625 | $ 0.00 | 3,072 | nan | -| text-multilingual-embedding-preview-0409 | $0.00625 | $ 0.00 | 3,072 | nan | -| palm/chat-bison | $0.125 | $0.125 | 8,192 | 4096 | -| palm/chat-bison-001 | $0.125 | $0.125 | 8,192 | 4096 | -| palm/text-bison | $0.125 | $0.125 | 8,192 | 1024 | -| palm/text-bison-001 | $0.125 | $0.125 | 8,192 | 1024 | -| palm/text-bison-safety-off | $0.125 | $0.125 | 8,192 | 1024 | -| palm/text-bison-safety-recitation-off | $0.125 | $0.125 | 8,192 | 1024 | -| gemini/gemini-1.5-flash | $0.35 | $1.05 | 1,000,000 | 8192 | -| gemini/gemini-1.5-flash-latest | $0.35 | $1.05 | 1,000,000 | 8192 | -| gemini/gemini-pro | $0.35 | $1.05 | 32,760 | 8192 | -| gemini/gemini-1.5-pro | $3.5 | $10.5 | 2,097,152 | 8192 | -| gemini/gemini-1.5-pro-latest | $3.5 | $1.05 | 1,048,576 | 8192 | -| gemini/gemini-pro-vision | $0.35 | $1.05 | 30,720 | 2048 | -| command-r | $0.5 | $1.5 | 128,000 | 4096 | -| command-light | $15.00 | $15.00 | 4,096 | 4096 | -| command-r-plus | $ 3.00 | $15.00 | 128,000 | 4096 | -| command-nightly | $15.00 | $15.00 | 4,096 | 4096 | -| command | $15.00 | $15.00 | 4,096 | 4096 | -| command-medium-beta | $15.00 | $15.00 | 4,096 | 4096 | -| command-xlarge-beta | $15.00 | $15.00 | 4,096 | 4096 | -| replicate/meta/llama-2-13b | $0.1 | $0.5 | 4,096 | 4096 | -| replicate/meta/llama-2-13b-chat | $0.1 | $0.5 | 4,096 | 4096 | -| replicate/meta/llama-2-70b | $0.65 | $2.75 | 4,096 | 4096 | -| replicate/meta/llama-2-70b-chat | $0.65 | $2.75 | 4,096 | 4096 | -| replicate/meta/llama-2-7b | $0.05 | $0.25 | 4,096 | 4096 | -| replicate/meta/llama-2-7b-chat | $0.05 | $0.25 | 4,096 | 4096 | -| replicate/meta/llama-3-70b | $0.65 | $2.75 | 8,192 | 8192 | -| replicate/meta/llama-3-70b-instruct | $0.65 | $2.75 | 8,192 | 8192 | -| replicate/meta/llama-3-8b | $0.05 | $0.25 | 8,086 | 8086 | -| replicate/meta/llama-3-8b-instruct | $0.05 | $0.25 | 8,086 | 8086 | -| replicate/mistralai/mistral-7b-v0.1 | $0.05 | $0.25 | 4,096 | 4096 | -| replicate/mistralai/mistral-7b-instruct-v0.2 | $0.05 | $0.25 | 4,096 | 4096 | -| replicate/mistralai/mixtral-8x7b-instruct-v0.1 | $0.3 | $ 1.00 | 4,096 | 4096 | -| openrouter/deepseek/deepseek-coder | $0.14 | $0.28 | 32,000 | 4096 | -| openrouter/microsoft/wizardlm-2-8x22b:nitro | $ 1.00 | $ 1.00 | nan | nan | -| openrouter/google/gemini-pro-1.5 | $2.5 | $7.5 | 1,000,000 | 8192 | -| openrouter/mistralai/mixtral-8x22b-instruct | $0.65 | $0.65 | nan | nan | -| openrouter/cohere/command-r-plus | $ 3.00 | $15.00 | nan | nan | -| openrouter/databricks/dbrx-instruct | $0.6 | $0.6 | nan | nan | -| openrouter/anthropic/claude-3-haiku | $0.25 | $1.25 | nan | nan | -| openrouter/anthropic/claude-3-haiku-20240307 | $0.25 | $1.25 | 200,000 | 4096 | -| openrouter/anthropic/claude-3.5-sonnet | $ 3.00 | $15.00 | 200,000 | 4096 | -| openrouter/anthropic/claude-3-sonnet | $ 3.00 | $15.00 | nan | nan | -| openrouter/mistralai/mistral-large | $ 8.00 | $24.00 | nan | nan | -| openrouter/cognitivecomputations/dolphin-mixtral-8x7b | $0.5 | $0.5 | nan | nan | -| openrouter/google/gemini-pro-vision | $0.125 | $0.375 | nan | nan | -| openrouter/fireworks/firellava-13b | $0.2 | $0.2 | nan | nan | -| openrouter/meta-llama/llama-3-8b-instruct:free | $ 0.00 | $ 0.00 | nan | nan | -| openrouter/meta-llama/llama-3-8b-instruct:extended | $0.225 | $2.25 | nan | nan | -| openrouter/meta-llama/llama-3-70b-instruct:nitro | $0.9 | $0.9 | nan | nan | -| openrouter/meta-llama/llama-3-70b-instruct | $0.59 | $0.79 | nan | nan | -| openrouter/openai/gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | -| openrouter/openai/gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | -| openrouter/openai/gpt-4-vision-preview | $10.00 | $30.00 | nan | nan | -| openrouter/openai/gpt-3.5-turbo | $1.5 | $ 2.00 | nan | nan | -| openrouter/openai/gpt-3.5-turbo-16k | $ 3.00 | $ 4.00 | nan | nan | -| openrouter/openai/gpt-4 | $30.00 | $60.00 | nan | nan | -| openrouter/anthropic/claude-instant-v1 | $1.63 | $5.51 | nan | 8191 | -| openrouter/anthropic/claude-2 | $11.02 | $32.68 | nan | 8191 | -| openrouter/anthropic/claude-3-opus | $15.00 | $75.00 | 200,000 | 4096 | -| openrouter/google/palm-2-chat-bison | $0.5 | $0.5 | nan | nan | -| openrouter/google/palm-2-codechat-bison | $0.5 | $0.5 | nan | nan | -| openrouter/meta-llama/llama-2-13b-chat | $0.2 | $0.2 | nan | nan | -| openrouter/meta-llama/llama-2-70b-chat | $1.5 | $1.5 | nan | nan | -| openrouter/meta-llama/codellama-34b-instruct | $0.5 | $0.5 | nan | nan | -| openrouter/nousresearch/nous-hermes-llama2-13b | $0.2 | $0.2 | nan | nan | -| openrouter/mancer/weaver | $5.625 | $5.625 | nan | nan | -| openrouter/gryphe/mythomax-l2-13b | $1.875 | $1.875 | nan | nan | -| openrouter/jondurbin/airoboros-l2-70b-2.1 | $13.875 | $13.875 | nan | nan | -| openrouter/undi95/remm-slerp-l2-13b | $1.875 | $1.875 | nan | nan | -| openrouter/pygmalionai/mythalion-13b | $1.875 | $1.875 | nan | nan | -| openrouter/mistralai/mistral-7b-instruct | $0.13 | $0.13 | nan | nan | -| openrouter/mistralai/mistral-7b-instruct:free | $ 0.00 | $ 0.00 | nan | nan | -| j2-ultra | $15.00 | $15.00 | 8,192 | 8192 | -| j2-mid | $10.00 | $10.00 | 8,192 | 8192 | -| j2-light | $ 3.00 | $ 3.00 | 8,192 | 8192 | -| dolphin | $0.5 | $0.5 | 16,384 | 16384 | -| chatdolphin | $0.5 | $0.5 | 16,384 | 16384 | -| luminous-base | $30.00 | $33.00 | nan | nan | -| luminous-base-control | $37.5 | $41.25 | nan | nan | -| luminous-extended | $45.00 | $49.5 | nan | nan | -| luminous-extended-control | $56.25 | $61.875 | nan | nan | -| luminous-supreme | $175.00 | $192.5 | nan | nan | -| luminous-supreme-control | $218.75 | $240.625 | nan | nan | -| ai21.j2-mid-v1 | $12.5 | $12.5 | 8,191 | 8191 | -| ai21.j2-ultra-v1 | $18.8 | $18.8 | 8,191 | 8191 | -| amazon.titan-text-lite-v1 | $0.3 | $0.4 | 42,000 | 4000 | -| amazon.titan-text-express-v1 | $1.3 | $1.7 | 42,000 | 8000 | -| amazon.titan-embed-text-v1 | $0.1 | $ 0.00 | 8,192 | nan | -| amazon.titan-embed-text-v2:0 | $0.2 | $ 0.00 | 8,192 | nan | -| mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | -| mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | -| mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | -| bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | -| bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | -| bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 | $0.59 | $0.91 | 32,000 | 8191 | -| bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | -| bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | -| bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 | $0.2 | $0.26 | 32,000 | 8191 | -| bedrock/us-east-1/mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | -| bedrock/us-west-2/mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | -| bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 | $10.4 | $31.2 | 32,000 | 8191 | -| anthropic.claude-3-sonnet-20240229-v1:0 | $ 3.00 | $15.00 | 200,000 | 4096 | -| anthropic.claude-3-5-sonnet-20240620-v1:0 | $ 3.00 | $15.00 | 200,000 | 4096 | -| anthropic.claude-3-haiku-20240307-v1:0 | $0.25 | $1.25 | 200,000 | 4096 | -| anthropic.claude-3-opus-20240229-v1:0 | $15.00 | $75.00 | 200,000 | 4096 | -| anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/us-east-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/us-west-2/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/ap-northeast-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | -| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | -| bedrock/eu-central-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | -| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | -| bedrock/us-east-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | -| bedrock/us-east-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | -| anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/us-east-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/us-west-2/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/ap-northeast-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | -| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | -| bedrock/eu-central-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | -| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | -| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | -| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | -| anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/us-east-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/us-west-2/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/ap-northeast-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | -| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | -| bedrock/eu-central-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | -| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | -| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | -| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | -| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | -| anthropic.claude-instant-v1 | $1.63 | $5.51 | 100,000 | 8191 | -| bedrock/us-east-1/anthropic.claude-instant-v1 | $0.8 | $2.4 | 100,000 | 8191 | -| bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | -| bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | -| bedrock/us-west-2/anthropic.claude-instant-v1 | $0.8 | $2.4 | 100,000 | 8191 | -| bedrock/ap-northeast-1/anthropic.claude-instant-v1 | $2.23 | $7.55 | 100,000 | 8191 | -| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | -| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | -| bedrock/eu-central-1/anthropic.claude-instant-v1 | $2.48 | $8.38 | 100,000 | 8191 | -| bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | -| bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | -| cohere.command-text-v14 | $1.5 | $ 2.00 | 4,096 | 4096 | -| bedrock/*/1-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 | -| bedrock/*/6-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 | -| cohere.command-light-text-v14 | $0.3 | $0.6 | 4,096 | 4096 | -| bedrock/*/1-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 | -| bedrock/*/6-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 | -| cohere.command-r-plus-v1:0 | $ 3.00 | $15.00 | 128,000 | 4096 | -| cohere.command-r-v1:0 | $0.5 | $1.5 | 128,000 | 4096 | -| cohere.embed-english-v3 | $0.1 | $ 0.00 | 512 | nan | -| cohere.embed-multilingual-v3 | $0.1 | $ 0.00 | 512 | nan | -| meta.llama2-13b-chat-v1 | $0.75 | $ 1.00 | 4,096 | 4096 | -| meta.llama2-70b-chat-v1 | $1.95 | $2.56 | 4,096 | 4096 | -| meta.llama3-8b-instruct-v1:0 | $0.4 | $0.6 | 8,192 | 8192 | -| meta.llama3-70b-instruct-v1:0 | $2.65 | $3.5 | 8,192 | 8192 | -| 512-x-512/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | -| 512-x-512/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | -| max-x-max/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | -| max-x-max/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | -| 1024-x-1024/50-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan | -| 1024-x-1024/max-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan | -| sagemaker/meta-textgeneration-llama-2-7b | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| sagemaker/meta-textgeneration-llama-2-7b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| sagemaker/meta-textgeneration-llama-2-13b | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| sagemaker/meta-textgeneration-llama-2-13b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| sagemaker/meta-textgeneration-llama-2-70b | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| sagemaker/meta-textgeneration-llama-2-70b-b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| together-ai-up-to-4b | $0.1 | $0.1 | nan | nan | -| together-ai-4.1b-8b | $0.2 | $0.2 | nan | nan | -| together-ai-8.1b-21b | $0.3 | $0.3 | nan | nan | -| together-ai-21.1b-41b | $0.8 | $0.8 | nan | nan | -| together-ai-41.1b-80b | $0.9 | $0.9 | nan | nan | -| together-ai-81.1b-110b | $1.8 | $1.8 | nan | nan | -| together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.6 | $0.6 | nan | nan | -| together_ai/mistralai/Mistral-7B-Instruct-v0.1 | -- | -- | nan | nan | -| together_ai/togethercomputer/CodeLlama-34b-Instruct | -- | -- | nan | nan | -| ollama/codegemma | $ 0.00 | $ 0.00 | 8,192 | 8192 | -| ollama/llama2 | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| ollama/llama2:13b | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| ollama/llama2:70b | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| ollama/llama2-uncensored | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| ollama/llama3 | $ 0.00 | $ 0.00 | 8,192 | 8192 | -| ollama/llama3:70b | $ 0.00 | $ 0.00 | 8,192 | 8192 | -| ollama/mistral | $ 0.00 | $ 0.00 | 8,192 | 8192 | -| ollama/mistral-7B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 8,192 | 8192 | -| ollama/mistral-7B-Instruct-v0.2 | $ 0.00 | $ 0.00 | 32,768 | 32768 | -| ollama/mixtral-8x7B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 32,768 | 32768 | -| ollama/mixtral-8x22B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 65,536 | 65536 | -| ollama/codellama | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| ollama/orca-mini | $ 0.00 | $ 0.00 | 4,096 | 4096 | -| ollama/vicuna | $ 0.00 | $ 0.00 | 2,048 | 2048 | -| deepinfra/lizpreciatior/lzlv_70b_fp16_hf | $0.7 | $0.9 | 4,096 | 4096 | -| deepinfra/Gryphe/MythoMax-L2-13b | $0.22 | $0.22 | 4,096 | 4096 | -| deepinfra/mistralai/Mistral-7B-Instruct-v0.1 | $0.13 | $0.13 | 32,768 | 8191 | -| deepinfra/meta-llama/Llama-2-70b-chat-hf | $0.7 | $0.9 | 4,096 | 4096 | -| deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b | $0.27 | $0.27 | 32,768 | 8191 | -| deepinfra/codellama/CodeLlama-34b-Instruct-hf | $0.6 | $0.6 | 4,096 | 4096 | -| deepinfra/deepinfra/mixtral | $0.27 | $0.27 | 32,000 | 4096 | -| deepinfra/Phind/Phind-CodeLlama-34B-v2 | $0.6 | $0.6 | 16,384 | 4096 | -| deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.27 | $0.27 | 32,768 | 8191 | -| deepinfra/deepinfra/airoboros-70b | $0.7 | $0.9 | 4,096 | 4096 | -| deepinfra/01-ai/Yi-34B-Chat | $0.6 | $0.6 | 4,096 | 4096 | -| deepinfra/01-ai/Yi-6B-200K | $0.13 | $0.13 | 200,000 | 4096 | -| deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1 | $0.7 | $0.9 | 4,096 | 4096 | -| deepinfra/meta-llama/Llama-2-13b-chat-hf | $0.22 | $0.22 | 4,096 | 4096 | -| deepinfra/amazon/MistralLite | $0.2 | $0.2 | 32,768 | 8191 | -| deepinfra/meta-llama/Llama-2-7b-chat-hf | $0.13 | $0.13 | 4,096 | 4096 | -| deepinfra/meta-llama/Meta-Llama-3-8B-Instruct | $0.08 | $0.08 | 8,191 | 4096 | -| deepinfra/meta-llama/Meta-Llama-3-70B-Instruct | $0.59 | $0.79 | 8,191 | 4096 | -| deepinfra/01-ai/Yi-34B-200K | $0.6 | $0.6 | 200,000 | 4096 | -| deepinfra/openchat/openchat_3.5 | $0.13 | $0.13 | 4,096 | 4096 | -| perplexity/codellama-34b-instruct | $0.35 | $1.4 | 16,384 | 16384 | -| perplexity/codellama-70b-instruct | $0.7 | $2.8 | 16,384 | 16384 | -| perplexity/pplx-7b-chat | $0.07 | $0.28 | 8,192 | 8192 | -| perplexity/pplx-70b-chat | $0.7 | $2.8 | 4,096 | 4096 | -| perplexity/pplx-7b-online | $ 0.00 | $0.28 | 4,096 | 4096 | -| perplexity/pplx-70b-online | $ 0.00 | $2.8 | 4,096 | 4096 | -| perplexity/llama-2-70b-chat | $0.7 | $2.8 | 4,096 | 4096 | -| perplexity/mistral-7b-instruct | $0.07 | $0.28 | 4,096 | 4096 | -| perplexity/mixtral-8x7b-instruct | $0.07 | $0.28 | 4,096 | 4096 | -| perplexity/sonar-small-chat | $0.07 | $0.28 | 16,384 | 16384 | -| perplexity/sonar-small-online | $ 0.00 | $0.28 | 12,000 | 12000 | -| perplexity/sonar-medium-chat | $0.6 | $1.8 | 16,384 | 16384 | -| perplexity/sonar-medium-online | $ 0.00 | $1.8 | 12,000 | 12000 | -| fireworks_ai/firefunction-v2 | $0.9 | $0.9 | 8,192 | 8192 | -| fireworks_ai/mixtral-8x22b-instruct-hf | $1.2 | $1.2 | 65,536 | 65536 | -| fireworks_ai/qwen2-72b-instruct | $0.9 | $0.9 | 32,768 | 32768 | -| fireworks_ai/yi-large | $ 3.00 | $ 3.00 | 32,768 | 32768 | -| fireworks_ai/deepseek-coder-v2-instruct | $1.2 | $1.2 | 65,536 | 8192 | -| anyscale/mistralai/Mistral-7B-Instruct-v0.1 | $0.15 | $0.15 | 16,384 | 16384 | -| anyscale/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.15 | $0.15 | 16,384 | 16384 | -| anyscale/mistralai/Mixtral-8x22B-Instruct-v0.1 | $0.9 | $0.9 | 65,536 | 65536 | -| anyscale/HuggingFaceH4/zephyr-7b-beta | $0.15 | $0.15 | 16,384 | 16384 | -| anyscale/google/gemma-7b-it | $0.15 | $0.15 | 8,192 | 8192 | -| anyscale/meta-llama/Llama-2-7b-chat-hf | $0.15 | $0.15 | 4,096 | 4096 | -| anyscale/meta-llama/Llama-2-13b-chat-hf | $0.25 | $0.25 | 4,096 | 4096 | -| anyscale/meta-llama/Llama-2-70b-chat-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | -| anyscale/codellama/CodeLlama-34b-Instruct-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | -| anyscale/codellama/CodeLlama-70b-Instruct-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | -| anyscale/meta-llama/Meta-Llama-3-8B-Instruct | $0.15 | $0.15 | 8,192 | 8192 | -| anyscale/meta-llama/Meta-Llama-3-70B-Instruct | $ 1.00 | $ 1.00 | 8,192 | 8192 | -| cloudflare/@cf/meta/llama-2-7b-chat-fp16 | $1.923 | $1.923 | 3,072 | 3072 | -| cloudflare/@cf/meta/llama-2-7b-chat-int8 | $1.923 | $1.923 | 2,048 | 2048 | -| cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 | $1.923 | $1.923 | 8,192 | 8192 | -| cloudflare/@hf/thebloke/codellama-7b-instruct-awq | $1.923 | $1.923 | 4,096 | 4096 | -| voyage/voyage-01 | $0.1 | $ 0.00 | 4,096 | nan | -| voyage/voyage-lite-01 | $0.1 | $ 0.00 | 4,096 | nan | -| voyage/voyage-large-2 | $0.12 | $ 0.00 | 16,000 | nan | -| voyage/voyage-law-2 | $0.12 | $ 0.00 | 16,000 | nan | -| voyage/voyage-code-2 | $0.12 | $ 0.00 | 16,000 | nan | -| voyage/voyage-2 | $0.1 | $ 0.00 | 4,000 | nan | -| voyage/voyage-lite-02-instruct | $0.1 | $ 0.00 | 4,000 | nan | -| databricks/databricks-dbrx-instruct | $0.75 | $2.25 | 32,768 | 32768 | -| databricks/databricks-meta-llama-3-70b-instruct | $ 1.00 | $ 3.00 | 8,192 | 8192 | -| databricks/databricks-llama-2-70b-chat | $0.5 | $1.5 | 4,096 | 4096 | -| databricks/databricks-mixtral-8x7b-instruct | $0.5 | $ 1.00 | 4,096 | 4096 | -| databricks/databricks-mpt-30b-instruct | $ 1.00 | $ 1.00 | 8,192 | 8192 | -| databricks/databricks-mpt-7b-instruct | $0.5 | $0.5 | 8,192 | 8192 | -| databricks/databricks-bge-large-en | $0.1 | $ 0.00 | 512 | nan | \ No newline at end of file +| Model Name | Prompt Cost (USD) per 1M tokens | Completion Cost (USD) per 1M tokens | Max Prompt Tokens | Max Output Tokens | +|:----------------------------------------------------------------------|:----------------------------------|:--------------------------------------|:--------------------|--------------------:| +| gpt-4 | $30.00 | $60.00 | 8,192 | 4096 | +| gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | +| gpt-4o-mini | $0.15 | $0.6 | 128,000 | 4096 | +| gpt-4o-mini-2024-07-18 | $0.15 | $0.6 | 128,000 | 4096 | +| gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | +| gpt-4-turbo-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-0314 | $30.00 | $60.00 | 8,192 | 4096 | +| gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | +| gpt-4-32k | $60.00 | $120.00 | 32,768 | 4096 | +| gpt-4-32k-0314 | $60.00 | $120.00 | 32,768 | 4096 | +| gpt-4-32k-0613 | $60.00 | $120.00 | 32,768 | 4096 | +| gpt-4-turbo | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-turbo-2024-04-09 | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-1106-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-0125-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-4-1106-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | +| gpt-3.5-turbo | $1.5 | $ 2.00 | 16,385 | 4096 | +| gpt-3.5-turbo-0301 | $1.5 | $ 2.00 | 4,097 | 4096 | +| gpt-3.5-turbo-0613 | $1.5 | $ 2.00 | 4,097 | 4096 | +| gpt-3.5-turbo-1106 | $ 1.00 | $ 2.00 | 16,385 | 4096 | +| gpt-3.5-turbo-0125 | $0.5 | $1.5 | 16,385 | 4096 | +| gpt-3.5-turbo-16k | $ 3.00 | $ 4.00 | 16,385 | 4096 | +| gpt-3.5-turbo-16k-0613 | $ 3.00 | $ 4.00 | 16,385 | 4096 | +| ft:gpt-3.5-turbo | $ 3.00 | $ 6.00 | 4,097 | 4096 | +| ft:gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | +| ft:gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | +| ft:davinci-002 | $ 2.00 | $ 2.00 | 16,384 | 4096 | +| ft:babbage-002 | $0.4 | $0.4 | 16,384 | 4096 | +| text-embedding-3-large | $0.13 | $ 0.00 | 8,191 | nan | +| text-embedding-3-small | $0.02 | $ 0.00 | 8,191 | nan | +| text-embedding-ada-002 | $0.1 | $ 0.00 | 8,191 | nan | +| text-embedding-ada-002-v2 | $0.1 | $ 0.00 | 8,191 | nan | +| text-moderation-stable | $ 0.00 | $ 0.00 | 32,768 | 0 | +| text-moderation-007 | $ 0.00 | $ 0.00 | 32,768 | 0 | +| text-moderation-latest | $ 0.00 | $ 0.00 | 32,768 | 0 | +| 256-x-256/dall-e-2 | -- | -- | nan | nan | +| 512-x-512/dall-e-2 | -- | -- | nan | nan | +| 1024-x-1024/dall-e-2 | -- | -- | nan | nan | +| hd/1024-x-1792/dall-e-3 | -- | -- | nan | nan | +| hd/1792-x-1024/dall-e-3 | -- | -- | nan | nan | +| hd/1024-x-1024/dall-e-3 | -- | -- | nan | nan | +| standard/1024-x-1792/dall-e-3 | -- | -- | nan | nan | +| standard/1792-x-1024/dall-e-3 | -- | -- | nan | nan | +| standard/1024-x-1024/dall-e-3 | -- | -- | nan | nan | +| whisper-1 | -- | -- | nan | nan | +| tts-1 | -- | -- | nan | nan | +| tts-1-hd | -- | -- | nan | nan | +| azure/tts-1 | -- | -- | nan | nan | +| azure/tts-1-hd | -- | -- | nan | nan | +| azure/whisper-1 | -- | -- | nan | nan | +| azure/gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | +| azure/gpt-4-turbo-2024-04-09 | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-4-0125-preview | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-4-1106-preview | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-4-0613 | $30.00 | $60.00 | 8,192 | 4096 | +| azure/gpt-4-32k-0613 | $60.00 | $120.00 | 32,768 | 4096 | +| azure/gpt-4-32k | $60.00 | $120.00 | 32,768 | 4096 | +| azure/gpt-4 | $30.00 | $60.00 | 8,192 | 4096 | +| azure/gpt-4-turbo | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-4-turbo-vision-preview | $10.00 | $30.00 | 128,000 | 4096 | +| azure/gpt-35-turbo-16k-0613 | $ 3.00 | $ 4.00 | 16,385 | 4096 | +| azure/gpt-35-turbo-1106 | $ 1.00 | $ 2.00 | 16,384 | 4096 | +| azure/gpt-35-turbo-0125 | $0.5 | $1.5 | 16,384 | 4096 | +| azure/gpt-35-turbo-16k | $ 3.00 | $ 4.00 | 16,385 | 4096 | +| azure/gpt-35-turbo | $0.5 | $1.5 | 4,097 | 4096 | +| azure/gpt-3.5-turbo-instruct-0914 | $1.5 | $ 2.00 | 4,097 | nan | +| azure/gpt-35-turbo-instruct | $1.5 | $ 2.00 | 4,097 | nan | +| azure/mistral-large-latest | $ 8.00 | $24.00 | 32,000 | nan | +| azure/mistral-large-2402 | $ 8.00 | $24.00 | 32,000 | nan | +| azure/command-r-plus | $ 3.00 | $15.00 | 128,000 | 4096 | +| azure/ada | $0.1 | $ 0.00 | 8,191 | nan | +| azure/text-embedding-ada-002 | $0.1 | $ 0.00 | 8,191 | nan | +| azure/text-embedding-3-large | $0.13 | $ 0.00 | 8,191 | nan | +| azure/text-embedding-3-small | $0.02 | $ 0.00 | 8,191 | nan | +| azure/standard/1024-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/hd/1024-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/standard/1024-x-1792/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/standard/1792-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/hd/1024-x-1792/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/hd/1792-x-1024/dall-e-3 | -- | $ 0.00 | nan | nan | +| azure/standard/1024-x-1024/dall-e-2 | -- | $ 0.00 | nan | nan | +| azure_ai/jamba-instruct | $0.5 | $0.7 | 70,000 | 4096 | +| azure_ai/mistral-large | $ 4.00 | $12.00 | 32,000 | 8191 | +| azure_ai/mistral-small | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| azure_ai/Meta-Llama-3-70B-Instruct | $1.1 | $0.37 | 8,192 | 8192 | +| azure_ai/Meta-Llama-31-8B-Instruct | $0.3 | $0.61 | 128,000 | 128000 | +| azure_ai/Meta-Llama-31-70B-Instruct | $2.68 | $3.54 | 128,000 | 128000 | +| azure_ai/Meta-Llama-31-405B-Instruct | $5.33 | $16.00 | 128,000 | 128000 | +| babbage-002 | $0.4 | $0.4 | 16,384 | 4096 | +| davinci-002 | $ 2.00 | $ 2.00 | 16,384 | 4096 | +| gpt-3.5-turbo-instruct | $1.5 | $ 2.00 | 8,192 | 4096 | +| gpt-3.5-turbo-instruct-0914 | $1.5 | $ 2.00 | 8,192 | 4097 | +| claude-instant-1 | $1.63 | $5.51 | 100,000 | 8191 | +| mistral/mistral-tiny | $0.25 | $0.25 | 32,000 | 8191 | +| mistral/mistral-small | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| mistral/mistral-small-latest | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| mistral/mistral-medium | $2.7 | $8.1 | 32,000 | 8191 | +| mistral/mistral-medium-latest | $2.7 | $8.1 | 32,000 | 8191 | +| mistral/mistral-medium-2312 | $2.7 | $8.1 | 32,000 | 8191 | +| mistral/mistral-large-latest | $ 3.00 | $ 9.00 | 128,000 | 128000 | +| mistral/mistral-large-2402 | $ 4.00 | $12.00 | 32,000 | 8191 | +| mistral/mistral-large-2407 | $ 3.00 | $ 9.00 | 128,000 | 128000 | +| mistral/open-mistral-7b | $0.25 | $0.25 | 32,000 | 8191 | +| mistral/open-mixtral-8x7b | $0.7 | $0.7 | 32,000 | 8191 | +| mistral/open-mixtral-8x22b | $ 2.00 | $ 6.00 | 64,000 | 8191 | +| mistral/codestral-latest | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| mistral/codestral-2405 | $ 1.00 | $ 3.00 | 32,000 | 8191 | +| mistral/open-mistral-nemo | $0.3 | $0.3 | 128,000 | 128000 | +| mistral/open-mistral-nemo-2407 | $0.3 | $0.3 | 128,000 | 128000 | +| mistral/open-codestral-mamba | $0.25 | $0.25 | 256,000 | 256000 | +| mistral/codestral-mamba-latest | $0.25 | $0.25 | 256,000 | 256000 | +| mistral/mistral-embed | $0.1 | -- | 8,192 | nan | +| deepseek-chat | $0.14 | $0.28 | 32,000 | 4096 | +| codestral/codestral-latest | $ 0.00 | $ 0.00 | 32,000 | 8191 | +| codestral/codestral-2405 | $ 0.00 | $ 0.00 | 32,000 | 8191 | +| text-completion-codestral/codestral-latest | $ 0.00 | $ 0.00 | 32,000 | 8191 | +| text-completion-codestral/codestral-2405 | $ 0.00 | $ 0.00 | 32,000 | 8191 | +| deepseek-coder | $0.14 | $0.28 | 128,000 | 4096 | +| groq/llama2-70b-4096 | $0.7 | $0.8 | 4,096 | 4096 | +| groq/llama3-8b-8192 | $0.05 | $0.08 | 8,192 | 8192 | +| groq/llama3-70b-8192 | $0.59 | $0.79 | 8,192 | 8192 | +| groq/llama-3.1-8b-instant | $0.59 | $0.79 | 8,192 | 8192 | +| groq/llama-3.1-70b-versatile | $0.59 | $0.79 | 8,192 | 8192 | +| groq/llama-3.1-405b-reasoning | $0.59 | $0.79 | 8,192 | 8192 | +| groq/mixtral-8x7b-32768 | $0.24 | $0.24 | 32,768 | 32768 | +| groq/gemma-7b-it | $0.07 | $0.07 | 8,192 | 8192 | +| groq/llama3-groq-70b-8192-tool-use-preview | $0.89 | $0.89 | 8,192 | 8192 | +| groq/llama3-groq-8b-8192-tool-use-preview | $0.19 | $0.19 | 8,192 | 8192 | +| friendliai/mixtral-8x7b-instruct-v0-1 | $0.4 | $0.4 | 32,768 | 32768 | +| friendliai/meta-llama-3-8b-instruct | $0.1 | $0.1 | 8,192 | 8192 | +| friendliai/meta-llama-3-70b-instruct | $0.8 | $0.8 | 8,192 | 8192 | +| claude-instant-1.2 | $0.163 | $0.551 | 100,000 | 8191 | +| claude-2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| claude-2.1 | $ 8.00 | $24.00 | 200,000 | 8191 | +| claude-3-haiku-20240307 | $0.25 | $1.25 | 200,000 | 4096 | +| claude-3-opus-20240229 | $15.00 | $75.00 | 200,000 | 4096 | +| claude-3-sonnet-20240229 | $ 3.00 | $15.00 | 200,000 | 4096 | +| claude-3-5-sonnet-20240620 | $ 3.00 | $15.00 | 200,000 | 4096 | +| text-bison | -- | -- | 8,192 | 2048 | +| text-bison@001 | -- | -- | 8,192 | 1024 | +| text-bison@002 | -- | -- | 8,192 | 1024 | +| text-bison32k | $0.125 | $0.125 | 8,192 | 1024 | +| text-bison32k@002 | $0.125 | $0.125 | 8,192 | 1024 | +| text-unicorn | $10.00 | $28.00 | 8,192 | 1024 | +| text-unicorn@001 | $10.00 | $28.00 | 8,192 | 1024 | +| chat-bison | $0.125 | $0.125 | 8,192 | 4096 | +| chat-bison@001 | $0.125 | $0.125 | 8,192 | 4096 | +| chat-bison@002 | $0.125 | $0.125 | 8,192 | 4096 | +| chat-bison-32k | $0.125 | $0.125 | 32,000 | 8192 | +| chat-bison-32k@002 | $0.125 | $0.125 | 32,000 | 8192 | +| code-bison | $0.125 | $0.125 | 6,144 | 1024 | +| code-bison@001 | $0.125 | $0.125 | 6,144 | 1024 | +| code-bison@002 | $0.125 | $0.125 | 6,144 | 1024 | +| code-bison32k | $0.125 | $0.125 | 6,144 | 1024 | +| code-bison-32k@002 | $0.125 | $0.125 | 6,144 | 1024 | +| code-gecko@001 | $0.125 | $0.125 | 2,048 | 64 | +| code-gecko@002 | $0.125 | $0.125 | 2,048 | 64 | +| code-gecko | $0.125 | $0.125 | 2,048 | 64 | +| code-gecko-latest | $0.125 | $0.125 | 2,048 | 64 | +| codechat-bison@latest | $0.125 | $0.125 | 6,144 | 1024 | +| codechat-bison | $0.125 | $0.125 | 6,144 | 1024 | +| codechat-bison@001 | $0.125 | $0.125 | 6,144 | 1024 | +| codechat-bison@002 | $0.125 | $0.125 | 6,144 | 1024 | +| codechat-bison-32k | $0.125 | $0.125 | 32,000 | 8192 | +| codechat-bison-32k@002 | $0.125 | $0.125 | 32,000 | 8192 | +| gemini-pro | $0.5 | $1.5 | 32,760 | 8192 | +| gemini-1.0-pro | $0.5 | $1.5 | 32,760 | 8192 | +| gemini-1.0-pro-001 | $0.5 | $1.5 | 32,760 | 8192 | +| gemini-1.0-ultra | $0.5 | $1.5 | 8,192 | 2048 | +| gemini-1.0-ultra-001 | $0.5 | $1.5 | 8,192 | 2048 | +| gemini-1.0-pro-002 | $0.5 | $1.5 | 32,760 | 8192 | +| gemini-1.5-pro | $ 5.00 | $15.00 | 2,097,152 | 8192 | +| gemini-1.5-pro-001 | $ 5.00 | $15.00 | 1,000,000 | 8192 | +| gemini-1.5-pro-preview-0514 | $ 5.00 | $15.00 | 1,000,000 | 8192 | +| gemini-1.5-pro-preview-0215 | $ 5.00 | $15.00 | 1,000,000 | 8192 | +| gemini-1.5-pro-preview-0409 | $ 5.00 | $15.00 | 1,000,000 | 8192 | +| gemini-1.5-flash | $0.5 | $1.5 | 1,000,000 | 8192 | +| gemini-1.5-flash-001 | $0.5 | $1.5 | 1,000,000 | 8192 | +| gemini-1.5-flash-preview-0514 | $0.5 | $1.5 | 1,000,000 | 8192 | +| gemini-experimental | $ 0.00 | $ 0.00 | 1,000,000 | 8192 | +| gemini-pro-vision | $0.25 | $0.5 | 16,384 | 2048 | +| gemini-1.0-pro-vision | $0.25 | $0.5 | 16,384 | 2048 | +| gemini-1.0-pro-vision-001 | $0.25 | $0.5 | 16,384 | 2048 | +| medlm-medium | -- | -- | 32,768 | 8192 | +| medlm-large | -- | -- | 8,192 | 1024 | +| vertex_ai/claude-3-sonnet@20240229 | $ 3.00 | $15.00 | 200,000 | 4096 | +| vertex_ai/claude-3-5-sonnet@20240620 | $ 3.00 | $15.00 | 200,000 | 4096 | +| vertex_ai/claude-3-haiku@20240307 | $0.25 | $1.25 | 200,000 | 4096 | +| vertex_ai/claude-3-opus@20240229 | $15.00 | $75.00 | 200,000 | 4096 | +| vertex_ai/meta/llama3-405b-instruct-maas | $ 0.00 | $ 0.00 | 32,000 | 32000 | +| vertex_ai/imagegeneration@006 | -- | -- | nan | nan | +| text-embedding-004 | $0.00625 | $ 0.00 | 3,072 | nan | +| text-multilingual-embedding-002 | $0.00625 | $ 0.00 | 2,048 | nan | +| textembedding-gecko | $0.00625 | $ 0.00 | 3,072 | nan | +| textembedding-gecko-multilingual | $0.00625 | $ 0.00 | 3,072 | nan | +| textembedding-gecko-multilingual@001 | $0.00625 | $ 0.00 | 3,072 | nan | +| textembedding-gecko@001 | $0.00625 | $ 0.00 | 3,072 | nan | +| textembedding-gecko@003 | $0.00625 | $ 0.00 | 3,072 | nan | +| text-embedding-preview-0409 | $0.00625 | $ 0.00 | 3,072 | nan | +| text-multilingual-embedding-preview-0409 | $0.00625 | $ 0.00 | 3,072 | nan | +| palm/chat-bison | $0.125 | $0.125 | 8,192 | 4096 | +| palm/chat-bison-001 | $0.125 | $0.125 | 8,192 | 4096 | +| palm/text-bison | $0.125 | $0.125 | 8,192 | 1024 | +| palm/text-bison-001 | $0.125 | $0.125 | 8,192 | 1024 | +| palm/text-bison-safety-off | $0.125 | $0.125 | 8,192 | 1024 | +| palm/text-bison-safety-recitation-off | $0.125 | $0.125 | 8,192 | 1024 | +| gemini/gemini-1.5-flash | $0.35 | $1.05 | 1,000,000 | 8192 | +| gemini/gemini-1.5-flash-latest | $0.35 | $1.05 | 1,000,000 | 8192 | +| gemini/gemini-pro | $0.35 | $1.05 | 32,760 | 8192 | +| gemini/gemini-1.5-pro | $3.5 | $10.5 | 2,097,152 | 8192 | +| gemini/gemini-1.5-pro-latest | $3.5 | $1.05 | 1,048,576 | 8192 | +| gemini/gemini-pro-vision | $0.35 | $1.05 | 30,720 | 2048 | +| gemini/gemini-gemma-2-27b-it | $0.35 | $1.05 | nan | 8192 | +| gemini/gemini-gemma-2-9b-it | $0.35 | $1.05 | nan | 8192 | +| command-r | $0.5 | $1.5 | 128,000 | 4096 | +| command-light | $15.00 | $15.00 | 4,096 | 4096 | +| command-r-plus | $ 3.00 | $15.00 | 128,000 | 4096 | +| command-nightly | $15.00 | $15.00 | 4,096 | 4096 | +| command | $15.00 | $15.00 | 4,096 | 4096 | +| command-medium-beta | $15.00 | $15.00 | 4,096 | 4096 | +| command-xlarge-beta | $15.00 | $15.00 | 4,096 | 4096 | +| replicate/meta/llama-2-13b | $0.1 | $0.5 | 4,096 | 4096 | +| replicate/meta/llama-2-13b-chat | $0.1 | $0.5 | 4,096 | 4096 | +| replicate/meta/llama-2-70b | $0.65 | $2.75 | 4,096 | 4096 | +| replicate/meta/llama-2-70b-chat | $0.65 | $2.75 | 4,096 | 4096 | +| replicate/meta/llama-2-7b | $0.05 | $0.25 | 4,096 | 4096 | +| replicate/meta/llama-2-7b-chat | $0.05 | $0.25 | 4,096 | 4096 | +| replicate/meta/llama-3-70b | $0.65 | $2.75 | 8,192 | 8192 | +| replicate/meta/llama-3-70b-instruct | $0.65 | $2.75 | 8,192 | 8192 | +| replicate/meta/llama-3-8b | $0.05 | $0.25 | 8,086 | 8086 | +| replicate/meta/llama-3-8b-instruct | $0.05 | $0.25 | 8,086 | 8086 | +| replicate/mistralai/mistral-7b-v0.1 | $0.05 | $0.25 | 4,096 | 4096 | +| replicate/mistralai/mistral-7b-instruct-v0.2 | $0.05 | $0.25 | 4,096 | 4096 | +| replicate/mistralai/mixtral-8x7b-instruct-v0.1 | $0.3 | $ 1.00 | 4,096 | 4096 | +| openrouter/deepseek/deepseek-coder | $0.14 | $0.28 | 32,000 | 4096 | +| openrouter/microsoft/wizardlm-2-8x22b:nitro | $ 1.00 | $ 1.00 | nan | nan | +| openrouter/google/gemini-pro-1.5 | $2.5 | $7.5 | 1,000,000 | 8192 | +| openrouter/mistralai/mixtral-8x22b-instruct | $0.65 | $0.65 | nan | nan | +| openrouter/cohere/command-r-plus | $ 3.00 | $15.00 | nan | nan | +| openrouter/databricks/dbrx-instruct | $0.6 | $0.6 | nan | nan | +| openrouter/anthropic/claude-3-haiku | $0.25 | $1.25 | nan | nan | +| openrouter/anthropic/claude-3-haiku-20240307 | $0.25 | $1.25 | 200,000 | 4096 | +| openrouter/anthropic/claude-3.5-sonnet | $ 3.00 | $15.00 | 200,000 | 4096 | +| openrouter/anthropic/claude-3-sonnet | $ 3.00 | $15.00 | nan | nan | +| openrouter/mistralai/mistral-large | $ 8.00 | $24.00 | nan | nan | +| openrouter/cognitivecomputations/dolphin-mixtral-8x7b | $0.5 | $0.5 | nan | nan | +| openrouter/google/gemini-pro-vision | $0.125 | $0.375 | nan | nan | +| openrouter/fireworks/firellava-13b | $0.2 | $0.2 | nan | nan | +| openrouter/meta-llama/llama-3-8b-instruct:free | $ 0.00 | $ 0.00 | nan | nan | +| openrouter/meta-llama/llama-3-8b-instruct:extended | $0.225 | $2.25 | nan | nan | +| openrouter/meta-llama/llama-3-70b-instruct:nitro | $0.9 | $0.9 | nan | nan | +| openrouter/meta-llama/llama-3-70b-instruct | $0.59 | $0.79 | nan | nan | +| openrouter/openai/gpt-4o | $ 5.00 | $15.00 | 128,000 | 4096 | +| openrouter/openai/gpt-4o-2024-05-13 | $ 5.00 | $15.00 | 128,000 | 4096 | +| openrouter/openai/gpt-4-vision-preview | $10.00 | $30.00 | nan | nan | +| openrouter/openai/gpt-3.5-turbo | $1.5 | $ 2.00 | nan | nan | +| openrouter/openai/gpt-3.5-turbo-16k | $ 3.00 | $ 4.00 | nan | nan | +| openrouter/openai/gpt-4 | $30.00 | $60.00 | nan | nan | +| openrouter/anthropic/claude-instant-v1 | $1.63 | $5.51 | nan | 8191 | +| openrouter/anthropic/claude-2 | $11.02 | $32.68 | nan | 8191 | +| openrouter/anthropic/claude-3-opus | $15.00 | $75.00 | 200,000 | 4096 | +| openrouter/google/palm-2-chat-bison | $0.5 | $0.5 | nan | nan | +| openrouter/google/palm-2-codechat-bison | $0.5 | $0.5 | nan | nan | +| openrouter/meta-llama/llama-2-13b-chat | $0.2 | $0.2 | nan | nan | +| openrouter/meta-llama/llama-2-70b-chat | $1.5 | $1.5 | nan | nan | +| openrouter/meta-llama/codellama-34b-instruct | $0.5 | $0.5 | nan | nan | +| openrouter/nousresearch/nous-hermes-llama2-13b | $0.2 | $0.2 | nan | nan | +| openrouter/mancer/weaver | $5.625 | $5.625 | nan | nan | +| openrouter/gryphe/mythomax-l2-13b | $1.875 | $1.875 | nan | nan | +| openrouter/jondurbin/airoboros-l2-70b-2.1 | $13.875 | $13.875 | nan | nan | +| openrouter/undi95/remm-slerp-l2-13b | $1.875 | $1.875 | nan | nan | +| openrouter/pygmalionai/mythalion-13b | $1.875 | $1.875 | nan | nan | +| openrouter/mistralai/mistral-7b-instruct | $0.13 | $0.13 | nan | nan | +| openrouter/mistralai/mistral-7b-instruct:free | $ 0.00 | $ 0.00 | nan | nan | +| j2-ultra | $15.00 | $15.00 | 8,192 | 8192 | +| j2-mid | $10.00 | $10.00 | 8,192 | 8192 | +| j2-light | $ 3.00 | $ 3.00 | 8,192 | 8192 | +| dolphin | $0.5 | $0.5 | 16,384 | 16384 | +| chatdolphin | $0.5 | $0.5 | 16,384 | 16384 | +| luminous-base | $30.00 | $33.00 | nan | nan | +| luminous-base-control | $37.5 | $41.25 | nan | nan | +| luminous-extended | $45.00 | $49.5 | nan | nan | +| luminous-extended-control | $56.25 | $61.875 | nan | nan | +| luminous-supreme | $175.00 | $192.5 | nan | nan | +| luminous-supreme-control | $218.75 | $240.625 | nan | nan | +| ai21.j2-mid-v1 | $12.5 | $12.5 | 8,191 | 8191 | +| ai21.j2-ultra-v1 | $18.8 | $18.8 | 8,191 | 8191 | +| ai21.jamba-instruct-v1:0 | $0.5 | $0.7 | 70,000 | 4096 | +| amazon.titan-text-lite-v1 | $0.3 | $0.4 | 42,000 | 4000 | +| amazon.titan-text-express-v1 | $1.3 | $1.7 | 42,000 | 8000 | +| amazon.titan-embed-text-v1 | $0.1 | $ 0.00 | 8,192 | nan | +| amazon.titan-embed-text-v2:0 | $0.2 | $ 0.00 | 8,192 | nan | +| mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | +| mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | +| mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | +| bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | +| bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 | $0.45 | $0.7 | 32,000 | 8191 | +| bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 | $0.59 | $0.91 | 32,000 | 8191 | +| bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | +| bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 | $0.15 | $0.2 | 32,000 | 8191 | +| bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 | $0.2 | $0.26 | 32,000 | 8191 | +| bedrock/us-east-1/mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | +| bedrock/us-west-2/mistral.mistral-large-2402-v1:0 | $ 8.00 | $24.00 | 32,000 | 8191 | +| bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 | $10.4 | $31.2 | 32,000 | 8191 | +| anthropic.claude-3-sonnet-20240229-v1:0 | $ 3.00 | $15.00 | 200,000 | 4096 | +| anthropic.claude-3-5-sonnet-20240620-v1:0 | $ 3.00 | $15.00 | 200,000 | 4096 | +| anthropic.claude-3-haiku-20240307-v1:0 | $0.25 | $1.25 | 200,000 | 4096 | +| anthropic.claude-3-opus-20240229-v1:0 | $15.00 | $75.00 | 200,000 | 4096 | +| anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-east-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-west-2/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/anthropic.claude-v1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 | +| anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-east-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-west-2/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/anthropic.claude-v2 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 | +| anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-east-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/us-west-2/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/anthropic.claude-v2:1 | $ 8.00 | $24.00 | 100,000 | 8191 | +| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 | +| anthropic.claude-instant-v1 | $1.63 | $5.51 | 100,000 | 8191 | +| bedrock/us-east-1/anthropic.claude-instant-v1 | $0.8 | $2.4 | 100,000 | 8191 | +| bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/us-west-2/anthropic.claude-instant-v1 | $0.8 | $2.4 | 100,000 | 8191 | +| bedrock/ap-northeast-1/anthropic.claude-instant-v1 | $2.23 | $7.55 | 100,000 | 8191 | +| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/anthropic.claude-instant-v1 | $2.48 | $8.38 | 100,000 | 8191 | +| bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 | +| cohere.command-text-v14 | $1.5 | $ 2.00 | 4,096 | 4096 | +| bedrock/*/1-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 | +| bedrock/*/6-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 | +| cohere.command-light-text-v14 | $0.3 | $0.6 | 4,096 | 4096 | +| bedrock/*/1-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 | +| bedrock/*/6-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 | +| cohere.command-r-plus-v1:0 | $ 3.00 | $15.00 | 128,000 | 4096 | +| cohere.command-r-v1:0 | $0.5 | $1.5 | 128,000 | 4096 | +| cohere.embed-english-v3 | $0.1 | $ 0.00 | 512 | nan | +| cohere.embed-multilingual-v3 | $0.1 | $ 0.00 | 512 | nan | +| meta.llama2-13b-chat-v1 | $0.75 | $ 1.00 | 4,096 | 4096 | +| meta.llama2-70b-chat-v1 | $1.95 | $2.56 | 4,096 | 4096 | +| meta.llama3-8b-instruct-v1:0 | $0.4 | $0.6 | 8,192 | 8192 | +| meta.llama3-70b-instruct-v1:0 | $2.65 | $3.5 | 8,192 | 8192 | +| meta.llama3-1-8b-instruct-v1:0 | $0.4 | $0.6 | 128,000 | 2048 | +| meta.llama3-1-70b-instruct-v1:0 | $2.65 | $3.5 | 128,000 | 2048 | +| 512-x-512/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | +| 512-x-512/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | +| max-x-max/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | +| max-x-max/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan | +| 1024-x-1024/50-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan | +| 1024-x-1024/max-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan | +| sagemaker/meta-textgeneration-llama-2-7b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-7b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-13b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-13b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-70b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| sagemaker/meta-textgeneration-llama-2-70b-b-f | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| together-ai-up-to-4b | $0.1 | $0.1 | nan | nan | +| together-ai-4.1b-8b | $0.2 | $0.2 | nan | nan | +| together-ai-8.1b-21b | $0.3 | $0.3 | nan | nan | +| together-ai-21.1b-41b | $0.8 | $0.8 | nan | nan | +| together-ai-41.1b-80b | $0.9 | $0.9 | nan | nan | +| together-ai-81.1b-110b | $1.8 | $1.8 | nan | nan | +| together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.6 | $0.6 | nan | nan | +| together_ai/mistralai/Mistral-7B-Instruct-v0.1 | -- | -- | nan | nan | +| together_ai/togethercomputer/CodeLlama-34b-Instruct | -- | -- | nan | nan | +| ollama/codegemma | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/llama2 | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/llama2:13b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/llama2:70b | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/llama2-uncensored | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/llama3 | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/llama3:70b | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/mistral | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/mistral-7B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 8,192 | 8192 | +| ollama/mistral-7B-Instruct-v0.2 | $ 0.00 | $ 0.00 | 32,768 | 32768 | +| ollama/mixtral-8x7B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 32,768 | 32768 | +| ollama/mixtral-8x22B-Instruct-v0.1 | $ 0.00 | $ 0.00 | 65,536 | 65536 | +| ollama/codellama | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/orca-mini | $ 0.00 | $ 0.00 | 4,096 | 4096 | +| ollama/vicuna | $ 0.00 | $ 0.00 | 2,048 | 2048 | +| deepinfra/lizpreciatior/lzlv_70b_fp16_hf | $0.7 | $0.9 | 4,096 | 4096 | +| deepinfra/Gryphe/MythoMax-L2-13b | $0.22 | $0.22 | 4,096 | 4096 | +| deepinfra/mistralai/Mistral-7B-Instruct-v0.1 | $0.13 | $0.13 | 32,768 | 8191 | +| deepinfra/meta-llama/Llama-2-70b-chat-hf | $0.7 | $0.9 | 4,096 | 4096 | +| deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b | $0.27 | $0.27 | 32,768 | 8191 | +| deepinfra/codellama/CodeLlama-34b-Instruct-hf | $0.6 | $0.6 | 4,096 | 4096 | +| deepinfra/deepinfra/mixtral | $0.27 | $0.27 | 32,000 | 4096 | +| deepinfra/Phind/Phind-CodeLlama-34B-v2 | $0.6 | $0.6 | 16,384 | 4096 | +| deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.27 | $0.27 | 32,768 | 8191 | +| deepinfra/deepinfra/airoboros-70b | $0.7 | $0.9 | 4,096 | 4096 | +| deepinfra/01-ai/Yi-34B-Chat | $0.6 | $0.6 | 4,096 | 4096 | +| deepinfra/01-ai/Yi-6B-200K | $0.13 | $0.13 | 200,000 | 4096 | +| deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1 | $0.7 | $0.9 | 4,096 | 4096 | +| deepinfra/meta-llama/Llama-2-13b-chat-hf | $0.22 | $0.22 | 4,096 | 4096 | +| deepinfra/amazon/MistralLite | $0.2 | $0.2 | 32,768 | 8191 | +| deepinfra/meta-llama/Llama-2-7b-chat-hf | $0.13 | $0.13 | 4,096 | 4096 | +| deepinfra/meta-llama/Meta-Llama-3-8B-Instruct | $0.08 | $0.08 | 8,191 | 4096 | +| deepinfra/meta-llama/Meta-Llama-3-70B-Instruct | $0.59 | $0.79 | 8,191 | 4096 | +| deepinfra/01-ai/Yi-34B-200K | $0.6 | $0.6 | 200,000 | 4096 | +| deepinfra/openchat/openchat_3.5 | $0.13 | $0.13 | 4,096 | 4096 | +| perplexity/codellama-34b-instruct | $0.35 | $1.4 | 16,384 | 16384 | +| perplexity/codellama-70b-instruct | $0.7 | $2.8 | 16,384 | 16384 | +| perplexity/pplx-7b-chat | $0.07 | $0.28 | 8,192 | 8192 | +| perplexity/pplx-70b-chat | $0.7 | $2.8 | 4,096 | 4096 | +| perplexity/pplx-7b-online | $ 0.00 | $0.28 | 4,096 | 4096 | +| perplexity/pplx-70b-online | $ 0.00 | $2.8 | 4,096 | 4096 | +| perplexity/llama-2-70b-chat | $0.7 | $2.8 | 4,096 | 4096 | +| perplexity/mistral-7b-instruct | $0.07 | $0.28 | 4,096 | 4096 | +| perplexity/mixtral-8x7b-instruct | $0.07 | $0.28 | 4,096 | 4096 | +| perplexity/sonar-small-chat | $0.07 | $0.28 | 16,384 | 16384 | +| perplexity/sonar-small-online | $ 0.00 | $0.28 | 12,000 | 12000 | +| perplexity/sonar-medium-chat | $0.6 | $1.8 | 16,384 | 16384 | +| perplexity/sonar-medium-online | $ 0.00 | $1.8 | 12,000 | 12000 | +| fireworks_ai/firefunction-v2 | $0.9 | $0.9 | 8,192 | 8192 | +| fireworks_ai/mixtral-8x22b-instruct-hf | $1.2 | $1.2 | 65,536 | 65536 | +| fireworks_ai/qwen2-72b-instruct | $0.9 | $0.9 | 32,768 | 32768 | +| fireworks_ai/yi-large | $ 3.00 | $ 3.00 | 32,768 | 32768 | +| fireworks_ai/deepseek-coder-v2-instruct | $1.2 | $1.2 | 65,536 | 8192 | +| anyscale/mistralai/Mistral-7B-Instruct-v0.1 | $0.15 | $0.15 | 16,384 | 16384 | +| anyscale/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.15 | $0.15 | 16,384 | 16384 | +| anyscale/mistralai/Mixtral-8x22B-Instruct-v0.1 | $0.9 | $0.9 | 65,536 | 65536 | +| anyscale/HuggingFaceH4/zephyr-7b-beta | $0.15 | $0.15 | 16,384 | 16384 | +| anyscale/google/gemma-7b-it | $0.15 | $0.15 | 8,192 | 8192 | +| anyscale/meta-llama/Llama-2-7b-chat-hf | $0.15 | $0.15 | 4,096 | 4096 | +| anyscale/meta-llama/Llama-2-13b-chat-hf | $0.25 | $0.25 | 4,096 | 4096 | +| anyscale/meta-llama/Llama-2-70b-chat-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | +| anyscale/codellama/CodeLlama-34b-Instruct-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | +| anyscale/codellama/CodeLlama-70b-Instruct-hf | $ 1.00 | $ 1.00 | 4,096 | 4096 | +| anyscale/meta-llama/Meta-Llama-3-8B-Instruct | $0.15 | $0.15 | 8,192 | 8192 | +| anyscale/meta-llama/Meta-Llama-3-70B-Instruct | $ 1.00 | $ 1.00 | 8,192 | 8192 | +| cloudflare/@cf/meta/llama-2-7b-chat-fp16 | $1.923 | $1.923 | 3,072 | 3072 | +| cloudflare/@cf/meta/llama-2-7b-chat-int8 | $1.923 | $1.923 | 2,048 | 2048 | +| cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 | $1.923 | $1.923 | 8,192 | 8192 | +| cloudflare/@hf/thebloke/codellama-7b-instruct-awq | $1.923 | $1.923 | 4,096 | 4096 | +| voyage/voyage-01 | $0.1 | $ 0.00 | 4,096 | nan | +| voyage/voyage-lite-01 | $0.1 | $ 0.00 | 4,096 | nan | +| voyage/voyage-large-2 | $0.12 | $ 0.00 | 16,000 | nan | +| voyage/voyage-law-2 | $0.12 | $ 0.00 | 16,000 | nan | +| voyage/voyage-code-2 | $0.12 | $ 0.00 | 16,000 | nan | +| voyage/voyage-2 | $0.1 | $ 0.00 | 4,000 | nan | +| voyage/voyage-lite-02-instruct | $0.1 | $ 0.00 | 4,000 | nan | +| databricks/databricks-dbrx-instruct | $0.75 | $2.25 | 32,768 | 32768 | +| databricks/databricks-meta-llama-3-70b-instruct | $ 1.00 | $ 3.00 | 8,192 | 8192 | +| databricks/databricks-llama-2-70b-chat | $0.5 | $1.5 | 4,096 | 4096 | +| databricks/databricks-mixtral-8x7b-instruct | $0.5 | $ 1.00 | 4,096 | 4096 | +| databricks/databricks-mpt-30b-instruct | $ 1.00 | $ 1.00 | 8,192 | 8192 | +| databricks/databricks-mpt-7b-instruct | $0.5 | $0.5 | 8,192 | 8192 | +| databricks/databricks-bge-large-en | $0.1 | $ 0.00 | 512 | nan | \ No newline at end of file diff --git a/tokencost/model_prices.json b/tokencost/model_prices.json index c549ef0..1299241 100644 --- a/tokencost/model_prices.json +++ b/tokencost/model_prices.json @@ -760,6 +760,36 @@ "litellm_provider": "azure_ai", "mode": "chat" }, + "azure_ai/Meta-Llama-31-8B-Instruct": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 3e-07, + "output_cost_per_token": 6.1e-07, + "litellm_provider": "azure_ai", + "mode": "chat", + "source": "https://azuremarketplace.microsoft.com/en-us/marketplace/apps/metagenai.meta-llama-3-1-8b-instruct-offer?tab=PlansAndPrice" + }, + "azure_ai/Meta-Llama-31-70B-Instruct": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 2.68e-06, + "output_cost_per_token": 3.54e-06, + "litellm_provider": "azure_ai", + "mode": "chat", + "source": "https://azuremarketplace.microsoft.com/en-us/marketplace/apps/metagenai.meta-llama-3-1-70b-instruct-offer?tab=PlansAndPrice" + }, + "azure_ai/Meta-Llama-31-405B-Instruct": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 5.33e-06, + "output_cost_per_token": 1.6e-05, + "litellm_provider": "azure_ai", + "mode": "chat", + "source": "https://azuremarketplace.microsoft.com/en-us/marketplace/apps/metagenai.meta-llama-3-1-405b-instruct-offer?tab=PlansAndPrice" + }, "babbage-002": { "max_tokens": 16384, "max_input_tokens": 16384, @@ -862,11 +892,11 @@ "mode": "chat" }, "mistral/mistral-large-latest": { - "max_tokens": 8191, - "max_input_tokens": 32000, - "max_output_tokens": 8191, - "input_cost_per_token": 4e-06, - "output_cost_per_token": 1.2e-05, + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 3e-06, + "output_cost_per_token": 9e-06, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true @@ -881,6 +911,16 @@ "mode": "chat", "supports_function_calling": true }, + "mistral/mistral-large-2407": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 3e-06, + "output_cost_per_token": 9e-06, + "litellm_provider": "mistral", + "mode": "chat", + "supports_function_calling": true + }, "mistral/open-mistral-7b": { "max_tokens": 8191, "max_input_tokens": 32000, @@ -928,6 +968,46 @@ "litellm_provider": "mistral", "mode": "chat" }, + "mistral/open-mistral-nemo": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 3e-07, + "output_cost_per_token": 3e-07, + "litellm_provider": "mistral", + "mode": "chat", + "source": "https://mistral.ai/technology/" + }, + "mistral/open-mistral-nemo-2407": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 128000, + "input_cost_per_token": 3e-07, + "output_cost_per_token": 3e-07, + "litellm_provider": "mistral", + "mode": "chat", + "source": "https://mistral.ai/technology/" + }, + "mistral/open-codestral-mamba": { + "max_tokens": 256000, + "max_input_tokens": 256000, + "max_output_tokens": 256000, + "input_cost_per_token": 2.5e-07, + "output_cost_per_token": 2.5e-07, + "litellm_provider": "mistral", + "mode": "chat", + "source": "https://mistral.ai/technology/" + }, + "mistral/codestral-mamba-latest": { + "max_tokens": 256000, + "max_input_tokens": 256000, + "max_output_tokens": 256000, + "input_cost_per_token": 2.5e-07, + "output_cost_per_token": 2.5e-07, + "litellm_provider": "mistral", + "mode": "chat", + "source": "https://mistral.ai/technology/" + }, "mistral/mistral-embed": { "max_tokens": 8192, "max_input_tokens": 8192, @@ -1023,6 +1103,36 @@ "mode": "chat", "supports_function_calling": true }, + "groq/llama-3.1-8b-instant": { + "max_tokens": 8192, + "max_input_tokens": 8192, + "max_output_tokens": 8192, + "input_cost_per_token": 5.9e-07, + "output_cost_per_token": 7.9e-07, + "litellm_provider": "groq", + "mode": "chat", + "supports_function_calling": true + }, + "groq/llama-3.1-70b-versatile": { + "max_tokens": 8192, + "max_input_tokens": 8192, + "max_output_tokens": 8192, + "input_cost_per_token": 5.9e-07, + "output_cost_per_token": 7.9e-07, + "litellm_provider": "groq", + "mode": "chat", + "supports_function_calling": true + }, + "groq/llama-3.1-405b-reasoning": { + "max_tokens": 8192, + "max_input_tokens": 8192, + "max_output_tokens": 8192, + "input_cost_per_token": 5.9e-07, + "output_cost_per_token": 7.9e-07, + "litellm_provider": "groq", + "mode": "chat", + "supports_function_calling": true + }, "groq/mixtral-8x7b-32768": { "max_tokens": 32768, "max_input_tokens": 32768, @@ -1907,6 +2017,16 @@ "supports_function_calling": true, "supports_vision": true }, + "vertex_ai/meta/llama3-405b-instruct-maas": { + "max_tokens": 32000, + "max_input_tokens": 32000, + "max_output_tokens": 32000, + "input_cost_per_token": 0.0, + "output_cost_per_token": 0.0, + "litellm_provider": "vertex_ai-llama_models", + "mode": "chat", + "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models" + }, "vertex_ai/imagegeneration@006": { "cost_per_image": 0.02, "litellm_provider": "vertex_ai-image-models", @@ -2167,6 +2287,28 @@ "supports_vision": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, + "gemini/gemini-gemma-2-27b-it": { + "max_tokens": 8192, + "max_output_tokens": 8192, + "input_cost_per_token": 3.5e-07, + "output_cost_per_token": 1.05e-06, + "litellm_provider": "gemini", + "mode": "chat", + "supports_function_calling": true, + "supports_vision": true, + "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" + }, + "gemini/gemini-gemma-2-9b-it": { + "max_tokens": 8192, + "max_output_tokens": 8192, + "input_cost_per_token": 3.5e-07, + "output_cost_per_token": 1.05e-06, + "litellm_provider": "gemini", + "mode": "chat", + "supports_function_calling": true, + "supports_vision": true, + "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" + }, "command-r": { "max_tokens": 4096, "max_input_tokens": 128000, @@ -2232,15 +2374,6 @@ "litellm_provider": "cohere", "mode": "completion" }, - "replicate/llama-2-70b-chat:2c1608e18606fad2812020dc541930f2d0495ce32eee50074220b87300bc16e1": { - "max_tokens": 4096, - "max_input_tokens": 4096, - "max_output_tokens": 4096, - "input_cost_per_token": 0.0, - "output_cost_per_token": 0.0, - "litellm_provider": "replicate", - "mode": "chat" - }, "replicate/meta/llama-2-13b": { "max_tokens": 4096, "max_input_tokens": 4096, @@ -2789,6 +2922,16 @@ "litellm_provider": "bedrock", "mode": "chat" }, + "ai21.jamba-instruct-v1:0": { + "max_tokens": 4096, + "max_input_tokens": 70000, + "max_output_tokens": 4096, + "input_cost_per_token": 5e-07, + "output_cost_per_token": 7e-07, + "litellm_provider": "bedrock", + "mode": "chat", + "supports_system_messages": true + }, "amazon.titan-text-lite-v1": { "max_tokens": 4000, "max_input_tokens": 42000, @@ -3569,6 +3712,24 @@ "litellm_provider": "bedrock", "mode": "chat" }, + "meta.llama3-1-8b-instruct-v1:0": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 2048, + "input_cost_per_token": 4e-07, + "output_cost_per_token": 6e-07, + "litellm_provider": "bedrock", + "mode": "chat" + }, + "meta.llama3-1-70b-instruct-v1:0": { + "max_tokens": 128000, + "max_input_tokens": 128000, + "max_output_tokens": 2048, + "input_cost_per_token": 2.65e-06, + "output_cost_per_token": 3.5e-06, + "litellm_provider": "bedrock", + "mode": "chat" + }, "512-x-512/50-steps/stability.stable-diffusion-xl-v0": { "max_tokens": 77, "max_input_tokens": 77,