Merge pull request #43 from AgentOps-AI/42-update-static-json-with-update-script

42 update static json with update script
This commit is contained in:
Alex Reibman
2024-05-21 18:05:02 -07:00
committed by GitHub
5 changed files with 2050 additions and 1631 deletions

757
README.md
View File

@@ -117,384 +117,385 @@ Units denominated in USD. All prices can be located in `model_prices.json`.
* Prices last updated Jan 30, 2024, from https://openai.com/pricing and https://github.com/BerriAI/litellm/blob/main/model_prices_and_context_window.json
| | max_tokens | max_input_tokens | input_cost_per_token | output_cost_per_token |
|:--------------------------------------------------------------------------------------------|:-------------|:-------------------|:-----------------------|:------------------------|
| gpt-4 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| gpt-4o | 4,096 | 128,000 | $0.00000500 | $0.00001500 |
| gpt-4o-2024-05-13 | 4,096 | 128,000 | $0.00000500 | $0.00001500 |
| gpt-4-turbo-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-0314 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| gpt-4-0613 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| gpt-4-32k | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| gpt-4-32k-0314 | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| gpt-4-32k-0613 | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| gpt-4-turbo | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-turbo-2024-04-09 | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-1106-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-0125-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-vision-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-1106-vision-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-3.5-turbo | 4,097 | 16,385 | $0.00000150 | $0.00000200 |
| gpt-3.5-turbo-0301 | 4,097 | 4,097 | $0.00000150 | $0.00000200 |
| gpt-3.5-turbo-0613 | 4,097 | 4,097 | $0.00000150 | $0.00000200 |
| gpt-3.5-turbo-1106 | 16,385 | 16,385 | $0.00000100 | $0.00000200 |
| gpt-3.5-turbo-0125 | 16,385 | 16,385 | $0.00000050 | $0.00000150 |
| gpt-3.5-turbo-16k | 16,385 | 16,385 | $0.00000300 | $0.00000400 |
| gpt-3.5-turbo-16k-0613 | 16,385 | 16,385 | $0.00000300 | $0.00000400 |
| ft:gpt-3.5-turbo | 4,097 | 4,097 | $0.00000300 | $0.00000600 |
| text-embedding-3-large | 8,191 | 8,191 | $0.00000013 | $0.00000000 |
| text-embedding-3-small | 8,191 | 8,191 | $0.00000002 | $0.00000000 |
| text-embedding-ada-002 | 8,191 | 8,191 | $0.00000010 | $0.00000000 |
| text-embedding-ada-002-v2 | 8,191 | 8,191 | $0.00000010 | $0.00000000 |
| text-moderation-stable | 32,768 | 32,768 | $0.00000000 | $0.00000000 |
| text-moderation-007 | 32,768 | 32,768 | $0.00000000 | $0.00000000 |
| text-moderation-latest | 32,768 | 32,768 | $0.00000000 | $0.00000000 |
| 256-x-256/dall-e-2 | nan | nan | -- | -- |
| 512-x-512/dall-e-2 | nan | nan | -- | -- |
| 1024-x-1024/dall-e-2 | nan | nan | -- | -- |
| hd/1024-x-1792/dall-e-3 | nan | nan | -- | -- |
| hd/1792-x-1024/dall-e-3 | nan | nan | -- | -- |
| hd/1024-x-1024/dall-e-3 | nan | nan | -- | -- |
| standard/1024-x-1792/dall-e-3 | nan | nan | -- | -- |
| standard/1792-x-1024/dall-e-3 | nan | nan | -- | -- |
| standard/1024-x-1024/dall-e-3 | nan | nan | -- | -- |
| whisper-1 | nan | nan | -- | -- |
| azure/whisper-1 | nan | nan | -- | -- |
| azure/gpt-4-turbo-2024-04-09 | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-4-0125-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-4-1106-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-4-0613 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| azure/gpt-4-32k-0613 | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| azure/gpt-4-32k | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| azure/gpt-4 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| azure/gpt-4-turbo | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-4-turbo-vision-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-35-turbo-16k-0613 | 4,096 | 16,385 | $0.00000300 | $0.00000400 |
| azure/gpt-35-turbo-1106 | 4,096 | 16,384 | $0.00000150 | $0.00000200 |
| azure/gpt-35-turbo-0125 | 4,096 | 16,384 | $0.00000050 | $0.00000150 |
| azure/gpt-35-turbo-16k | 4,096 | 16,385 | $0.00000300 | $0.00000400 |
| azure/gpt-35-turbo | 4,096 | 4,097 | $0.00000150 | $0.00000200 |
| azure/gpt-3.5-turbo-instruct-0914 | 4,097 | 4,097 | $0.00000150 | $0.00000200 |
| azure/gpt-35-turbo-instruct | 4,097 | 4,097 | $0.00000150 | $0.00000200 |
| azure/mistral-large-latest | 32,000 | 32,000 | $0.00000800 | $0.00002400 |
| azure/mistral-large-2402 | 32,000 | 32,000 | $0.00000800 | $0.00002400 |
| azure/command-r-plus | 4,096 | 128,000 | $0.00000300 | $0.00001500 |
| azure/ada | 8,191 | 8,191 | $0.00000010 | $0.00000000 |
| azure/text-embedding-ada-002 | 8,191 | 8,191 | $0.00000010 | $0.00000000 |
| azure/text-embedding-3-large | 8,191 | 8,191 | $0.00000013 | $0.00000000 |
| azure/text-embedding-3-small | 8,191 | 8,191 | $0.00000002 | $0.00000000 |
| azure/standard/1024-x-1024/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/hd/1024-x-1024/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/standard/1024-x-1792/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/standard/1792-x-1024/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/hd/1024-x-1792/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/hd/1792-x-1024/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/standard/1024-x-1024/dall-e-2 | nan | nan | -- | $0.00000000 |
| babbage-002 | 16,384 | 16,384 | $0.00000040 | $0.00000040 |
| davinci-002 | 16,384 | 16,384 | $0.00000200 | $0.00000200 |
| gpt-3.5-turbo-instruct | 4,096 | 8,192 | $0.00000150 | $0.00000200 |
| gpt-3.5-turbo-instruct-0914 | 4,097 | 8,192 | $0.00000150 | $0.00000200 |
| claude-instant-1 | 8,191 | 100,000 | $0.00000163 | $0.00000551 |
| mistral/mistral-tiny | 8,191 | 32,000 | $0.00000015 | $0.00000046 |
| mistral/mistral-small | 8,191 | 32,000 | $0.00000200 | $0.00000600 |
| mistral/mistral-small-latest | 8,191 | 32,000 | $0.00000200 | $0.00000600 |
| mistral/mistral-medium | 8,191 | 32,000 | $0.00000270 | $0.00000810 |
| mistral/mistral-medium-latest | 8,191 | 32,000 | $0.00000270 | $0.00000810 |
| mistral/mistral-medium-2312 | 8,191 | 32,000 | $0.00000270 | $0.00000810 |
| mistral/mistral-large-latest | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| mistral/mistral-large-2402 | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| mistral/open-mixtral-8x7b | 8,191 | 32,000 | $0.00000200 | $0.00000600 |
| mistral/mistral-embed | 8,192 | 8,192 | $0.00000011 | -- |
| deepseek-chat | 4,096 | 32,000 | $0.00000014 | $0.00000028 |
| deepseek-coder | 4,096 | 16,000 | $0.00000014 | $0.00000028 |
| groq/llama2-70b-4096 | 4,096 | 4,096 | $0.00000070 | $0.00000080 |
| groq/llama3-8b-8192 | 8,192 | 8,192 | $0.00000010 | $0.00000010 |
| groq/llama3-70b-8192 | 8,192 | 8,192 | $0.00000064 | $0.00000080 |
| groq/mixtral-8x7b-32768 | 32,768 | 32,768 | $0.00000027 | $0.00000027 |
| groq/gemma-7b-it | 8,192 | 8,192 | $0.00000010 | $0.00000010 |
| claude-instant-1.2 | 8,191 | 100,000 | $0.00000016 | $0.00000055 |
| claude-2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| claude-2.1 | 8,191 | 200,000 | $0.00000800 | $0.00002400 |
| claude-3-haiku-20240307 | 4,096 | 200,000 | $0.00000025 | $0.00000125 |
| claude-3-opus-20240229 | 4,096 | 200,000 | $0.00001500 | $0.00007500 |
| claude-3-sonnet-20240229 | 4,096 | 200,000 | $0.00000300 | $0.00001500 |
| text-bison | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| text-bison@001 | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| text-unicorn | 1,024 | 8,192 | $0.00001000 | $0.00002800 |
| text-unicorn@001 | 1,024 | 8,192 | $0.00001000 | $0.00002800 |
| chat-bison | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| chat-bison@001 | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| chat-bison@002 | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| chat-bison-32k | 8,192 | 32,000 | $0.00000012 | $0.00000012 |
| code-bison | 1,024 | 6,144 | $0.00000012 | $0.00000012 |
| code-bison@001 | 1,024 | 6,144 | $0.00000012 | $0.00000012 |
| code-gecko@001 | 64 | 2,048 | $0.00000012 | $0.00000012 |
| code-gecko@002 | 64 | 2,048 | $0.00000012 | $0.00000012 |
| code-gecko | 64 | 2,048 | $0.00000012 | $0.00000012 |
| codechat-bison | 1,024 | 6,144 | $0.00000012 | $0.00000012 |
| codechat-bison@001 | 1,024 | 6,144 | $0.00000012 | $0.00000012 |
| codechat-bison-32k | 8,192 | 32,000 | $0.00000012 | $0.00000012 |
| gemini-pro | 8,192 | 32,760 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro | 8,192 | 32,760 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro-001 | 8,192 | 32,760 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro-002 | 8,192 | 32,760 | $0.00000025 | $0.00000050 |
| gemini-1.5-pro | 8,192 | 1,000,000 | $0.00000063 | $0.00000188 |
| gemini-1.5-pro-preview-0215 | 8,192 | 1,000,000 | $0.00000063 | $0.00000188 |
| gemini-1.5-pro-preview-0409 | 8,192 | 1,000,000 | $0.00000063 | $0.00000188 |
| gemini-experimental | 8,192 | 1,000,000 | $0.00000000 | $0.00000000 |
| gemini-pro-vision | 2,048 | 16,384 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro-vision | 2,048 | 16,384 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro-vision-001 | 2,048 | 16,384 | $0.00000025 | $0.00000050 |
| vertex_ai/claude-3-sonnet@20240229 | 4,096 | 200,000 | $0.00000300 | $0.00001500 |
| vertex_ai/claude-3-haiku@20240307 | 4,096 | 200,000 | $0.00000025 | $0.00000125 |
| vertex_ai/claude-3-opus@20240229 | 4,096 | 200,000 | $0.00000150 | $0.00000750 |
| textembedding-gecko | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| textembedding-gecko-multilingual | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| textembedding-gecko-multilingual@001 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| textembedding-gecko@001 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| textembedding-gecko@003 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| text-embedding-preview-0409 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| text-multilingual-embedding-preview-0409 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| palm/chat-bison | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| palm/chat-bison-001 | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| palm/text-bison | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| palm/text-bison-001 | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| palm/text-bison-safety-off | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| palm/text-bison-safety-recitation-off | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| gemini/gemini-pro | 8,192 | 32,760 | $0.00000000 | $0.00000000 |
| gemini/gemini-1.5-pro | 8,192 | 1,000,000 | $0.00000000 | $0.00000000 |
| gemini/gemini-1.5-pro-latest | 8,192 | 1,048,576 | $0.00000000 | $0.00000000 |
| gemini/gemini-pro-vision | 2,048 | 30,720 | $0.00000000 | $0.00000000 |
| command-r | 4,096 | 128,000 | $0.00000050 | $0.00000150 |
| command-light | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| command-r-plus | 4,096 | 128,000 | $0.00000300 | $0.00001500 |
| command-nightly | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| command | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| command-medium-beta | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| command-xlarge-beta | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| replicate/meta/llama-2-13b | 4,096 | 4,096 | $0.00000010 | $0.00000050 |
| replicate/meta/llama-2-13b-chat | 4,096 | 4,096 | $0.00000010 | $0.00000050 |
| replicate/meta/llama-2-70b | 4,096 | 4,096 | $0.00000065 | $0.00000275 |
| replicate/meta/llama-2-70b-chat | 4,096 | 4,096 | $0.00000065 | $0.00000275 |
| replicate/meta/llama-2-7b | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/meta/llama-2-7b-chat | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/meta/llama-3-70b | 4,096 | 4,096 | $0.00000065 | $0.00000275 |
| replicate/meta/llama-3-70b-instruct | 4,096 | 4,096 | $0.00000065 | $0.00000275 |
| replicate/meta/llama-3-8b | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/meta/llama-3-8b-instruct | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/mistralai/mistral-7b-v0.1 | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/mistralai/mistral-7b-instruct-v0.2 | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/mistralai/mixtral-8x7b-instruct-v0.1 | 4,096 | 4,096 | $0.00000030 | $0.00000100 |
| openrouter/microsoft/wizardlm-2-8x22b:nitro | 65,536 | nan | $0.00000100 | $0.00000100 |
| openrouter/google/gemini-pro-1.5 | 8,192 | 1,000,000 | $0.00000250 | $0.00000750 |
| openrouter/mistralai/mixtral-8x22b-instruct | 65,536 | nan | $0.00000065 | $0.00000065 |
| openrouter/cohere/command-r-plus | 128,000 | nan | $0.00000300 | $0.00001500 |
| openrouter/databricks/dbrx-instruct | 32,768 | nan | $0.00000060 | $0.00000060 |
| openrouter/anthropic/claude-3-haiku | 200,000 | nan | $0.00000025 | $0.00000125 |
| openrouter/anthropic/claude-3-sonnet | 200,000 | nan | $0.00000300 | $0.00001500 |
| openrouter/mistralai/mistral-large | 32,000 | nan | $0.00000800 | $0.00002400 |
| openrouter/cognitivecomputations/dolphin-mixtral-8x7b | 32,769 | nan | $0.00000050 | $0.00000050 |
| openrouter/google/gemini-pro-vision | 45,875 | nan | $0.00000012 | $0.00000038 |
| openrouter/fireworks/firellava-13b | 4,096 | nan | $0.00000020 | $0.00000020 |
| openrouter/meta-llama/llama-3-8b-instruct:free | 8,192 | nan | $0.00000000 | $0.00000000 |
| openrouter/meta-llama/llama-3-8b-instruct:extended | 16,384 | nan | $0.00000022 | $0.00000225 |
| openrouter/meta-llama/llama-3-70b-instruct:nitro | 8,192 | nan | $0.00000090 | $0.00000090 |
| openrouter/meta-llama/llama-3-70b-instruct | 8,192 | nan | $0.00000059 | $0.00000079 |
| openrouter/openai/gpt-4-vision-preview | 130,000 | nan | $0.00001000 | $0.00003000 |
| openrouter/openai/gpt-3.5-turbo | 4,095 | nan | $0.00000150 | $0.00000200 |
| openrouter/openai/gpt-3.5-turbo-16k | 16,383 | nan | $0.00000300 | $0.00000400 |
| openrouter/openai/gpt-4 | 8,192 | nan | $0.00003000 | $0.00006000 |
| openrouter/anthropic/claude-instant-v1 | 100,000 | nan | $0.00000163 | $0.00000551 |
| openrouter/anthropic/claude-2 | 100,000 | nan | $0.00001102 | $0.00003268 |
| openrouter/anthropic/claude-3-opus | 4,096 | 200,000 | $0.00001500 | $0.00007500 |
| openrouter/google/palm-2-chat-bison | 25,804 | nan | $0.00000050 | $0.00000050 |
| openrouter/google/palm-2-codechat-bison | 20,070 | nan | $0.00000050 | $0.00000050 |
| openrouter/meta-llama/llama-2-13b-chat | 4,096 | nan | $0.00000020 | $0.00000020 |
| openrouter/meta-llama/llama-2-70b-chat | 4,096 | nan | $0.00000150 | $0.00000150 |
| openrouter/meta-llama/codellama-34b-instruct | 8,096 | nan | $0.00000050 | $0.00000050 |
| openrouter/nousresearch/nous-hermes-llama2-13b | 4,096 | nan | $0.00000020 | $0.00000020 |
| openrouter/mancer/weaver | 8,000 | nan | $0.00000563 | $0.00000563 |
| openrouter/gryphe/mythomax-l2-13b | 8,192 | nan | $0.00000188 | $0.00000188 |
| openrouter/jondurbin/airoboros-l2-70b-2.1 | 4,096 | nan | $0.00001388 | $0.00001388 |
| openrouter/undi95/remm-slerp-l2-13b | 6,144 | nan | $0.00000188 | $0.00000188 |
| openrouter/pygmalionai/mythalion-13b | 4,096 | nan | $0.00000188 | $0.00000188 |
| openrouter/mistralai/mistral-7b-instruct | 8,192 | nan | $0.00000013 | $0.00000013 |
| openrouter/mistralai/mistral-7b-instruct:free | 8,192 | nan | $0.00000000 | $0.00000000 |
| j2-ultra | 8,192 | 8,192 | $0.00001500 | $0.00001500 |
| j2-mid | 8,192 | 8,192 | $0.00001000 | $0.00001000 |
| j2-light | 8,192 | 8,192 | $0.00000300 | $0.00000300 |
| dolphin | 16,384 | 16,384 | $0.00000050 | $0.00000050 |
| chatdolphin | 16,384 | 16,384 | $0.00000050 | $0.00000050 |
| luminous-base | 2,048 | nan | $0.00003000 | $0.00003300 |
| luminous-base-control | 2,048 | nan | $0.00003750 | $0.00004125 |
| luminous-extended | 2,048 | nan | $0.00004500 | $0.00004950 |
| luminous-extended-control | 2,048 | nan | $0.00005625 | $0.00006187 |
| luminous-supreme | 2,048 | nan | $0.00017500 | $0.00019250 |
| luminous-supreme-control | 2,048 | nan | $0.00021875 | $0.00024063 |
| ai21.j2-mid-v1 | 8,191 | 8,191 | $0.00001250 | $0.00001250 |
| ai21.j2-ultra-v1 | 8,191 | 8,191 | $0.00001880 | $0.00001880 |
| amazon.titan-text-lite-v1 | 4,000 | 42,000 | $0.00000030 | $0.00000040 |
| amazon.titan-text-express-v1 | 8,000 | 42,000 | $0.00000130 | $0.00000170 |
| amazon.titan-embed-text-v1 | 8,192 | 8,192 | $0.00000010 | $0.00000000 |
| amazon.titan-embed-text-v2:0 | 8,192 | 8,192 | $0.00000020 | $0.00000000 |
| mistral.mistral-7b-instruct-v0:2 | 8,191 | 32,000 | $0.00000015 | $0.00000020 |
| mistral.mixtral-8x7b-instruct-v0:1 | 8,191 | 32,000 | $0.00000045 | $0.00000070 |
| mistral.mistral-large-2402-v1:0 | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 | 8,191 | 32,000 | $0.00000045 | $0.00000070 |
| bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 | 8,191 | 32,000 | $0.00000045 | $0.00000070 |
| bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 | 8,191 | 32,000 | $0.00000059 | $0.00000091 |
| bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 | 8,191 | 32,000 | $0.00000015 | $0.00000020 |
| bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 | 8,191 | 32,000 | $0.00000015 | $0.00000020 |
| bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 | 8,191 | 32,000 | $0.00000020 | $0.00000026 |
| bedrock/us-east-1/mistral.mistral-large-2402-v1:0 | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/mistral.mistral-large-2402-v1:0 | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 | 8,191 | 32,000 | $0.00001040 | $0.00003120 |
| anthropic.claude-3-sonnet-20240229-v1:0 | 4,096 | 200,000 | $0.00000300 | $0.00001500 |
| anthropic.claude-3-haiku-20240307-v1:0 | 4,096 | 200,000 | $0.00000025 | $0.00000125 |
| anthropic.claude-3-opus-20240229-v1:0 | 4,096 | 200,000 | $0.00001500 | $0.00007500 |
| anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-east-1/anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-east-1/anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-east-1/anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000163 | $0.00000551 |
| bedrock/us-east-1/anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000080 | $0.00000240 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000080 | $0.00000240 |
| bedrock/ap-northeast-1/anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000223 | $0.00000755 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000248 | $0.00000838 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| cohere.command-text-v14 | 4,096 | 4,096 | $0.00000150 | $0.00000200 |
| bedrock/*/1-month-commitment/cohere.command-text-v14 | 4,096 | 4,096 | -- | -- |
| bedrock/*/6-month-commitment/cohere.command-text-v14 | 4,096 | 4,096 | -- | -- |
| cohere.command-light-text-v14 | 4,096 | 4,096 | $0.00000030 | $0.00000060 |
| bedrock/*/1-month-commitment/cohere.command-light-text-v14 | 4,096 | 4,096 | -- | -- |
| bedrock/*/6-month-commitment/cohere.command-light-text-v14 | 4,096 | 4,096 | -- | -- |
| cohere.command-r-plus-v1:0 | 4,096 | 128,000 | $0.00000300 | $0.00001500 |
| cohere.command-r-v1:0 | 4,096 | 128,000 | $0.00000050 | $0.00000150 |
| cohere.embed-english-v3 | 512 | 512 | $0.00000010 | $0.00000000 |
| cohere.embed-multilingual-v3 | 512 | 512 | $0.00000010 | $0.00000000 |
| meta.llama2-13b-chat-v1 | 4,096 | 4,096 | $0.00000075 | $0.00000100 |
| meta.llama2-70b-chat-v1 | 4,096 | 4,096 | $0.00000195 | $0.00000256 |
| meta.llama3-8b-instruct-v1:0 | 8,192 | 8,192 | $0.00000040 | $0.00000060 |
| meta.llama3-70b-instruct-v1:0 | 8,192 | 8,192 | $0.00000265 | $0.00000350 |
| 512-x-512/50-steps/stability.stable-diffusion-xl-v0 | 77 | 77 | -- | -- |
| 512-x-512/max-steps/stability.stable-diffusion-xl-v0 | 77 | 77 | -- | -- |
| max-x-max/50-steps/stability.stable-diffusion-xl-v0 | 77 | 77 | -- | -- |
| max-x-max/max-steps/stability.stable-diffusion-xl-v0 | 77 | 77 | -- | -- |
| 1024-x-1024/50-steps/stability.stable-diffusion-xl-v1 | 77 | 77 | -- | -- |
| 1024-x-1024/max-steps/stability.stable-diffusion-xl-v1 | 77 | 77 | -- | -- |
| sagemaker/meta-textgeneration-llama-2-7b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-7b-f | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-13b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-13b-f | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-70b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-70b-b-f | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| together-ai-up-to-3b | nan | nan | $0.00000010 | $0.00000010 |
| together-ai-3.1b-7b | nan | nan | $0.00000020 | $0.00000020 |
| together-ai-7.1b-20b | 1,000 | nan | $0.00000040 | $0.00000040 |
| together-ai-20.1b-40b | nan | nan | $0.00000080 | $0.00000080 |
| together-ai-40.1b-70b | nan | nan | $0.00000090 | $0.00000090 |
| together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 | nan | nan | $0.00000060 | $0.00000060 |
| together_ai/mistralai/Mistral-7B-Instruct-v0.1 | nan | nan | -- | -- |
| together_ai/togethercomputer/CodeLlama-34b-Instruct | nan | nan | -- | -- |
| ollama/llama2 | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/llama2:13b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/llama2:70b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/llama2-uncensored | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/mistral | 8,192 | 8,192 | $0.00000000 | $0.00000000 |
| ollama/codellama | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/orca-mini | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/vicuna | 2,048 | 2,048 | $0.00000000 | $0.00000000 |
| deepinfra/lizpreciatior/lzlv_70b_fp16_hf | 4,096 | 4,096 | $0.00000070 | $0.00000090 |
| deepinfra/Gryphe/MythoMax-L2-13b | 4,096 | 4,096 | $0.00000022 | $0.00000022 |
| deepinfra/mistralai/Mistral-7B-Instruct-v0.1 | 8,191 | 32,768 | $0.00000013 | $0.00000013 |
| deepinfra/meta-llama/Llama-2-70b-chat-hf | 4,096 | 4,096 | $0.00000070 | $0.00000090 |
| deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b | 8,191 | 32,768 | $0.00000027 | $0.00000027 |
| deepinfra/codellama/CodeLlama-34b-Instruct-hf | 4,096 | 4,096 | $0.00000060 | $0.00000060 |
| deepinfra/deepinfra/mixtral | 4,096 | 32,000 | $0.00000027 | $0.00000027 |
| deepinfra/Phind/Phind-CodeLlama-34B-v2 | 4,096 | 16,384 | $0.00000060 | $0.00000060 |
| deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 | 8,191 | 32,768 | $0.00000027 | $0.00000027 |
| deepinfra/deepinfra/airoboros-70b | 4,096 | 4,096 | $0.00000070 | $0.00000090 |
| deepinfra/01-ai/Yi-34B-Chat | 4,096 | 4,096 | $0.00000060 | $0.00000060 |
| deepinfra/01-ai/Yi-6B-200K | 4,096 | 200,000 | $0.00000013 | $0.00000013 |
| deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1 | 4,096 | 4,096 | $0.00000070 | $0.00000090 |
| deepinfra/meta-llama/Llama-2-13b-chat-hf | 4,096 | 4,096 | $0.00000022 | $0.00000022 |
| deepinfra/amazon/MistralLite | 8,191 | 32,768 | $0.00000020 | $0.00000020 |
| deepinfra/meta-llama/Llama-2-7b-chat-hf | 4,096 | 4,096 | $0.00000013 | $0.00000013 |
| deepinfra/01-ai/Yi-34B-200K | 4,096 | 200,000 | $0.00000060 | $0.00000060 |
| deepinfra/openchat/openchat_3.5 | 4,096 | 4,096 | $0.00000013 | $0.00000013 |
| perplexity/codellama-34b-instruct | 16,384 | 16,384 | $0.00000035 | $0.00000140 |
| perplexity/codellama-70b-instruct | 16,384 | 16,384 | $0.00000070 | $0.00000280 |
| perplexity/pplx-7b-chat | 8,192 | 8,192 | $0.00000007 | $0.00000028 |
| perplexity/pplx-70b-chat | 4,096 | 4,096 | $0.00000070 | $0.00000280 |
| perplexity/pplx-7b-online | 4,096 | 4,096 | $0.00000000 | $0.00000028 |
| perplexity/pplx-70b-online | 4,096 | 4,096 | $0.00000000 | $0.00000280 |
| perplexity/llama-2-70b-chat | 4,096 | 4,096 | $0.00000070 | $0.00000280 |
| perplexity/mistral-7b-instruct | 4,096 | 4,096 | $0.00000007 | $0.00000028 |
| perplexity/mixtral-8x7b-instruct | 4,096 | 4,096 | $0.00000007 | $0.00000028 |
| perplexity/sonar-small-chat | 16,384 | 16,384 | $0.00000007 | $0.00000028 |
| perplexity/sonar-small-online | 12,000 | 12,000 | $0.00000000 | $0.00000028 |
| perplexity/sonar-medium-chat | 16,384 | 16,384 | $0.00000060 | $0.00000180 |
| perplexity/sonar-medium-online | 12,000 | 12,000 | $0.00000000 | $0.00000180 |
| anyscale/mistralai/Mistral-7B-Instruct-v0.1 | 16,384 | 16,384 | $0.00000015 | $0.00000015 |
| anyscale/Mixtral-8x7B-Instruct-v0.1 | 16,384 | 16,384 | $0.00000015 | $0.00000015 |
| anyscale/HuggingFaceH4/zephyr-7b-beta | 16,384 | 16,384 | $0.00000015 | $0.00000015 |
| anyscale/meta-llama/Llama-2-7b-chat-hf | 4,096 | 4,096 | $0.00000015 | $0.00000015 |
| anyscale/meta-llama/Llama-2-13b-chat-hf | 4,096 | 4,096 | $0.00000025 | $0.00000025 |
| anyscale/meta-llama/Llama-2-70b-chat-hf | 4,096 | 4,096 | $0.00000100 | $0.00000100 |
| anyscale/codellama/CodeLlama-34b-Instruct-hf | 4,096 | 4,096 | $0.00000100 | $0.00000100 |
| cloudflare/@cf/meta/llama-2-7b-chat-fp16 | 3,072 | 3,072 | $0.00000192 | $0.00000192 |
| cloudflare/@cf/meta/llama-2-7b-chat-int8 | 2,048 | 2,048 | $0.00000192 | $0.00000192 |
| cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 | 8,192 | 8,192 | $0.00000192 | $0.00000192 |
| cloudflare/@hf/thebloke/codellama-7b-instruct-awq | 4,096 | 4,096 | $0.00000192 | $0.00000192 |
| voyage/voyage-01 | 4,096 | 4,096 | $0.00000010 | $0.00000000 |
| voyage/voyage-lite-01 | 4,096 | 4,096 | $0.00000010 | $0.00000000 |
| voyage/voyage-large-2 | 16,000 | 16,000 | $0.00000012 | $0.00000000 |
| voyage/voyage-law-2 | 16,000 | 16,000 | $0.00000012 | $0.00000000 |
| voyage/voyage-code-2 | 16,000 | 16,000 | $0.00000012 | $0.00000000 |
| voyage/voyage-2 | 4,000 | 4,000 | $0.00000010 | $0.00000000 |
| voyage/voyage-lite-02-instruct | 4,000 | 4,000 | $0.00000010 | $0.00000000 |
| Model Name | Prompt Cost (USD) | Completion Cost (USD) | Max Prompt Tokens | Max Output Tokens |
|:--------------------------------------------------------------------------------------------|:--------------------|:------------------------|:--------------------|--------------------:|
| gpt-4 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| gpt-4o | $0.00000500 | $0.00001500 | 128,000 | 4096 |
| gpt-4o-2024-05-13 | $0.00000500 | $0.00001500 | 128,000 | 4096 |
| gpt-4-turbo-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-0314 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| gpt-4-0613 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| gpt-4-32k | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| gpt-4-32k-0314 | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| gpt-4-32k-0613 | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| gpt-4-turbo | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-turbo-2024-04-09 | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-1106-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-0125-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-vision-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-1106-vision-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-3.5-turbo | $0.00000150 | $0.00000200 | 16,385 | 4096 |
| gpt-3.5-turbo-0301 | $0.00000150 | $0.00000200 | 4,097 | 4096 |
| gpt-3.5-turbo-0613 | $0.00000150 | $0.00000200 | 4,097 | 4096 |
| gpt-3.5-turbo-1106 | $0.00000100 | $0.00000200 | 16,385 | 4096 |
| gpt-3.5-turbo-0125 | $0.00000050 | $0.00000150 | 16,385 | 4096 |
| gpt-3.5-turbo-16k | $0.00000300 | $0.00000400 | 16,385 | 4096 |
| gpt-3.5-turbo-16k-0613 | $0.00000300 | $0.00000400 | 16,385 | 4096 |
| ft:gpt-3.5-turbo | $0.00000300 | $0.00000600 | 4,097 | 4096 |
| text-embedding-3-large | $0.00000013 | $0.00000000 | 8,191 | nan |
| text-embedding-3-small | $0.00000002 | $0.00000000 | 8,191 | nan |
| text-embedding-ada-002 | $0.00000010 | $0.00000000 | 8,191 | nan |
| text-embedding-ada-002-v2 | $0.00000010 | $0.00000000 | 8,191 | nan |
| text-moderation-stable | $0.00000000 | $0.00000000 | 32,768 | 0 |
| text-moderation-007 | $0.00000000 | $0.00000000 | 32,768 | 0 |
| text-moderation-latest | $0.00000000 | $0.00000000 | 32,768 | 0 |
| 256-x-256/dall-e-2 | -- | -- | nan | nan |
| 512-x-512/dall-e-2 | -- | -- | nan | nan |
| 1024-x-1024/dall-e-2 | -- | -- | nan | nan |
| hd/1024-x-1792/dall-e-3 | -- | -- | nan | nan |
| hd/1792-x-1024/dall-e-3 | -- | -- | nan | nan |
| hd/1024-x-1024/dall-e-3 | -- | -- | nan | nan |
| standard/1024-x-1792/dall-e-3 | -- | -- | nan | nan |
| standard/1792-x-1024/dall-e-3 | -- | -- | nan | nan |
| standard/1024-x-1024/dall-e-3 | -- | -- | nan | nan |
| whisper-1 | -- | -- | nan | nan |
| azure/whisper-1 | -- | -- | nan | nan |
| azure/gpt-4-turbo-2024-04-09 | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-4-0125-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-4-1106-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-4-0613 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| azure/gpt-4-32k-0613 | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| azure/gpt-4-32k | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| azure/gpt-4 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| azure/gpt-4-turbo | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-4-turbo-vision-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-35-turbo-16k-0613 | $0.00000300 | $0.00000400 | 16,385 | 4096 |
| azure/gpt-35-turbo-1106 | $0.00000150 | $0.00000200 | 16,384 | 4096 |
| azure/gpt-35-turbo-0125 | $0.00000050 | $0.00000150 | 16,384 | 4096 |
| azure/gpt-35-turbo-16k | $0.00000300 | $0.00000400 | 16,385 | 4096 |
| azure/gpt-35-turbo | $0.00000150 | $0.00000200 | 4,097 | 4096 |
| azure/gpt-3.5-turbo-instruct-0914 | $0.00000150 | $0.00000200 | 4,097 | nan |
| azure/gpt-35-turbo-instruct | $0.00000150 | $0.00000200 | 4,097 | nan |
| azure/mistral-large-latest | $0.00000800 | $0.00002400 | 32,000 | nan |
| azure/mistral-large-2402 | $0.00000800 | $0.00002400 | 32,000 | nan |
| azure/command-r-plus | $0.00000300 | $0.00001500 | 128,000 | 4096 |
| azure/ada | $0.00000010 | $0.00000000 | 8,191 | nan |
| azure/text-embedding-ada-002 | $0.00000010 | $0.00000000 | 8,191 | nan |
| azure/text-embedding-3-large | $0.00000013 | $0.00000000 | 8,191 | nan |
| azure/text-embedding-3-small | $0.00000002 | $0.00000000 | 8,191 | nan |
| azure/standard/1024-x-1024/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/hd/1024-x-1024/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/standard/1024-x-1792/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/standard/1792-x-1024/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/hd/1024-x-1792/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/hd/1792-x-1024/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/standard/1024-x-1024/dall-e-2 | -- | $0.00000000 | nan | nan |
| babbage-002 | $0.00000040 | $0.00000040 | 16,384 | 4096 |
| davinci-002 | $0.00000200 | $0.00000200 | 16,384 | 4096 |
| gpt-3.5-turbo-instruct | $0.00000150 | $0.00000200 | 8,192 | 4096 |
| gpt-3.5-turbo-instruct-0914 | $0.00000150 | $0.00000200 | 8,192 | 4097 |
| claude-instant-1 | $0.00000163 | $0.00000551 | 100,000 | 8191 |
| mistral/mistral-tiny | $0.00000015 | $0.00000046 | 32,000 | 8191 |
| mistral/mistral-small | $0.00000200 | $0.00000600 | 32,000 | 8191 |
| mistral/mistral-small-latest | $0.00000200 | $0.00000600 | 32,000 | 8191 |
| mistral/mistral-medium | $0.00000270 | $0.00000810 | 32,000 | 8191 |
| mistral/mistral-medium-latest | $0.00000270 | $0.00000810 | 32,000 | 8191 |
| mistral/mistral-medium-2312 | $0.00000270 | $0.00000810 | 32,000 | 8191 |
| mistral/mistral-large-latest | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| mistral/mistral-large-2402 | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| mistral/open-mixtral-8x7b | $0.00000200 | $0.00000600 | 32,000 | 8191 |
| mistral/mistral-embed | $0.00000011 | -- | 8,192 | nan |
| deepseek-chat | $0.00000014 | $0.00000028 | 32,000 | 4096 |
| deepseek-coder | $0.00000014 | $0.00000028 | 16,000 | 4096 |
| groq/llama2-70b-4096 | $0.00000070 | $0.00000080 | 4,096 | 4096 |
| groq/llama3-8b-8192 | $0.00000010 | $0.00000010 | 8,192 | 8192 |
| groq/llama3-70b-8192 | $0.00000064 | $0.00000080 | 8,192 | 8192 |
| groq/mixtral-8x7b-32768 | $0.00000027 | $0.00000027 | 32,768 | 32768 |
| groq/gemma-7b-it | $0.00000010 | $0.00000010 | 8,192 | 8192 |
| claude-instant-1.2 | $0.00000163 | $0.00000551 | 100,000 | 8191 |
| claude-2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| claude-2.1 | $0.00000800 | $0.00002400 | 200,000 | 8191 |
| claude-3-haiku-20240307 | $0.00000025 | $0.00000125 | 200,000 | 4096 |
| claude-3-opus-20240229 | $0.00001500 | $0.00007500 | 200,000 | 4096 |
| claude-3-sonnet-20240229 | $0.00000300 | $0.00001500 | 200,000 | 4096 |
| text-bison | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| text-bison@001 | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| text-unicorn | $0.00001000 | $0.00002800 | 8,192 | 1024 |
| text-unicorn@001 | $0.00001000 | $0.00002800 | 8,192 | 1024 |
| chat-bison | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| chat-bison@001 | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| chat-bison@002 | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| chat-bison-32k | $0.00000012 | $0.00000012 | 32,000 | 8192 |
| code-bison | $0.00000012 | $0.00000012 | 6,144 | 1024 |
| code-bison@001 | $0.00000012 | $0.00000012 | 6,144 | 1024 |
| code-gecko@001 | $0.00000012 | $0.00000012 | 2,048 | 64 |
| code-gecko@002 | $0.00000012 | $0.00000012 | 2,048 | 64 |
| code-gecko | $0.00000012 | $0.00000012 | 2,048 | 64 |
| codechat-bison | $0.00000012 | $0.00000012 | 6,144 | 1024 |
| codechat-bison@001 | $0.00000012 | $0.00000012 | 6,144 | 1024 |
| codechat-bison-32k | $0.00000012 | $0.00000012 | 32,000 | 8192 |
| gemini-pro | $0.00000025 | $0.00000050 | 32,760 | 8192 |
| gemini-1.0-pro | $0.00000025 | $0.00000050 | 32,760 | 8192 |
| gemini-1.0-pro-001 | $0.00000025 | $0.00000050 | 32,760 | 8192 |
| gemini-1.0-pro-002 | $0.00000025 | $0.00000050 | 32,760 | 8192 |
| gemini-1.5-pro | $0.00000063 | $0.00000188 | 1,000,000 | 8192 |
| gemini-1.5-pro-preview-0215 | $0.00000063 | $0.00000188 | 1,000,000 | 8192 |
| gemini-1.5-pro-preview-0409 | $0.00000063 | $0.00000188 | 1,000,000 | 8192 |
| gemini-experimental | $0.00000000 | $0.00000000 | 1,000,000 | 8192 |
| gemini-pro-vision | $0.00000025 | $0.00000050 | 16,384 | 2048 |
| gemini-1.0-pro-vision | $0.00000025 | $0.00000050 | 16,384 | 2048 |
| gemini-1.0-pro-vision-001 | $0.00000025 | $0.00000050 | 16,384 | 2048 |
| vertex_ai/claude-3-sonnet@20240229 | $0.00000300 | $0.00001500 | 200,000 | 4096 |
| vertex_ai/claude-3-haiku@20240307 | $0.00000025 | $0.00000125 | 200,000 | 4096 |
| vertex_ai/claude-3-opus@20240229 | $0.00001500 | $0.00007500 | 200,000 | 4096 |
| textembedding-gecko | $0.00000001 | $0.00000000 | 3,072 | nan |
| textembedding-gecko-multilingual | $0.00000001 | $0.00000000 | 3,072 | nan |
| textembedding-gecko-multilingual@001 | $0.00000001 | $0.00000000 | 3,072 | nan |
| textembedding-gecko@001 | $0.00000001 | $0.00000000 | 3,072 | nan |
| textembedding-gecko@003 | $0.00000001 | $0.00000000 | 3,072 | nan |
| text-embedding-preview-0409 | $0.00000001 | $0.00000000 | 3,072 | nan |
| text-multilingual-embedding-preview-0409 | $0.00000001 | $0.00000000 | 3,072 | nan |
| palm/chat-bison | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| palm/chat-bison-001 | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| palm/text-bison | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| palm/text-bison-001 | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| palm/text-bison-safety-off | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| palm/text-bison-safety-recitation-off | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| gemini/gemini-pro | $0.00000000 | $0.00000000 | 32,760 | 8192 |
| gemini/gemini-1.5-pro | $0.00000000 | $0.00000000 | 1,000,000 | 8192 |
| gemini/gemini-1.5-pro-latest | $0.00000000 | $0.00000000 | 1,048,576 | 8192 |
| gemini/gemini-pro-vision | $0.00000000 | $0.00000000 | 30,720 | 2048 |
| command-r | $0.00000050 | $0.00000150 | 128,000 | 4096 |
| command-light | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| command-r-plus | $0.00000300 | $0.00001500 | 128,000 | 4096 |
| command-nightly | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| command | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| command-medium-beta | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| command-xlarge-beta | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| replicate/llama-2-70b-chat:2c1608e18606fad2812020dc541930f2d0495ce32eee50074220b87300bc16e1 | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| replicate/meta/llama-2-13b | $0.00000010 | $0.00000050 | 4,096 | 4096 |
| replicate/meta/llama-2-13b-chat | $0.00000010 | $0.00000050 | 4,096 | 4096 |
| replicate/meta/llama-2-70b | $0.00000065 | $0.00000275 | 4,096 | 4096 |
| replicate/meta/llama-2-70b-chat | $0.00000065 | $0.00000275 | 4,096 | 4096 |
| replicate/meta/llama-2-7b | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/meta/llama-2-7b-chat | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/meta/llama-3-70b | $0.00000065 | $0.00000275 | 4,096 | 4096 |
| replicate/meta/llama-3-70b-instruct | $0.00000065 | $0.00000275 | 4,096 | 4096 |
| replicate/meta/llama-3-8b | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/meta/llama-3-8b-instruct | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/mistralai/mistral-7b-v0.1 | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/mistralai/mistral-7b-instruct-v0.2 | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/mistralai/mixtral-8x7b-instruct-v0.1 | $0.00000030 | $0.00000100 | 4,096 | 4096 |
| openrouter/microsoft/wizardlm-2-8x22b:nitro | $0.00000100 | $0.00000100 | nan | nan |
| openrouter/google/gemini-pro-1.5 | $0.00000250 | $0.00000750 | 1,000,000 | 8192 |
| openrouter/mistralai/mixtral-8x22b-instruct | $0.00000065 | $0.00000065 | nan | nan |
| openrouter/cohere/command-r-plus | $0.00000300 | $0.00001500 | nan | nan |
| openrouter/databricks/dbrx-instruct | $0.00000060 | $0.00000060 | nan | nan |
| openrouter/anthropic/claude-3-haiku | $0.00000025 | $0.00000125 | nan | nan |
| openrouter/anthropic/claude-3-sonnet | $0.00000300 | $0.00001500 | nan | nan |
| openrouter/mistralai/mistral-large | $0.00000800 | $0.00002400 | nan | nan |
| openrouter/cognitivecomputations/dolphin-mixtral-8x7b | $0.00000050 | $0.00000050 | nan | nan |
| openrouter/google/gemini-pro-vision | $0.00000012 | $0.00000038 | nan | nan |
| openrouter/fireworks/firellava-13b | $0.00000020 | $0.00000020 | nan | nan |
| openrouter/meta-llama/llama-3-8b-instruct:free | $0.00000000 | $0.00000000 | nan | nan |
| openrouter/meta-llama/llama-3-8b-instruct:extended | $0.00000022 | $0.00000225 | nan | nan |
| openrouter/meta-llama/llama-3-70b-instruct:nitro | $0.00000090 | $0.00000090 | nan | nan |
| openrouter/meta-llama/llama-3-70b-instruct | $0.00000059 | $0.00000079 | nan | nan |
| openrouter/openai/gpt-4-vision-preview | $0.00001000 | $0.00003000 | nan | nan |
| openrouter/openai/gpt-3.5-turbo | $0.00000150 | $0.00000200 | nan | nan |
| openrouter/openai/gpt-3.5-turbo-16k | $0.00000300 | $0.00000400 | nan | nan |
| openrouter/openai/gpt-4 | $0.00003000 | $0.00006000 | nan | nan |
| openrouter/anthropic/claude-instant-v1 | $0.00000163 | $0.00000551 | nan | 8191 |
| openrouter/anthropic/claude-2 | $0.00001102 | $0.00003268 | nan | 8191 |
| openrouter/anthropic/claude-3-opus | $0.00001500 | $0.00007500 | 200,000 | 4096 |
| openrouter/google/palm-2-chat-bison | $0.00000050 | $0.00000050 | nan | nan |
| openrouter/google/palm-2-codechat-bison | $0.00000050 | $0.00000050 | nan | nan |
| openrouter/meta-llama/llama-2-13b-chat | $0.00000020 | $0.00000020 | nan | nan |
| openrouter/meta-llama/llama-2-70b-chat | $0.00000150 | $0.00000150 | nan | nan |
| openrouter/meta-llama/codellama-34b-instruct | $0.00000050 | $0.00000050 | nan | nan |
| openrouter/nousresearch/nous-hermes-llama2-13b | $0.00000020 | $0.00000020 | nan | nan |
| openrouter/mancer/weaver | $0.00000563 | $0.00000563 | nan | nan |
| openrouter/gryphe/mythomax-l2-13b | $0.00000188 | $0.00000188 | nan | nan |
| openrouter/jondurbin/airoboros-l2-70b-2.1 | $0.00001388 | $0.00001388 | nan | nan |
| openrouter/undi95/remm-slerp-l2-13b | $0.00000188 | $0.00000188 | nan | nan |
| openrouter/pygmalionai/mythalion-13b | $0.00000188 | $0.00000188 | nan | nan |
| openrouter/mistralai/mistral-7b-instruct | $0.00000013 | $0.00000013 | nan | nan |
| openrouter/mistralai/mistral-7b-instruct:free | $0.00000000 | $0.00000000 | nan | nan |
| j2-ultra | $0.00001500 | $0.00001500 | 8,192 | 8192 |
| j2-mid | $0.00001000 | $0.00001000 | 8,192 | 8192 |
| j2-light | $0.00000300 | $0.00000300 | 8,192 | 8192 |
| dolphin | $0.00000050 | $0.00000050 | 16,384 | 16384 |
| chatdolphin | $0.00000050 | $0.00000050 | 16,384 | 16384 |
| luminous-base | $0.00003000 | $0.00003300 | nan | nan |
| luminous-base-control | $0.00003750 | $0.00004125 | nan | nan |
| luminous-extended | $0.00004500 | $0.00004950 | nan | nan |
| luminous-extended-control | $0.00005625 | $0.00006187 | nan | nan |
| luminous-supreme | $0.00017500 | $0.00019250 | nan | nan |
| luminous-supreme-control | $0.00021875 | $0.00024063 | nan | nan |
| ai21.j2-mid-v1 | $0.00001250 | $0.00001250 | 8,191 | 8191 |
| ai21.j2-ultra-v1 | $0.00001880 | $0.00001880 | 8,191 | 8191 |
| amazon.titan-text-lite-v1 | $0.00000030 | $0.00000040 | 42,000 | 4000 |
| amazon.titan-text-express-v1 | $0.00000130 | $0.00000170 | 42,000 | 8000 |
| amazon.titan-embed-text-v1 | $0.00000010 | $0.00000000 | 8,192 | nan |
| amazon.titan-embed-text-v2:0 | $0.00000020 | $0.00000000 | 8,192 | nan |
| mistral.mistral-7b-instruct-v0:2 | $0.00000015 | $0.00000020 | 32,000 | 8191 |
| mistral.mixtral-8x7b-instruct-v0:1 | $0.00000045 | $0.00000070 | 32,000 | 8191 |
| mistral.mistral-large-2402-v1:0 | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 | $0.00000045 | $0.00000070 | 32,000 | 8191 |
| bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 | $0.00000045 | $0.00000070 | 32,000 | 8191 |
| bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 | $0.00000059 | $0.00000091 | 32,000 | 8191 |
| bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 | $0.00000015 | $0.00000020 | 32,000 | 8191 |
| bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 | $0.00000015 | $0.00000020 | 32,000 | 8191 |
| bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 | $0.00000020 | $0.00000026 | 32,000 | 8191 |
| bedrock/us-east-1/mistral.mistral-large-2402-v1:0 | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| bedrock/us-west-2/mistral.mistral-large-2402-v1:0 | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 | $0.00001040 | $0.00003120 | 32,000 | 8191 |
| anthropic.claude-3-sonnet-20240229-v1:0 | $0.00000300 | $0.00001500 | 200,000 | 4096 |
| anthropic.claude-3-haiku-20240307-v1:0 | $0.00000025 | $0.00000125 | 200,000 | 4096 |
| anthropic.claude-3-opus-20240229-v1:0 | $0.00001500 | $0.00007500 | 200,000 | 4096 |
| anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-east-1/anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-west-2/anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-east-1/anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-west-2/anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-east-1/anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-west-2/anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| anthropic.claude-instant-v1 | $0.00000163 | $0.00000551 | 100,000 | 8191 |
| bedrock/us-east-1/anthropic.claude-instant-v1 | $0.00000080 | $0.00000240 | 100,000 | 8191 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/anthropic.claude-instant-v1 | $0.00000080 | $0.00000240 | 100,000 | 8191 |
| bedrock/ap-northeast-1/anthropic.claude-instant-v1 | $0.00000223 | $0.00000755 | 100,000 | 8191 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/anthropic.claude-instant-v1 | $0.00000248 | $0.00000838 | 100,000 | 8191 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| cohere.command-text-v14 | $0.00000150 | $0.00000200 | 4,096 | 4096 |
| bedrock/*/1-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 |
| bedrock/*/6-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 |
| cohere.command-light-text-v14 | $0.00000030 | $0.00000060 | 4,096 | 4096 |
| bedrock/*/1-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 |
| bedrock/*/6-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 |
| cohere.command-r-plus-v1:0 | $0.00000300 | $0.00001500 | 128,000 | 4096 |
| cohere.command-r-v1:0 | $0.00000050 | $0.00000150 | 128,000 | 4096 |
| cohere.embed-english-v3 | $0.00000010 | $0.00000000 | 512 | nan |
| cohere.embed-multilingual-v3 | $0.00000010 | $0.00000000 | 512 | nan |
| meta.llama2-13b-chat-v1 | $0.00000075 | $0.00000100 | 4,096 | 4096 |
| meta.llama2-70b-chat-v1 | $0.00000195 | $0.00000256 | 4,096 | 4096 |
| meta.llama3-8b-instruct-v1:0 | $0.00000040 | $0.00000060 | 8,192 | 8192 |
| meta.llama3-70b-instruct-v1:0 | $0.00000265 | $0.00000350 | 8,192 | 8192 |
| 512-x-512/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan |
| 512-x-512/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan |
| max-x-max/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan |
| max-x-max/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan |
| 1024-x-1024/50-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan |
| 1024-x-1024/max-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan |
| sagemaker/meta-textgeneration-llama-2-7b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-7b-f | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-13b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-13b-f | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-70b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-70b-b-f | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| together-ai-up-to-3b | $0.00000010 | $0.00000010 | nan | nan |
| together-ai-3.1b-7b | $0.00000020 | $0.00000020 | nan | nan |
| together-ai-7.1b-20b | $0.00000040 | $0.00000040 | nan | nan |
| together-ai-20.1b-40b | $0.00000080 | $0.00000080 | nan | nan |
| together-ai-40.1b-70b | $0.00000090 | $0.00000090 | nan | nan |
| together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.00000060 | $0.00000060 | nan | nan |
| together_ai/mistralai/Mistral-7B-Instruct-v0.1 | -- | -- | nan | nan |
| together_ai/togethercomputer/CodeLlama-34b-Instruct | -- | -- | nan | nan |
| ollama/llama2 | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/llama2:13b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/llama2:70b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/llama2-uncensored | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/mistral | $0.00000000 | $0.00000000 | 8,192 | 8192 |
| ollama/codellama | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/orca-mini | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/vicuna | $0.00000000 | $0.00000000 | 2,048 | 2048 |
| deepinfra/lizpreciatior/lzlv_70b_fp16_hf | $0.00000070 | $0.00000090 | 4,096 | 4096 |
| deepinfra/Gryphe/MythoMax-L2-13b | $0.00000022 | $0.00000022 | 4,096 | 4096 |
| deepinfra/mistralai/Mistral-7B-Instruct-v0.1 | $0.00000013 | $0.00000013 | 32,768 | 8191 |
| deepinfra/meta-llama/Llama-2-70b-chat-hf | $0.00000070 | $0.00000090 | 4,096 | 4096 |
| deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b | $0.00000027 | $0.00000027 | 32,768 | 8191 |
| deepinfra/codellama/CodeLlama-34b-Instruct-hf | $0.00000060 | $0.00000060 | 4,096 | 4096 |
| deepinfra/deepinfra/mixtral | $0.00000027 | $0.00000027 | 32,000 | 4096 |
| deepinfra/Phind/Phind-CodeLlama-34B-v2 | $0.00000060 | $0.00000060 | 16,384 | 4096 |
| deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.00000027 | $0.00000027 | 32,768 | 8191 |
| deepinfra/deepinfra/airoboros-70b | $0.00000070 | $0.00000090 | 4,096 | 4096 |
| deepinfra/01-ai/Yi-34B-Chat | $0.00000060 | $0.00000060 | 4,096 | 4096 |
| deepinfra/01-ai/Yi-6B-200K | $0.00000013 | $0.00000013 | 200,000 | 4096 |
| deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1 | $0.00000070 | $0.00000090 | 4,096 | 4096 |
| deepinfra/meta-llama/Llama-2-13b-chat-hf | $0.00000022 | $0.00000022 | 4,096 | 4096 |
| deepinfra/amazon/MistralLite | $0.00000020 | $0.00000020 | 32,768 | 8191 |
| deepinfra/meta-llama/Llama-2-7b-chat-hf | $0.00000013 | $0.00000013 | 4,096 | 4096 |
| deepinfra/01-ai/Yi-34B-200K | $0.00000060 | $0.00000060 | 200,000 | 4096 |
| deepinfra/openchat/openchat_3.5 | $0.00000013 | $0.00000013 | 4,096 | 4096 |
| perplexity/codellama-34b-instruct | $0.00000035 | $0.00000140 | 16,384 | 16384 |
| perplexity/codellama-70b-instruct | $0.00000070 | $0.00000280 | 16,384 | 16384 |
| perplexity/pplx-7b-chat | $0.00000007 | $0.00000028 | 8,192 | 8192 |
| perplexity/pplx-70b-chat | $0.00000070 | $0.00000280 | 4,096 | 4096 |
| perplexity/pplx-7b-online | $0.00000000 | $0.00000028 | 4,096 | 4096 |
| perplexity/pplx-70b-online | $0.00000000 | $0.00000280 | 4,096 | 4096 |
| perplexity/llama-2-70b-chat | $0.00000070 | $0.00000280 | 4,096 | 4096 |
| perplexity/mistral-7b-instruct | $0.00000007 | $0.00000028 | 4,096 | 4096 |
| perplexity/mixtral-8x7b-instruct | $0.00000007 | $0.00000028 | 4,096 | 4096 |
| perplexity/sonar-small-chat | $0.00000007 | $0.00000028 | 16,384 | 16384 |
| perplexity/sonar-small-online | $0.00000000 | $0.00000028 | 12,000 | 12000 |
| perplexity/sonar-medium-chat | $0.00000060 | $0.00000180 | 16,384 | 16384 |
| perplexity/sonar-medium-online | $0.00000000 | $0.00000180 | 12,000 | 12000 |
| anyscale/mistralai/Mistral-7B-Instruct-v0.1 | $0.00000015 | $0.00000015 | 16,384 | 16384 |
| anyscale/Mixtral-8x7B-Instruct-v0.1 | $0.00000015 | $0.00000015 | 16,384 | 16384 |
| anyscale/HuggingFaceH4/zephyr-7b-beta | $0.00000015 | $0.00000015 | 16,384 | 16384 |
| anyscale/meta-llama/Llama-2-7b-chat-hf | $0.00000015 | $0.00000015 | 4,096 | 4096 |
| anyscale/meta-llama/Llama-2-13b-chat-hf | $0.00000025 | $0.00000025 | 4,096 | 4096 |
| anyscale/meta-llama/Llama-2-70b-chat-hf | $0.00000100 | $0.00000100 | 4,096 | 4096 |
| anyscale/codellama/CodeLlama-34b-Instruct-hf | $0.00000100 | $0.00000100 | 4,096 | 4096 |
| cloudflare/@cf/meta/llama-2-7b-chat-fp16 | $0.00000192 | $0.00000192 | 3,072 | 3072 |
| cloudflare/@cf/meta/llama-2-7b-chat-int8 | $0.00000192 | $0.00000192 | 2,048 | 2048 |
| cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 | $0.00000192 | $0.00000192 | 8,192 | 8192 |
| cloudflare/@hf/thebloke/codellama-7b-instruct-awq | $0.00000192 | $0.00000192 | 4,096 | 4096 |
| voyage/voyage-01 | $0.00000010 | $0.00000000 | 4,096 | nan |
| voyage/voyage-lite-01 | $0.00000010 | $0.00000000 | 4,096 | nan |
| voyage/voyage-large-2 | $0.00000012 | $0.00000000 | 16,000 | nan |
| voyage/voyage-law-2 | $0.00000012 | $0.00000000 | 16,000 | nan |
| voyage/voyage-code-2 | $0.00000012 | $0.00000000 | 16,000 | nan |
| voyage/voyage-2 | $0.00000010 | $0.00000000 | 4,000 | nan |
| voyage/voyage-lite-02-instruct | $0.00000010 | $0.00000000 | 4,000 | nan |

### Callback handlers

You may also calculate token costs in LLM wrapper/framework libraries using callbacks.

View File

@@ -1,378 +1,379 @@
| | max_tokens | max_input_tokens | input_cost_per_token | output_cost_per_token |
|:--------------------------------------------------------------------------------------------|:-------------|:-------------------|:-----------------------|:------------------------|
| gpt-4 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| gpt-4o | 4,096 | 128,000 | $0.00000500 | $0.00001500 |
| gpt-4o-2024-05-13 | 4,096 | 128,000 | $0.00000500 | $0.00001500 |
| gpt-4-turbo-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-0314 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| gpt-4-0613 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| gpt-4-32k | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| gpt-4-32k-0314 | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| gpt-4-32k-0613 | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| gpt-4-turbo | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-turbo-2024-04-09 | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-1106-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-0125-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-vision-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-4-1106-vision-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| gpt-3.5-turbo | 4,097 | 16,385 | $0.00000150 | $0.00000200 |
| gpt-3.5-turbo-0301 | 4,097 | 4,097 | $0.00000150 | $0.00000200 |
| gpt-3.5-turbo-0613 | 4,097 | 4,097 | $0.00000150 | $0.00000200 |
| gpt-3.5-turbo-1106 | 16,385 | 16,385 | $0.00000100 | $0.00000200 |
| gpt-3.5-turbo-0125 | 16,385 | 16,385 | $0.00000050 | $0.00000150 |
| gpt-3.5-turbo-16k | 16,385 | 16,385 | $0.00000300 | $0.00000400 |
| gpt-3.5-turbo-16k-0613 | 16,385 | 16,385 | $0.00000300 | $0.00000400 |
| ft:gpt-3.5-turbo | 4,097 | 4,097 | $0.00000300 | $0.00000600 |
| text-embedding-3-large | 8,191 | 8,191 | $0.00000013 | $0.00000000 |
| text-embedding-3-small | 8,191 | 8,191 | $0.00000002 | $0.00000000 |
| text-embedding-ada-002 | 8,191 | 8,191 | $0.00000010 | $0.00000000 |
| text-embedding-ada-002-v2 | 8,191 | 8,191 | $0.00000010 | $0.00000000 |
| text-moderation-stable | 32,768 | 32,768 | $0.00000000 | $0.00000000 |
| text-moderation-007 | 32,768 | 32,768 | $0.00000000 | $0.00000000 |
| text-moderation-latest | 32,768 | 32,768 | $0.00000000 | $0.00000000 |
| 256-x-256/dall-e-2 | nan | nan | -- | -- |
| 512-x-512/dall-e-2 | nan | nan | -- | -- |
| 1024-x-1024/dall-e-2 | nan | nan | -- | -- |
| hd/1024-x-1792/dall-e-3 | nan | nan | -- | -- |
| hd/1792-x-1024/dall-e-3 | nan | nan | -- | -- |
| hd/1024-x-1024/dall-e-3 | nan | nan | -- | -- |
| standard/1024-x-1792/dall-e-3 | nan | nan | -- | -- |
| standard/1792-x-1024/dall-e-3 | nan | nan | -- | -- |
| standard/1024-x-1024/dall-e-3 | nan | nan | -- | -- |
| whisper-1 | nan | nan | -- | -- |
| azure/whisper-1 | nan | nan | -- | -- |
| azure/gpt-4-turbo-2024-04-09 | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-4-0125-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-4-1106-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-4-0613 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| azure/gpt-4-32k-0613 | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| azure/gpt-4-32k | 4,096 | 32,768 | $0.00006000 | $0.00012000 |
| azure/gpt-4 | 4,096 | 8,192 | $0.00003000 | $0.00006000 |
| azure/gpt-4-turbo | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-4-turbo-vision-preview | 4,096 | 128,000 | $0.00001000 | $0.00003000 |
| azure/gpt-35-turbo-16k-0613 | 4,096 | 16,385 | $0.00000300 | $0.00000400 |
| azure/gpt-35-turbo-1106 | 4,096 | 16,384 | $0.00000150 | $0.00000200 |
| azure/gpt-35-turbo-0125 | 4,096 | 16,384 | $0.00000050 | $0.00000150 |
| azure/gpt-35-turbo-16k | 4,096 | 16,385 | $0.00000300 | $0.00000400 |
| azure/gpt-35-turbo | 4,096 | 4,097 | $0.00000150 | $0.00000200 |
| azure/gpt-3.5-turbo-instruct-0914 | 4,097 | 4,097 | $0.00000150 | $0.00000200 |
| azure/gpt-35-turbo-instruct | 4,097 | 4,097 | $0.00000150 | $0.00000200 |
| azure/mistral-large-latest | 32,000 | 32,000 | $0.00000800 | $0.00002400 |
| azure/mistral-large-2402 | 32,000 | 32,000 | $0.00000800 | $0.00002400 |
| azure/command-r-plus | 4,096 | 128,000 | $0.00000300 | $0.00001500 |
| azure/ada | 8,191 | 8,191 | $0.00000010 | $0.00000000 |
| azure/text-embedding-ada-002 | 8,191 | 8,191 | $0.00000010 | $0.00000000 |
| azure/text-embedding-3-large | 8,191 | 8,191 | $0.00000013 | $0.00000000 |
| azure/text-embedding-3-small | 8,191 | 8,191 | $0.00000002 | $0.00000000 |
| azure/standard/1024-x-1024/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/hd/1024-x-1024/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/standard/1024-x-1792/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/standard/1792-x-1024/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/hd/1024-x-1792/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/hd/1792-x-1024/dall-e-3 | nan | nan | -- | $0.00000000 |
| azure/standard/1024-x-1024/dall-e-2 | nan | nan | -- | $0.00000000 |
| babbage-002 | 16,384 | 16,384 | $0.00000040 | $0.00000040 |
| davinci-002 | 16,384 | 16,384 | $0.00000200 | $0.00000200 |
| gpt-3.5-turbo-instruct | 4,096 | 8,192 | $0.00000150 | $0.00000200 |
| gpt-3.5-turbo-instruct-0914 | 4,097 | 8,192 | $0.00000150 | $0.00000200 |
| claude-instant-1 | 8,191 | 100,000 | $0.00000163 | $0.00000551 |
| mistral/mistral-tiny | 8,191 | 32,000 | $0.00000015 | $0.00000046 |
| mistral/mistral-small | 8,191 | 32,000 | $0.00000200 | $0.00000600 |
| mistral/mistral-small-latest | 8,191 | 32,000 | $0.00000200 | $0.00000600 |
| mistral/mistral-medium | 8,191 | 32,000 | $0.00000270 | $0.00000810 |
| mistral/mistral-medium-latest | 8,191 | 32,000 | $0.00000270 | $0.00000810 |
| mistral/mistral-medium-2312 | 8,191 | 32,000 | $0.00000270 | $0.00000810 |
| mistral/mistral-large-latest | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| mistral/mistral-large-2402 | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| mistral/open-mixtral-8x7b | 8,191 | 32,000 | $0.00000200 | $0.00000600 |
| mistral/mistral-embed | 8,192 | 8,192 | $0.00000011 | -- |
| deepseek-chat | 4,096 | 32,000 | $0.00000014 | $0.00000028 |
| deepseek-coder | 4,096 | 16,000 | $0.00000014 | $0.00000028 |
| groq/llama2-70b-4096 | 4,096 | 4,096 | $0.00000070 | $0.00000080 |
| groq/llama3-8b-8192 | 8,192 | 8,192 | $0.00000010 | $0.00000010 |
| groq/llama3-70b-8192 | 8,192 | 8,192 | $0.00000064 | $0.00000080 |
| groq/mixtral-8x7b-32768 | 32,768 | 32,768 | $0.00000027 | $0.00000027 |
| groq/gemma-7b-it | 8,192 | 8,192 | $0.00000010 | $0.00000010 |
| claude-instant-1.2 | 8,191 | 100,000 | $0.00000016 | $0.00000055 |
| claude-2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| claude-2.1 | 8,191 | 200,000 | $0.00000800 | $0.00002400 |
| claude-3-haiku-20240307 | 4,096 | 200,000 | $0.00000025 | $0.00000125 |
| claude-3-opus-20240229 | 4,096 | 200,000 | $0.00001500 | $0.00007500 |
| claude-3-sonnet-20240229 | 4,096 | 200,000 | $0.00000300 | $0.00001500 |
| text-bison | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| text-bison@001 | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| text-unicorn | 1,024 | 8,192 | $0.00001000 | $0.00002800 |
| text-unicorn@001 | 1,024 | 8,192 | $0.00001000 | $0.00002800 |
| chat-bison | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| chat-bison@001 | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| chat-bison@002 | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| chat-bison-32k | 8,192 | 32,000 | $0.00000012 | $0.00000012 |
| code-bison | 1,024 | 6,144 | $0.00000012 | $0.00000012 |
| code-bison@001 | 1,024 | 6,144 | $0.00000012 | $0.00000012 |
| code-gecko@001 | 64 | 2,048 | $0.00000012 | $0.00000012 |
| code-gecko@002 | 64 | 2,048 | $0.00000012 | $0.00000012 |
| code-gecko | 64 | 2,048 | $0.00000012 | $0.00000012 |
| codechat-bison | 1,024 | 6,144 | $0.00000012 | $0.00000012 |
| codechat-bison@001 | 1,024 | 6,144 | $0.00000012 | $0.00000012 |
| codechat-bison-32k | 8,192 | 32,000 | $0.00000012 | $0.00000012 |
| gemini-pro | 8,192 | 32,760 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro | 8,192 | 32,760 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro-001 | 8,192 | 32,760 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro-002 | 8,192 | 32,760 | $0.00000025 | $0.00000050 |
| gemini-1.5-pro | 8,192 | 1,000,000 | $0.00000063 | $0.00000188 |
| gemini-1.5-pro-preview-0215 | 8,192 | 1,000,000 | $0.00000063 | $0.00000188 |
| gemini-1.5-pro-preview-0409 | 8,192 | 1,000,000 | $0.00000063 | $0.00000188 |
| gemini-experimental | 8,192 | 1,000,000 | $0.00000000 | $0.00000000 |
| gemini-pro-vision | 2,048 | 16,384 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro-vision | 2,048 | 16,384 | $0.00000025 | $0.00000050 |
| gemini-1.0-pro-vision-001 | 2,048 | 16,384 | $0.00000025 | $0.00000050 |
| vertex_ai/claude-3-sonnet@20240229 | 4,096 | 200,000 | $0.00000300 | $0.00001500 |
| vertex_ai/claude-3-haiku@20240307 | 4,096 | 200,000 | $0.00000025 | $0.00000125 |
| vertex_ai/claude-3-opus@20240229 | 4,096 | 200,000 | $0.00001500 | $0.00007500 |
| textembedding-gecko | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| textembedding-gecko-multilingual | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| textembedding-gecko-multilingual@001 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| textembedding-gecko@001 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| textembedding-gecko@003 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| text-embedding-preview-0409 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| text-multilingual-embedding-preview-0409 | 3,072 | 3,072 | $0.00000001 | $0.00000000 |
| palm/chat-bison | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| palm/chat-bison-001 | 4,096 | 8,192 | $0.00000012 | $0.00000012 |
| palm/text-bison | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| palm/text-bison-001 | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| palm/text-bison-safety-off | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| palm/text-bison-safety-recitation-off | 1,024 | 8,192 | $0.00000012 | $0.00000012 |
| gemini/gemini-pro | 8,192 | 32,760 | $0.00000000 | $0.00000000 |
| gemini/gemini-1.5-pro | 8,192 | 1,000,000 | $0.00000000 | $0.00000000 |
| gemini/gemini-1.5-pro-latest | 8,192 | 1,048,576 | $0.00000000 | $0.00000000 |
| gemini/gemini-pro-vision | 2,048 | 30,720 | $0.00000000 | $0.00000000 |
| command-r | 4,096 | 128,000 | $0.00000050 | $0.00000150 |
| command-light | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| command-r-plus | 4,096 | 128,000 | $0.00000300 | $0.00001500 |
| command-nightly | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| command | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| command-medium-beta | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| command-xlarge-beta | 4,096 | 4,096 | $0.00001500 | $0.00001500 |
| replicate/meta/llama-2-13b | 4,096 | 4,096 | $0.00000010 | $0.00000050 |
| replicate/meta/llama-2-13b-chat | 4,096 | 4,096 | $0.00000010 | $0.00000050 |
| replicate/meta/llama-2-70b | 4,096 | 4,096 | $0.00000065 | $0.00000275 |
| replicate/meta/llama-2-70b-chat | 4,096 | 4,096 | $0.00000065 | $0.00000275 |
| replicate/meta/llama-2-7b | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/meta/llama-2-7b-chat | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/meta/llama-3-70b | 4,096 | 4,096 | $0.00000065 | $0.00000275 |
| replicate/meta/llama-3-70b-instruct | 4,096 | 4,096 | $0.00000065 | $0.00000275 |
| replicate/meta/llama-3-8b | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/meta/llama-3-8b-instruct | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/mistralai/mistral-7b-v0.1 | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/mistralai/mistral-7b-instruct-v0.2 | 4,096 | 4,096 | $0.00000005 | $0.00000025 |
| replicate/mistralai/mixtral-8x7b-instruct-v0.1 | 4,096 | 4,096 | $0.00000030 | $0.00000100 |
| openrouter/microsoft/wizardlm-2-8x22b:nitro | 65,536 | nan | $0.00000100 | $0.00000100 |
| openrouter/google/gemini-pro-1.5 | 8,192 | 1,000,000 | $0.00000250 | $0.00000750 |
| openrouter/mistralai/mixtral-8x22b-instruct | 65,536 | nan | $0.00000065 | $0.00000065 |
| openrouter/cohere/command-r-plus | 128,000 | nan | $0.00000300 | $0.00001500 |
| openrouter/databricks/dbrx-instruct | 32,768 | nan | $0.00000060 | $0.00000060 |
| openrouter/anthropic/claude-3-haiku | 200,000 | nan | $0.00000025 | $0.00000125 |
| openrouter/anthropic/claude-3-sonnet | 200,000 | nan | $0.00000300 | $0.00001500 |
| openrouter/mistralai/mistral-large | 32,000 | nan | $0.00000800 | $0.00002400 |
| openrouter/cognitivecomputations/dolphin-mixtral-8x7b | 32,769 | nan | $0.00000050 | $0.00000050 |
| openrouter/google/gemini-pro-vision | 45,875 | nan | $0.00000012 | $0.00000038 |
| openrouter/fireworks/firellava-13b | 4,096 | nan | $0.00000020 | $0.00000020 |
| openrouter/meta-llama/llama-3-8b-instruct:free | 8,192 | nan | $0.00000000 | $0.00000000 |
| openrouter/meta-llama/llama-3-8b-instruct:extended | 16,384 | nan | $0.00000022 | $0.00000225 |
| openrouter/meta-llama/llama-3-70b-instruct:nitro | 8,192 | nan | $0.00000090 | $0.00000090 |
| openrouter/meta-llama/llama-3-70b-instruct | 8,192 | nan | $0.00000059 | $0.00000079 |
| openrouter/openai/gpt-4-vision-preview | 130,000 | nan | $0.00001000 | $0.00003000 |
| openrouter/openai/gpt-3.5-turbo | 4,095 | nan | $0.00000150 | $0.00000200 |
| openrouter/openai/gpt-3.5-turbo-16k | 16,383 | nan | $0.00000300 | $0.00000400 |
| openrouter/openai/gpt-4 | 8,192 | nan | $0.00003000 | $0.00006000 |
| openrouter/anthropic/claude-instant-v1 | 100,000 | nan | $0.00000163 | $0.00000551 |
| openrouter/anthropic/claude-2 | 100,000 | nan | $0.00001102 | $0.00003268 |
| openrouter/anthropic/claude-3-opus | 4,096 | 200,000 | $0.00001500 | $0.00007500 |
| openrouter/google/palm-2-chat-bison | 25,804 | nan | $0.00000050 | $0.00000050 |
| openrouter/google/palm-2-codechat-bison | 20,070 | nan | $0.00000050 | $0.00000050 |
| openrouter/meta-llama/llama-2-13b-chat | 4,096 | nan | $0.00000020 | $0.00000020 |
| openrouter/meta-llama/llama-2-70b-chat | 4,096 | nan | $0.00000150 | $0.00000150 |
| openrouter/meta-llama/codellama-34b-instruct | 8,096 | nan | $0.00000050 | $0.00000050 |
| openrouter/nousresearch/nous-hermes-llama2-13b | 4,096 | nan | $0.00000020 | $0.00000020 |
| openrouter/mancer/weaver | 8,000 | nan | $0.00000563 | $0.00000563 |
| openrouter/gryphe/mythomax-l2-13b | 8,192 | nan | $0.00000188 | $0.00000188 |
| openrouter/jondurbin/airoboros-l2-70b-2.1 | 4,096 | nan | $0.00001388 | $0.00001388 |
| openrouter/undi95/remm-slerp-l2-13b | 6,144 | nan | $0.00000188 | $0.00000188 |
| openrouter/pygmalionai/mythalion-13b | 4,096 | nan | $0.00000188 | $0.00000188 |
| openrouter/mistralai/mistral-7b-instruct | 8,192 | nan | $0.00000013 | $0.00000013 |
| openrouter/mistralai/mistral-7b-instruct:free | 8,192 | nan | $0.00000000 | $0.00000000 |
| j2-ultra | 8,192 | 8,192 | $0.00001500 | $0.00001500 |
| j2-mid | 8,192 | 8,192 | $0.00001000 | $0.00001000 |
| j2-light | 8,192 | 8,192 | $0.00000300 | $0.00000300 |
| dolphin | 16,384 | 16,384 | $0.00000050 | $0.00000050 |
| chatdolphin | 16,384 | 16,384 | $0.00000050 | $0.00000050 |
| luminous-base | 2,048 | nan | $0.00003000 | $0.00003300 |
| luminous-base-control | 2,048 | nan | $0.00003750 | $0.00004125 |
| luminous-extended | 2,048 | nan | $0.00004500 | $0.00004950 |
| luminous-extended-control | 2,048 | nan | $0.00005625 | $0.00006187 |
| luminous-supreme | 2,048 | nan | $0.00017500 | $0.00019250 |
| luminous-supreme-control | 2,048 | nan | $0.00021875 | $0.00024063 |
| ai21.j2-mid-v1 | 8,191 | 8,191 | $0.00001250 | $0.00001250 |
| ai21.j2-ultra-v1 | 8,191 | 8,191 | $0.00001880 | $0.00001880 |
| amazon.titan-text-lite-v1 | 4,000 | 42,000 | $0.00000030 | $0.00000040 |
| amazon.titan-text-express-v1 | 8,000 | 42,000 | $0.00000130 | $0.00000170 |
| amazon.titan-embed-text-v1 | 8,192 | 8,192 | $0.00000010 | $0.00000000 |
| amazon.titan-embed-text-v2:0 | 8,192 | 8,192 | $0.00000020 | $0.00000000 |
| mistral.mistral-7b-instruct-v0:2 | 8,191 | 32,000 | $0.00000015 | $0.00000020 |
| mistral.mixtral-8x7b-instruct-v0:1 | 8,191 | 32,000 | $0.00000045 | $0.00000070 |
| mistral.mistral-large-2402-v1:0 | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 | 8,191 | 32,000 | $0.00000045 | $0.00000070 |
| bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 | 8,191 | 32,000 | $0.00000045 | $0.00000070 |
| bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 | 8,191 | 32,000 | $0.00000059 | $0.00000091 |
| bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 | 8,191 | 32,000 | $0.00000015 | $0.00000020 |
| bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 | 8,191 | 32,000 | $0.00000015 | $0.00000020 |
| bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 | 8,191 | 32,000 | $0.00000020 | $0.00000026 |
| bedrock/us-east-1/mistral.mistral-large-2402-v1:0 | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/mistral.mistral-large-2402-v1:0 | 8,191 | 32,000 | $0.00000800 | $0.00002400 |
| bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 | 8,191 | 32,000 | $0.00001040 | $0.00003120 |
| anthropic.claude-3-sonnet-20240229-v1:0 | 4,096 | 200,000 | $0.00000300 | $0.00001500 |
| anthropic.claude-3-haiku-20240307-v1:0 | 4,096 | 200,000 | $0.00000025 | $0.00000125 |
| anthropic.claude-3-opus-20240229-v1:0 | 4,096 | 200,000 | $0.00001500 | $0.00007500 |
| anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-east-1/anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/anthropic.claude-v1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v1 | 8,191 | 100,000 | -- | -- |
| anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-east-1/anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/anthropic.claude-v2 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2 | 8,191 | 100,000 | -- | -- |
| anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-east-1/anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/us-west-2/anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/anthropic.claude-v2:1 | 8,191 | 100,000 | $0.00000800 | $0.00002400 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1 | 8,191 | 100,000 | -- | -- |
| anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000163 | $0.00000551 |
| bedrock/us-east-1/anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000080 | $0.00000240 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/us-west-2/anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000080 | $0.00000240 |
| bedrock/ap-northeast-1/anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000223 | $0.00000755 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/anthropic.claude-instant-v1 | 8,191 | 100,000 | $0.00000248 | $0.00000838 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1 | 8,191 | 100,000 | -- | -- |
| cohere.command-text-v14 | 4,096 | 4,096 | $0.00000150 | $0.00000200 |
| bedrock/*/1-month-commitment/cohere.command-text-v14 | 4,096 | 4,096 | -- | -- |
| bedrock/*/6-month-commitment/cohere.command-text-v14 | 4,096 | 4,096 | -- | -- |
| cohere.command-light-text-v14 | 4,096 | 4,096 | $0.00000030 | $0.00000060 |
| bedrock/*/1-month-commitment/cohere.command-light-text-v14 | 4,096 | 4,096 | -- | -- |
| bedrock/*/6-month-commitment/cohere.command-light-text-v14 | 4,096 | 4,096 | -- | -- |
| cohere.command-r-plus-v1:0 | 4,096 | 128,000 | $0.00000300 | $0.00001500 |
| cohere.command-r-v1:0 | 4,096 | 128,000 | $0.00000050 | $0.00000150 |
| cohere.embed-english-v3 | 512 | 512 | $0.00000010 | $0.00000000 |
| cohere.embed-multilingual-v3 | 512 | 512 | $0.00000010 | $0.00000000 |
| meta.llama2-13b-chat-v1 | 4,096 | 4,096 | $0.00000075 | $0.00000100 |
| meta.llama2-70b-chat-v1 | 4,096 | 4,096 | $0.00000195 | $0.00000256 |
| meta.llama3-8b-instruct-v1:0 | 8,192 | 8,192 | $0.00000040 | $0.00000060 |
| meta.llama3-70b-instruct-v1:0 | 8,192 | 8,192 | $0.00000265 | $0.00000350 |
| 512-x-512/50-steps/stability.stable-diffusion-xl-v0 | 77 | 77 | -- | -- |
| 512-x-512/max-steps/stability.stable-diffusion-xl-v0 | 77 | 77 | -- | -- |
| max-x-max/50-steps/stability.stable-diffusion-xl-v0 | 77 | 77 | -- | -- |
| max-x-max/max-steps/stability.stable-diffusion-xl-v0 | 77 | 77 | -- | -- |
| 1024-x-1024/50-steps/stability.stable-diffusion-xl-v1 | 77 | 77 | -- | -- |
| 1024-x-1024/max-steps/stability.stable-diffusion-xl-v1 | 77 | 77 | -- | -- |
| sagemaker/meta-textgeneration-llama-2-7b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-7b-f | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-13b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-13b-f | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-70b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| sagemaker/meta-textgeneration-llama-2-70b-b-f | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| together-ai-up-to-3b | nan | nan | $0.00000010 | $0.00000010 |
| together-ai-3.1b-7b | nan | nan | $0.00000020 | $0.00000020 |
| together-ai-7.1b-20b | 1,000 | nan | $0.00000040 | $0.00000040 |
| together-ai-20.1b-40b | nan | nan | $0.00000080 | $0.00000080 |
| together-ai-40.1b-70b | nan | nan | $0.00000090 | $0.00000090 |
| together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 | nan | nan | $0.00000060 | $0.00000060 |
| together_ai/mistralai/Mistral-7B-Instruct-v0.1 | nan | nan | -- | -- |
| together_ai/togethercomputer/CodeLlama-34b-Instruct | nan | nan | -- | -- |
| ollama/llama2 | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/llama2:13b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/llama2:70b | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/llama2-uncensored | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/mistral | 8,192 | 8,192 | $0.00000000 | $0.00000000 |
| ollama/codellama | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/orca-mini | 4,096 | 4,096 | $0.00000000 | $0.00000000 |
| ollama/vicuna | 2,048 | 2,048 | $0.00000000 | $0.00000000 |
| deepinfra/lizpreciatior/lzlv_70b_fp16_hf | 4,096 | 4,096 | $0.00000070 | $0.00000090 |
| deepinfra/Gryphe/MythoMax-L2-13b | 4,096 | 4,096 | $0.00000022 | $0.00000022 |
| deepinfra/mistralai/Mistral-7B-Instruct-v0.1 | 8,191 | 32,768 | $0.00000013 | $0.00000013 |
| deepinfra/meta-llama/Llama-2-70b-chat-hf | 4,096 | 4,096 | $0.00000070 | $0.00000090 |
| deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b | 8,191 | 32,768 | $0.00000027 | $0.00000027 |
| deepinfra/codellama/CodeLlama-34b-Instruct-hf | 4,096 | 4,096 | $0.00000060 | $0.00000060 |
| deepinfra/deepinfra/mixtral | 4,096 | 32,000 | $0.00000027 | $0.00000027 |
| deepinfra/Phind/Phind-CodeLlama-34B-v2 | 4,096 | 16,384 | $0.00000060 | $0.00000060 |
| deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 | 8,191 | 32,768 | $0.00000027 | $0.00000027 |
| deepinfra/deepinfra/airoboros-70b | 4,096 | 4,096 | $0.00000070 | $0.00000090 |
| deepinfra/01-ai/Yi-34B-Chat | 4,096 | 4,096 | $0.00000060 | $0.00000060 |
| deepinfra/01-ai/Yi-6B-200K | 4,096 | 200,000 | $0.00000013 | $0.00000013 |
| deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1 | 4,096 | 4,096 | $0.00000070 | $0.00000090 |
| deepinfra/meta-llama/Llama-2-13b-chat-hf | 4,096 | 4,096 | $0.00000022 | $0.00000022 |
| deepinfra/amazon/MistralLite | 8,191 | 32,768 | $0.00000020 | $0.00000020 |
| deepinfra/meta-llama/Llama-2-7b-chat-hf | 4,096 | 4,096 | $0.00000013 | $0.00000013 |
| deepinfra/01-ai/Yi-34B-200K | 4,096 | 200,000 | $0.00000060 | $0.00000060 |
| deepinfra/openchat/openchat_3.5 | 4,096 | 4,096 | $0.00000013 | $0.00000013 |
| perplexity/codellama-34b-instruct | 16,384 | 16,384 | $0.00000035 | $0.00000140 |
| perplexity/codellama-70b-instruct | 16,384 | 16,384 | $0.00000070 | $0.00000280 |
| perplexity/pplx-7b-chat | 8,192 | 8,192 | $0.00000007 | $0.00000028 |
| perplexity/pplx-70b-chat | 4,096 | 4,096 | $0.00000070 | $0.00000280 |
| perplexity/pplx-7b-online | 4,096 | 4,096 | $0.00000000 | $0.00000028 |
| perplexity/pplx-70b-online | 4,096 | 4,096 | $0.00000000 | $0.00000280 |
| perplexity/llama-2-70b-chat | 4,096 | 4,096 | $0.00000070 | $0.00000280 |
| perplexity/mistral-7b-instruct | 4,096 | 4,096 | $0.00000007 | $0.00000028 |
| perplexity/mixtral-8x7b-instruct | 4,096 | 4,096 | $0.00000007 | $0.00000028 |
| perplexity/sonar-small-chat | 16,384 | 16,384 | $0.00000007 | $0.00000028 |
| perplexity/sonar-small-online | 12,000 | 12,000 | $0.00000000 | $0.00000028 |
| perplexity/sonar-medium-chat | 16,384 | 16,384 | $0.00000060 | $0.00000180 |
| perplexity/sonar-medium-online | 12,000 | 12,000 | $0.00000000 | $0.00000180 |
| anyscale/mistralai/Mistral-7B-Instruct-v0.1 | 16,384 | 16,384 | $0.00000015 | $0.00000015 |
| anyscale/Mixtral-8x7B-Instruct-v0.1 | 16,384 | 16,384 | $0.00000015 | $0.00000015 |
| anyscale/HuggingFaceH4/zephyr-7b-beta | 16,384 | 16,384 | $0.00000015 | $0.00000015 |
| anyscale/meta-llama/Llama-2-7b-chat-hf | 4,096 | 4,096 | $0.00000015 | $0.00000015 |
| anyscale/meta-llama/Llama-2-13b-chat-hf | 4,096 | 4,096 | $0.00000025 | $0.00000025 |
| anyscale/meta-llama/Llama-2-70b-chat-hf | 4,096 | 4,096 | $0.00000100 | $0.00000100 |
| anyscale/codellama/CodeLlama-34b-Instruct-hf | 4,096 | 4,096 | $0.00000100 | $0.00000100 |
| cloudflare/@cf/meta/llama-2-7b-chat-fp16 | 3,072 | 3,072 | $0.00000192 | $0.00000192 |
| cloudflare/@cf/meta/llama-2-7b-chat-int8 | 2,048 | 2,048 | $0.00000192 | $0.00000192 |
| cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 | 8,192 | 8,192 | $0.00000192 | $0.00000192 |
| cloudflare/@hf/thebloke/codellama-7b-instruct-awq | 4,096 | 4,096 | $0.00000192 | $0.00000192 |
| voyage/voyage-01 | 4,096 | 4,096 | $0.00000010 | $0.00000000 |
| voyage/voyage-lite-01 | 4,096 | 4,096 | $0.00000010 | $0.00000000 |
| voyage/voyage-large-2 | 16,000 | 16,000 | $0.00000012 | $0.00000000 |
| voyage/voyage-law-2 | 16,000 | 16,000 | $0.00000012 | $0.00000000 |
| voyage/voyage-code-2 | 16,000 | 16,000 | $0.00000012 | $0.00000000 |
| voyage/voyage-2 | 4,000 | 4,000 | $0.00000010 | $0.00000000 |
| voyage/voyage-lite-02-instruct | 4,000 | 4,000 | $0.00000010 | $0.00000000 |
| Model Name | Prompt Cost (USD) | Completion Cost (USD) | Max Prompt Tokens | Max Output Tokens |
|:--------------------------------------------------------------------------------------------|:--------------------|:------------------------|:--------------------|--------------------:|
| gpt-4 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| gpt-4o | $0.00000500 | $0.00001500 | 128,000 | 4096 |
| gpt-4o-2024-05-13 | $0.00000500 | $0.00001500 | 128,000 | 4096 |
| gpt-4-turbo-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-0314 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| gpt-4-0613 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| gpt-4-32k | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| gpt-4-32k-0314 | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| gpt-4-32k-0613 | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| gpt-4-turbo | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-turbo-2024-04-09 | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-1106-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-0125-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-vision-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-4-1106-vision-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| gpt-3.5-turbo | $0.00000150 | $0.00000200 | 16,385 | 4096 |
| gpt-3.5-turbo-0301 | $0.00000150 | $0.00000200 | 4,097 | 4096 |
| gpt-3.5-turbo-0613 | $0.00000150 | $0.00000200 | 4,097 | 4096 |
| gpt-3.5-turbo-1106 | $0.00000100 | $0.00000200 | 16,385 | 4096 |
| gpt-3.5-turbo-0125 | $0.00000050 | $0.00000150 | 16,385 | 4096 |
| gpt-3.5-turbo-16k | $0.00000300 | $0.00000400 | 16,385 | 4096 |
| gpt-3.5-turbo-16k-0613 | $0.00000300 | $0.00000400 | 16,385 | 4096 |
| ft:gpt-3.5-turbo | $0.00000300 | $0.00000600 | 4,097 | 4096 |
| text-embedding-3-large | $0.00000013 | $0.00000000 | 8,191 | nan |
| text-embedding-3-small | $0.00000002 | $0.00000000 | 8,191 | nan |
| text-embedding-ada-002 | $0.00000010 | $0.00000000 | 8,191 | nan |
| text-embedding-ada-002-v2 | $0.00000010 | $0.00000000 | 8,191 | nan |
| text-moderation-stable | $0.00000000 | $0.00000000 | 32,768 | 0 |
| text-moderation-007 | $0.00000000 | $0.00000000 | 32,768 | 0 |
| text-moderation-latest | $0.00000000 | $0.00000000 | 32,768 | 0 |
| 256-x-256/dall-e-2 | -- | -- | nan | nan |
| 512-x-512/dall-e-2 | -- | -- | nan | nan |
| 1024-x-1024/dall-e-2 | -- | -- | nan | nan |
| hd/1024-x-1792/dall-e-3 | -- | -- | nan | nan |
| hd/1792-x-1024/dall-e-3 | -- | -- | nan | nan |
| hd/1024-x-1024/dall-e-3 | -- | -- | nan | nan |
| standard/1024-x-1792/dall-e-3 | -- | -- | nan | nan |
| standard/1792-x-1024/dall-e-3 | -- | -- | nan | nan |
| standard/1024-x-1024/dall-e-3 | -- | -- | nan | nan |
| whisper-1 | -- | -- | nan | nan |
| azure/whisper-1 | -- | -- | nan | nan |
| azure/gpt-4-turbo-2024-04-09 | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-4-0125-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-4-1106-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-4-0613 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| azure/gpt-4-32k-0613 | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| azure/gpt-4-32k | $0.00006000 | $0.00012000 | 32,768 | 4096 |
| azure/gpt-4 | $0.00003000 | $0.00006000 | 8,192 | 4096 |
| azure/gpt-4-turbo | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-4-turbo-vision-preview | $0.00001000 | $0.00003000 | 128,000 | 4096 |
| azure/gpt-35-turbo-16k-0613 | $0.00000300 | $0.00000400 | 16,385 | 4096 |
| azure/gpt-35-turbo-1106 | $0.00000150 | $0.00000200 | 16,384 | 4096 |
| azure/gpt-35-turbo-0125 | $0.00000050 | $0.00000150 | 16,384 | 4096 |
| azure/gpt-35-turbo-16k | $0.00000300 | $0.00000400 | 16,385 | 4096 |
| azure/gpt-35-turbo | $0.00000150 | $0.00000200 | 4,097 | 4096 |
| azure/gpt-3.5-turbo-instruct-0914 | $0.00000150 | $0.00000200 | 4,097 | nan |
| azure/gpt-35-turbo-instruct | $0.00000150 | $0.00000200 | 4,097 | nan |
| azure/mistral-large-latest | $0.00000800 | $0.00002400 | 32,000 | nan |
| azure/mistral-large-2402 | $0.00000800 | $0.00002400 | 32,000 | nan |
| azure/command-r-plus | $0.00000300 | $0.00001500 | 128,000 | 4096 |
| azure/ada | $0.00000010 | $0.00000000 | 8,191 | nan |
| azure/text-embedding-ada-002 | $0.00000010 | $0.00000000 | 8,191 | nan |
| azure/text-embedding-3-large | $0.00000013 | $0.00000000 | 8,191 | nan |
| azure/text-embedding-3-small | $0.00000002 | $0.00000000 | 8,191 | nan |
| azure/standard/1024-x-1024/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/hd/1024-x-1024/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/standard/1024-x-1792/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/standard/1792-x-1024/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/hd/1024-x-1792/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/hd/1792-x-1024/dall-e-3 | -- | $0.00000000 | nan | nan |
| azure/standard/1024-x-1024/dall-e-2 | -- | $0.00000000 | nan | nan |
| babbage-002 | $0.00000040 | $0.00000040 | 16,384 | 4096 |
| davinci-002 | $0.00000200 | $0.00000200 | 16,384 | 4096 |
| gpt-3.5-turbo-instruct | $0.00000150 | $0.00000200 | 8,192 | 4096 |
| gpt-3.5-turbo-instruct-0914 | $0.00000150 | $0.00000200 | 8,192 | 4097 |
| claude-instant-1 | $0.00000163 | $0.00000551 | 100,000 | 8191 |
| mistral/mistral-tiny | $0.00000015 | $0.00000046 | 32,000 | 8191 |
| mistral/mistral-small | $0.00000200 | $0.00000600 | 32,000 | 8191 |
| mistral/mistral-small-latest | $0.00000200 | $0.00000600 | 32,000 | 8191 |
| mistral/mistral-medium | $0.00000270 | $0.00000810 | 32,000 | 8191 |
| mistral/mistral-medium-latest | $0.00000270 | $0.00000810 | 32,000 | 8191 |
| mistral/mistral-medium-2312 | $0.00000270 | $0.00000810 | 32,000 | 8191 |
| mistral/mistral-large-latest | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| mistral/mistral-large-2402 | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| mistral/open-mixtral-8x7b | $0.00000200 | $0.00000600 | 32,000 | 8191 |
| mistral/mistral-embed | $0.00000011 | -- | 8,192 | nan |
| deepseek-chat | $0.00000014 | $0.00000028 | 32,000 | 4096 |
| deepseek-coder | $0.00000014 | $0.00000028 | 16,000 | 4096 |
| groq/llama2-70b-4096 | $0.00000070 | $0.00000080 | 4,096 | 4096 |
| groq/llama3-8b-8192 | $0.00000010 | $0.00000010 | 8,192 | 8192 |
| groq/llama3-70b-8192 | $0.00000064 | $0.00000080 | 8,192 | 8192 |
| groq/mixtral-8x7b-32768 | $0.00000027 | $0.00000027 | 32,768 | 32768 |
| groq/gemma-7b-it | $0.00000010 | $0.00000010 | 8,192 | 8192 |
| claude-instant-1.2 | $0.00000016 | $0.00000055 | 100,000 | 8191 |
| claude-2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| claude-2.1 | $0.00000800 | $0.00002400 | 200,000 | 8191 |
| claude-3-haiku-20240307 | $0.00000025 | $0.00000125 | 200,000 | 4096 |
| claude-3-opus-20240229 | $0.00001500 | $0.00007500 | 200,000 | 4096 |
| claude-3-sonnet-20240229 | $0.00000300 | $0.00001500 | 200,000 | 4096 |
| text-bison | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| text-bison@001 | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| text-unicorn | $0.00001000 | $0.00002800 | 8,192 | 1024 |
| text-unicorn@001 | $0.00001000 | $0.00002800 | 8,192 | 1024 |
| chat-bison | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| chat-bison@001 | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| chat-bison@002 | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| chat-bison-32k | $0.00000012 | $0.00000012 | 32,000 | 8192 |
| code-bison | $0.00000012 | $0.00000012 | 6,144 | 1024 |
| code-bison@001 | $0.00000012 | $0.00000012 | 6,144 | 1024 |
| code-gecko@001 | $0.00000012 | $0.00000012 | 2,048 | 64 |
| code-gecko@002 | $0.00000012 | $0.00000012 | 2,048 | 64 |
| code-gecko | $0.00000012 | $0.00000012 | 2,048 | 64 |
| codechat-bison | $0.00000012 | $0.00000012 | 6,144 | 1024 |
| codechat-bison@001 | $0.00000012 | $0.00000012 | 6,144 | 1024 |
| codechat-bison-32k | $0.00000012 | $0.00000012 | 32,000 | 8192 |
| gemini-pro | $0.00000025 | $0.00000050 | 32,760 | 8192 |
| gemini-1.0-pro | $0.00000025 | $0.00000050 | 32,760 | 8192 |
| gemini-1.0-pro-001 | $0.00000025 | $0.00000050 | 32,760 | 8192 |
| gemini-1.0-pro-002 | $0.00000025 | $0.00000050 | 32,760 | 8192 |
| gemini-1.5-pro | $0.00000063 | $0.00000188 | 1,000,000 | 8192 |
| gemini-1.5-pro-preview-0215 | $0.00000063 | $0.00000188 | 1,000,000 | 8192 |
| gemini-1.5-pro-preview-0409 | $0.00000063 | $0.00000188 | 1,000,000 | 8192 |
| gemini-experimental | $0.00000000 | $0.00000000 | 1,000,000 | 8192 |
| gemini-pro-vision | $0.00000025 | $0.00000050 | 16,384 | 2048 |
| gemini-1.0-pro-vision | $0.00000025 | $0.00000050 | 16,384 | 2048 |
| gemini-1.0-pro-vision-001 | $0.00000025 | $0.00000050 | 16,384 | 2048 |
| vertex_ai/claude-3-sonnet@20240229 | $0.00000300 | $0.00001500 | 200,000 | 4096 |
| vertex_ai/claude-3-haiku@20240307 | $0.00000025 | $0.00000125 | 200,000 | 4096 |
| vertex_ai/claude-3-opus@20240229 | $0.00000150 | $0.00000750 | 200,000 | 4096 |
| textembedding-gecko | $0.00000001 | $0.00000000 | 3,072 | nan |
| textembedding-gecko-multilingual | $0.00000001 | $0.00000000 | 3,072 | nan |
| textembedding-gecko-multilingual@001 | $0.00000001 | $0.00000000 | 3,072 | nan |
| textembedding-gecko@001 | $0.00000001 | $0.00000000 | 3,072 | nan |
| textembedding-gecko@003 | $0.00000001 | $0.00000000 | 3,072 | nan |
| text-embedding-preview-0409 | $0.00000001 | $0.00000000 | 3,072 | nan |
| text-multilingual-embedding-preview-0409 | $0.00000001 | $0.00000000 | 3,072 | nan |
| palm/chat-bison | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| palm/chat-bison-001 | $0.00000012 | $0.00000012 | 8,192 | 4096 |
| palm/text-bison | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| palm/text-bison-001 | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| palm/text-bison-safety-off | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| palm/text-bison-safety-recitation-off | $0.00000012 | $0.00000012 | 8,192 | 1024 |
| gemini/gemini-pro | $0.00000000 | $0.00000000 | 32,760 | 8192 |
| gemini/gemini-1.5-pro | $0.00000000 | $0.00000000 | 1,000,000 | 8192 |
| gemini/gemini-1.5-pro-latest | $0.00000000 | $0.00000000 | 1,048,576 | 8192 |
| gemini/gemini-pro-vision | $0.00000000 | $0.00000000 | 30,720 | 2048 |
| command-r | $0.00000050 | $0.00000150 | 128,000 | 4096 |
| command-light | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| command-r-plus | $0.00000300 | $0.00001500 | 128,000 | 4096 |
| command-nightly | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| command | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| command-medium-beta | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| command-xlarge-beta | $0.00001500 | $0.00001500 | 4,096 | 4096 |
| replicate/llama-2-70b-chat:2c1608e18606fad2812020dc541930f2d0495ce32eee50074220b87300bc16e1 | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| replicate/meta/llama-2-13b | $0.00000010 | $0.00000050 | 4,096 | 4096 |
| replicate/meta/llama-2-13b-chat | $0.00000010 | $0.00000050 | 4,096 | 4096 |
| replicate/meta/llama-2-70b | $0.00000065 | $0.00000275 | 4,096 | 4096 |
| replicate/meta/llama-2-70b-chat | $0.00000065 | $0.00000275 | 4,096 | 4096 |
| replicate/meta/llama-2-7b | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/meta/llama-2-7b-chat | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/meta/llama-3-70b | $0.00000065 | $0.00000275 | 4,096 | 4096 |
| replicate/meta/llama-3-70b-instruct | $0.00000065 | $0.00000275 | 4,096 | 4096 |
| replicate/meta/llama-3-8b | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/meta/llama-3-8b-instruct | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/mistralai/mistral-7b-v0.1 | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/mistralai/mistral-7b-instruct-v0.2 | $0.00000005 | $0.00000025 | 4,096 | 4096 |
| replicate/mistralai/mixtral-8x7b-instruct-v0.1 | $0.00000030 | $0.00000100 | 4,096 | 4096 |
| openrouter/microsoft/wizardlm-2-8x22b:nitro | $0.00000100 | $0.00000100 | nan | nan |
| openrouter/google/gemini-pro-1.5 | $0.00000250 | $0.00000750 | 1,000,000 | 8192 |
| openrouter/mistralai/mixtral-8x22b-instruct | $0.00000065 | $0.00000065 | nan | nan |
| openrouter/cohere/command-r-plus | $0.00000300 | $0.00001500 | nan | nan |
| openrouter/databricks/dbrx-instruct | $0.00000060 | $0.00000060 | nan | nan |
| openrouter/anthropic/claude-3-haiku | $0.00000025 | $0.00000125 | nan | nan |
| openrouter/anthropic/claude-3-sonnet | $0.00000300 | $0.00001500 | nan | nan |
| openrouter/mistralai/mistral-large | $0.00000800 | $0.00002400 | nan | nan |
| openrouter/cognitivecomputations/dolphin-mixtral-8x7b | $0.00000050 | $0.00000050 | nan | nan |
| openrouter/google/gemini-pro-vision | $0.00000012 | $0.00000038 | nan | nan |
| openrouter/fireworks/firellava-13b | $0.00000020 | $0.00000020 | nan | nan |
| openrouter/meta-llama/llama-3-8b-instruct:free | $0.00000000 | $0.00000000 | nan | nan |
| openrouter/meta-llama/llama-3-8b-instruct:extended | $0.00000022 | $0.00000225 | nan | nan |
| openrouter/meta-llama/llama-3-70b-instruct:nitro | $0.00000090 | $0.00000090 | nan | nan |
| openrouter/meta-llama/llama-3-70b-instruct | $0.00000059 | $0.00000079 | nan | nan |
| openrouter/openai/gpt-4-vision-preview | $0.00001000 | $0.00003000 | nan | nan |
| openrouter/openai/gpt-3.5-turbo | $0.00000150 | $0.00000200 | nan | nan |
| openrouter/openai/gpt-3.5-turbo-16k | $0.00000300 | $0.00000400 | nan | nan |
| openrouter/openai/gpt-4 | $0.00003000 | $0.00006000 | nan | nan |
| openrouter/anthropic/claude-instant-v1 | $0.00000163 | $0.00000551 | nan | 8191 |
| openrouter/anthropic/claude-2 | $0.00001102 | $0.00003268 | nan | 8191 |
| openrouter/anthropic/claude-3-opus | $0.00001500 | $0.00007500 | 200,000 | 4096 |
| openrouter/google/palm-2-chat-bison | $0.00000050 | $0.00000050 | nan | nan |
| openrouter/google/palm-2-codechat-bison | $0.00000050 | $0.00000050 | nan | nan |
| openrouter/meta-llama/llama-2-13b-chat | $0.00000020 | $0.00000020 | nan | nan |
| openrouter/meta-llama/llama-2-70b-chat | $0.00000150 | $0.00000150 | nan | nan |
| openrouter/meta-llama/codellama-34b-instruct | $0.00000050 | $0.00000050 | nan | nan |
| openrouter/nousresearch/nous-hermes-llama2-13b | $0.00000020 | $0.00000020 | nan | nan |
| openrouter/mancer/weaver | $0.00000563 | $0.00000563 | nan | nan |
| openrouter/gryphe/mythomax-l2-13b | $0.00000188 | $0.00000188 | nan | nan |
| openrouter/jondurbin/airoboros-l2-70b-2.1 | $0.00001388 | $0.00001388 | nan | nan |
| openrouter/undi95/remm-slerp-l2-13b | $0.00000188 | $0.00000188 | nan | nan |
| openrouter/pygmalionai/mythalion-13b | $0.00000188 | $0.00000188 | nan | nan |
| openrouter/mistralai/mistral-7b-instruct | $0.00000013 | $0.00000013 | nan | nan |
| openrouter/mistralai/mistral-7b-instruct:free | $0.00000000 | $0.00000000 | nan | nan |
| j2-ultra | $0.00001500 | $0.00001500 | 8,192 | 8192 |
| j2-mid | $0.00001000 | $0.00001000 | 8,192 | 8192 |
| j2-light | $0.00000300 | $0.00000300 | 8,192 | 8192 |
| dolphin | $0.00000050 | $0.00000050 | 16,384 | 16384 |
| chatdolphin | $0.00000050 | $0.00000050 | 16,384 | 16384 |
| luminous-base | $0.00003000 | $0.00003300 | nan | nan |
| luminous-base-control | $0.00003750 | $0.00004125 | nan | nan |
| luminous-extended | $0.00004500 | $0.00004950 | nan | nan |
| luminous-extended-control | $0.00005625 | $0.00006187 | nan | nan |
| luminous-supreme | $0.00017500 | $0.00019250 | nan | nan |
| luminous-supreme-control | $0.00021875 | $0.00024063 | nan | nan |
| ai21.j2-mid-v1 | $0.00001250 | $0.00001250 | 8,191 | 8191 |
| ai21.j2-ultra-v1 | $0.00001880 | $0.00001880 | 8,191 | 8191 |
| amazon.titan-text-lite-v1 | $0.00000030 | $0.00000040 | 42,000 | 4000 |
| amazon.titan-text-express-v1 | $0.00000130 | $0.00000170 | 42,000 | 8000 |
| amazon.titan-embed-text-v1 | $0.00000010 | $0.00000000 | 8,192 | nan |
| amazon.titan-embed-text-v2:0 | $0.00000020 | $0.00000000 | 8,192 | nan |
| mistral.mistral-7b-instruct-v0:2 | $0.00000015 | $0.00000020 | 32,000 | 8191 |
| mistral.mixtral-8x7b-instruct-v0:1 | $0.00000045 | $0.00000070 | 32,000 | 8191 |
| mistral.mistral-large-2402-v1:0 | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 | $0.00000045 | $0.00000070 | 32,000 | 8191 |
| bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 | $0.00000045 | $0.00000070 | 32,000 | 8191 |
| bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 | $0.00000059 | $0.00000091 | 32,000 | 8191 |
| bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 | $0.00000015 | $0.00000020 | 32,000 | 8191 |
| bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 | $0.00000015 | $0.00000020 | 32,000 | 8191 |
| bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 | $0.00000020 | $0.00000026 | 32,000 | 8191 |
| bedrock/us-east-1/mistral.mistral-large-2402-v1:0 | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| bedrock/us-west-2/mistral.mistral-large-2402-v1:0 | $0.00000800 | $0.00002400 | 32,000 | 8191 |
| bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 | $0.00001040 | $0.00003120 | 32,000 | 8191 |
| anthropic.claude-3-sonnet-20240229-v1:0 | $0.00000300 | $0.00001500 | 200,000 | 4096 |
| anthropic.claude-3-haiku-20240307-v1:0 | $0.00000025 | $0.00000125 | 200,000 | 4096 |
| anthropic.claude-3-opus-20240229-v1:0 | $0.00001500 | $0.00007500 | 200,000 | 4096 |
| anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-east-1/anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-west-2/anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/anthropic.claude-v1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v1 | -- | -- | 100,000 | 8191 |
| anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-east-1/anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-west-2/anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/anthropic.claude-v2 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2 | -- | -- | 100,000 | 8191 |
| anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-east-1/anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/us-west-2/anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/anthropic.claude-v2:1 | $0.00000800 | $0.00002400 | 100,000 | 8191 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1 | -- | -- | 100,000 | 8191 |
| anthropic.claude-instant-v1 | $0.00000163 | $0.00000551 | 100,000 | 8191 |
| bedrock/us-east-1/anthropic.claude-instant-v1 | $0.00000080 | $0.00000240 | 100,000 | 8191 |
| bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/us-west-2/anthropic.claude-instant-v1 | $0.00000080 | $0.00000240 | 100,000 | 8191 |
| bedrock/ap-northeast-1/anthropic.claude-instant-v1 | $0.00000223 | $0.00000755 | 100,000 | 8191 |
| bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/anthropic.claude-instant-v1 | $0.00000248 | $0.00000838 | 100,000 | 8191 |
| bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1 | -- | -- | 100,000 | 8191 |
| cohere.command-text-v14 | $0.00000150 | $0.00000200 | 4,096 | 4096 |
| bedrock/*/1-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 |
| bedrock/*/6-month-commitment/cohere.command-text-v14 | -- | -- | 4,096 | 4096 |
| cohere.command-light-text-v14 | $0.00000030 | $0.00000060 | 4,096 | 4096 |
| bedrock/*/1-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 |
| bedrock/*/6-month-commitment/cohere.command-light-text-v14 | -- | -- | 4,096 | 4096 |
| cohere.command-r-plus-v1:0 | $0.00000300 | $0.00001500 | 128,000 | 4096 |
| cohere.command-r-v1:0 | $0.00000050 | $0.00000150 | 128,000 | 4096 |
| cohere.embed-english-v3 | $0.00000010 | $0.00000000 | 512 | nan |
| cohere.embed-multilingual-v3 | $0.00000010 | $0.00000000 | 512 | nan |
| meta.llama2-13b-chat-v1 | $0.00000075 | $0.00000100 | 4,096 | 4096 |
| meta.llama2-70b-chat-v1 | $0.00000195 | $0.00000256 | 4,096 | 4096 |
| meta.llama3-8b-instruct-v1:0 | $0.00000040 | $0.00000060 | 8,192 | 8192 |
| meta.llama3-70b-instruct-v1:0 | $0.00000265 | $0.00000350 | 8,192 | 8192 |
| 512-x-512/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan |
| 512-x-512/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan |
| max-x-max/50-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan |
| max-x-max/max-steps/stability.stable-diffusion-xl-v0 | -- | -- | 77 | nan |
| 1024-x-1024/50-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan |
| 1024-x-1024/max-steps/stability.stable-diffusion-xl-v1 | -- | -- | 77 | nan |
| sagemaker/meta-textgeneration-llama-2-7b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-7b-f | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-13b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-13b-f | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-70b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| sagemaker/meta-textgeneration-llama-2-70b-b-f | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| together-ai-up-to-3b | $0.00000010 | $0.00000010 | nan | nan |
| together-ai-3.1b-7b | $0.00000020 | $0.00000020 | nan | nan |
| together-ai-7.1b-20b | $0.00000040 | $0.00000040 | nan | nan |
| together-ai-20.1b-40b | $0.00000080 | $0.00000080 | nan | nan |
| together-ai-40.1b-70b | $0.00000090 | $0.00000090 | nan | nan |
| together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.00000060 | $0.00000060 | nan | nan |
| together_ai/mistralai/Mistral-7B-Instruct-v0.1 | -- | -- | nan | nan |
| together_ai/togethercomputer/CodeLlama-34b-Instruct | -- | -- | nan | nan |
| ollama/llama2 | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/llama2:13b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/llama2:70b | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/llama2-uncensored | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/mistral | $0.00000000 | $0.00000000 | 8,192 | 8192 |
| ollama/codellama | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/orca-mini | $0.00000000 | $0.00000000 | 4,096 | 4096 |
| ollama/vicuna | $0.00000000 | $0.00000000 | 2,048 | 2048 |
| deepinfra/lizpreciatior/lzlv_70b_fp16_hf | $0.00000070 | $0.00000090 | 4,096 | 4096 |
| deepinfra/Gryphe/MythoMax-L2-13b | $0.00000022 | $0.00000022 | 4,096 | 4096 |
| deepinfra/mistralai/Mistral-7B-Instruct-v0.1 | $0.00000013 | $0.00000013 | 32,768 | 8191 |
| deepinfra/meta-llama/Llama-2-70b-chat-hf | $0.00000070 | $0.00000090 | 4,096 | 4096 |
| deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b | $0.00000027 | $0.00000027 | 32,768 | 8191 |
| deepinfra/codellama/CodeLlama-34b-Instruct-hf | $0.00000060 | $0.00000060 | 4,096 | 4096 |
| deepinfra/deepinfra/mixtral | $0.00000027 | $0.00000027 | 32,000 | 4096 |
| deepinfra/Phind/Phind-CodeLlama-34B-v2 | $0.00000060 | $0.00000060 | 16,384 | 4096 |
| deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.00000027 | $0.00000027 | 32,768 | 8191 |
| deepinfra/deepinfra/airoboros-70b | $0.00000070 | $0.00000090 | 4,096 | 4096 |
| deepinfra/01-ai/Yi-34B-Chat | $0.00000060 | $0.00000060 | 4,096 | 4096 |
| deepinfra/01-ai/Yi-6B-200K | $0.00000013 | $0.00000013 | 200,000 | 4096 |
| deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1 | $0.00000070 | $0.00000090 | 4,096 | 4096 |
| deepinfra/meta-llama/Llama-2-13b-chat-hf | $0.00000022 | $0.00000022 | 4,096 | 4096 |
| deepinfra/amazon/MistralLite | $0.00000020 | $0.00000020 | 32,768 | 8191 |
| deepinfra/meta-llama/Llama-2-7b-chat-hf | $0.00000013 | $0.00000013 | 4,096 | 4096 |
| deepinfra/01-ai/Yi-34B-200K | $0.00000060 | $0.00000060 | 200,000 | 4096 |
| deepinfra/openchat/openchat_3.5 | $0.00000013 | $0.00000013 | 4,096 | 4096 |
| perplexity/codellama-34b-instruct | $0.00000035 | $0.00000140 | 16,384 | 16384 |
| perplexity/codellama-70b-instruct | $0.00000070 | $0.00000280 | 16,384 | 16384 |
| perplexity/pplx-7b-chat | $0.00000007 | $0.00000028 | 8,192 | 8192 |
| perplexity/pplx-70b-chat | $0.00000070 | $0.00000280 | 4,096 | 4096 |
| perplexity/pplx-7b-online | $0.00000000 | $0.00000028 | 4,096 | 4096 |
| perplexity/pplx-70b-online | $0.00000000 | $0.00000280 | 4,096 | 4096 |
| perplexity/llama-2-70b-chat | $0.00000070 | $0.00000280 | 4,096 | 4096 |
| perplexity/mistral-7b-instruct | $0.00000007 | $0.00000028 | 4,096 | 4096 |
| perplexity/mixtral-8x7b-instruct | $0.00000007 | $0.00000028 | 4,096 | 4096 |
| perplexity/sonar-small-chat | $0.00000007 | $0.00000028 | 16,384 | 16384 |
| perplexity/sonar-small-online | $0.00000000 | $0.00000028 | 12,000 | 12000 |
| perplexity/sonar-medium-chat | $0.00000060 | $0.00000180 | 16,384 | 16384 |
| perplexity/sonar-medium-online | $0.00000000 | $0.00000180 | 12,000 | 12000 |
| anyscale/mistralai/Mistral-7B-Instruct-v0.1 | $0.00000015 | $0.00000015 | 16,384 | 16384 |
| anyscale/Mixtral-8x7B-Instruct-v0.1 | $0.00000015 | $0.00000015 | 16,384 | 16384 |
| anyscale/HuggingFaceH4/zephyr-7b-beta | $0.00000015 | $0.00000015 | 16,384 | 16384 |
| anyscale/meta-llama/Llama-2-7b-chat-hf | $0.00000015 | $0.00000015 | 4,096 | 4096 |
| anyscale/meta-llama/Llama-2-13b-chat-hf | $0.00000025 | $0.00000025 | 4,096 | 4096 |
| anyscale/meta-llama/Llama-2-70b-chat-hf | $0.00000100 | $0.00000100 | 4,096 | 4096 |
| anyscale/codellama/CodeLlama-34b-Instruct-hf | $0.00000100 | $0.00000100 | 4,096 | 4096 |
| cloudflare/@cf/meta/llama-2-7b-chat-fp16 | $0.00000192 | $0.00000192 | 3,072 | 3072 |
| cloudflare/@cf/meta/llama-2-7b-chat-int8 | $0.00000192 | $0.00000192 | 2,048 | 2048 |
| cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 | $0.00000192 | $0.00000192 | 8,192 | 8192 |
| cloudflare/@hf/thebloke/codellama-7b-instruct-awq | $0.00000192 | $0.00000192 | 4,096 | 4096 |
| voyage/voyage-01 | $0.00000010 | $0.00000000 | 4,096 | nan |
| voyage/voyage-lite-01 | $0.00000010 | $0.00000000 | 4,096 | nan |
| voyage/voyage-large-2 | $0.00000012 | $0.00000000 | 16,000 | nan |
| voyage/voyage-law-2 | $0.00000012 | $0.00000000 | 16,000 | nan |
| voyage/voyage-code-2 | $0.00000012 | $0.00000000 | 16,000 | nan |
| voyage/voyage-2 | $0.00000010 | $0.00000000 | 4,000 | nan |
| voyage/voyage-lite-02-instruct | $0.00000010 | $0.00000000 | 4,000 | nan |

View File

@@ -1,27 +0,0 @@
import pandas as pd
import tokencost
# Build the pricing frame: DataFrame(...) puts each TOKEN_COSTS key in a
# column, so transposing yields one row per key.
df = pd.DataFrame(tokencost.TOKEN_COSTS).T
# Render both token-limit columns as whole numbers with thousands separators
for limit_column in ('max_input_tokens', 'max_tokens'):
    df[limit_column] = df[limit_column].apply(lambda x: '{:,.0f}'.format(x))
# Display helper for the per-token cost columns
def format_cost(x):
    """Return *x* as a dollar amount with 8 decimal places, or '--' if it is missing."""
    if not pd.isna(x):
        # Coerce to float first so every value goes through the same format spec
        return f'${float(x):.8f}'
    return '--'
# Format both per-token cost columns for display.
# Series.map is applied column by column instead of DataFrame.applymap:
# applymap is deprecated as of pandas 2.1, while this form runs the same
# element-wise formatting without relying on it.
cost_columns = ['input_cost_per_token', 'output_cost_per_token']
df[cost_columns] = df[cost_columns].apply(lambda col: col.map(format_cost))
# Write the selected columns as a markdown table (the index is kept as the
# first column because to_markdown() is called with its defaults).
with open('pricing_table.md', 'w') as f:
    f.write(df[['max_tokens', 'max_input_tokens', 'input_cost_per_token', 'output_cost_per_token']].to_markdown())

File diff suppressed because it is too large Load Diff

73
update_prices.py Normal file
View File

@@ -0,0 +1,73 @@
import pandas as pd
import tokencost
import json
# Update model_prices.json with the latest costs from the LiteLLM cost tracker
def diff_dicts(dict1, dict2):
    """Print the top-level differences between two dicts and report whether any exist.

    A key is reported when it is present in only one of the dicts (the
    missing side is shown as None) or when both dicts contain it with
    unequal values.

    Returns:
        True if at least one difference was found, otherwise False.
    """
    changes = {}
    # Keys that appear in exactly one of the two dicts
    for name in dict1.keys() ^ dict2.keys():
        changes[name] = (dict1.get(name), dict2.get(name))
    # Keys shared by both dicts whose values disagree
    for name in dict1:
        if name in dict2 and dict1[name] != dict2[name]:
            changes[name] = (dict1[name], dict2[name])

    if not changes:
        print("No differences found.")
        return False

    print("Differences found:")
    for name, (left, right) in changes.items():
        print(f"{name}: {left} != {right}")
    return True
# Read the price table currently stored in the static JSON file
with open('tokencost/model_prices.json', 'r') as prices_in:
    model_prices = json.load(prices_in)
# Compare it with tokencost.TOKEN_COSTS and rewrite the file only on a mismatch
prices_changed = diff_dicts(model_prices, tokencost.TOKEN_COSTS)
if prices_changed:
    print('Updating model_prices.json')
    with open('tokencost/model_prices.json', 'w') as prices_out:
        json.dump(tokencost.TOKEN_COSTS, prices_out, indent=4)
# Load the data: DataFrame(...) puts each TOKEN_COSTS key in a column, so
# transposing yields one row per key.
df = pd.DataFrame(tokencost.TOKEN_COSTS).T


def format_token_count(x):
    """Return a token limit with thousands separators, or '--' when it is missing."""
    if pd.isna(x):
        # Same placeholder the cost columns use, instead of a literal 'nan'
        return '--'
    return '{:,.0f}'.format(x)


# Format every token-limit column. 'max_output_tokens' is included because it
# is the column published as "Max Output Tokens"; previously only 'max_tokens'
# (which is not written to the table) was formatted, so the published column
# showed raw values such as 4096 next to 32,768.
for token_column in ('max_input_tokens', 'max_tokens', 'max_output_tokens'):
    df[token_column] = df[token_column].apply(format_token_count)
# Turn a per-token cost into the string shown in the pricing table
def format_cost(x):
    """Format *x* as '$' followed by the value to 8 decimal places; missing values give '--'."""
    missing = pd.isna(x)
    # float() first, so the fixed-point format spec is always applied to a float
    return '--' if missing else '${:.8f}'.format(float(x))
# Convert both per-token cost columns to display strings, one column at a time
cost_columns = ['input_cost_per_token', 'output_cost_per_token']
df[cost_columns] = df[cost_columns].apply(lambda costs: costs.map(format_cost))
# Raw field name -> heading used in the published table
column_mapping = {
    'input_cost_per_token': 'Prompt Cost (USD)',
    'output_cost_per_token': 'Completion Cost (USD)',
    'max_input_tokens': 'Max Prompt Tokens',
    'max_output_tokens': 'Max Output Tokens',
    'model_name': 'Model Name'
}
# The index is assumed to hold the model names (the keys of the price data);
# copy it into a regular column so it can be placed first in the table.
df['Model Name'] = df.index
# Swap the raw field names for the display headings, in place
df.rename(columns=column_mapping, inplace=True)
# Columns of the published table, in display order
table_columns = [
    'Model Name',
    'Prompt Cost (USD)',
    'Completion Cost (USD)',
    'Max Prompt Tokens',
    'Max Output Tokens',
]
# index=False: the model name is already an explicit column
with open('pricing_table.md', 'w') as f:
    f.write(df[table_columns].to_markdown(index=False))