FactQuire
Source-verified facts about commercial LLM APIs: pricing, limits, lifecycle, and primary-source quotes.
| Provider | Model ID | Status | Input $/1M | Output $/1M | Context | Max Output |
|---|---|---|---|---|---|---|
| alibaba | qwen3-max | ga | 1.2 | 6.0 | 256000 | - |
| alibaba | qwen3-max-2026-01-23 | ga | 1.2 | 6.0 | 256000 | - |
| alibaba | qwen3.6-flash | ga | 0.25 | 1.5 | 1000000 | 64000 |
| alibaba | qwen3.6-flash-2026-04-16 | ga | 0.25 | 1.5 | 1000000 | 64000 |
| alibaba | qwen3.6-max-preview | ga | 1.3 | 7.8 | 256000 | - |
| alibaba | qwen3.6-plus | ga | 0.5 | 3.0 | 1000000 | 64000 |
| alibaba | qwen3.6-plus-2026-04-02 | ga | 0.5 | 3.0 | 1000000 | 64000 |
| alibaba | qwen3.7-max | ga | 2.5 | 7.5 | 1000000 | - |
| alibaba | qwen3.7-max-2026-05-17 | ga | 2.5 | 7.5 | 1000000 | - |
| alibaba | qwen3.7-max-2026-05-20 | ga | 2.5 | 7.5 | 1000000 | - |
| alibaba | qwen3.7-max-preview | ga | 2.5 | 7.5 | 1000000 | - |
| alibaba | qwen3.7-plus | ga | 0.4 | 1.6 | 1000000 | 64000 |
| alibaba | qwen3.7-plus-2026-05-26 | ga | 0.4 | 1.6 | 1000000 | 64000 |
| amazon | amazon.nova-lite-v1:0 | ga | 0.06 | 0.24 | 300000 | 10000 |
| amazon | amazon.nova-micro-v1:0 | ga | 0.035 | 0.14 | 128000 | 10000 |
| amazon | amazon.nova-premier-v1:0 | ga | 2.5 | 12.5 | 1000000 | 10000 |
| amazon | amazon.nova-pro-v1:0 | ga | 0.8 | 3.2 | 300000 | 10000 |
| amazon | anthropic.claude-3-5-sonnet-20241022-v2:0 | deprecated | 6.0 | 30.0 | 200000 | - |
| anthropic | claude-fable-5 | ga | 10 | 50 | 1000000 | 128000 |
| anthropic | claude-haiku-4-5-20251001 | ga | 1 | 5 | 200000 | 64000 |
| anthropic | claude-opus-4-6 | ga | 5 | 25 | 1000000 | - |
| anthropic | claude-opus-4-7 | ga | 5 | 25 | 1000000 | - |
| anthropic | claude-opus-4-8 | ga | 5 | 25 | 1000000 | 128000 |
| anthropic | claude-sonnet-5 | ga | 2 | 10 | 1000000 | 128000 |
| cohere | c4ai-aya-expanse-32b | ga | 0.5 | 1.5 | 128000 | 4000 |
| cohere | command | deprecated | 1.0 | 2.0 | 4000 | 4000 |
| cohere | command-a-03-2025 | ga | - | - | 256000 | 8000 |
| cohere | command-a-plus-05-2026 | ga | - | - | 128000 | 64000 |
| cohere | command-a-reasoning-08-2025 | ga | - | - | 256000 | 32000 |
| cohere | command-a-translate-08-2025 | ga | - | - | 8000 | 8000 |
| cohere | command-a-vision-07-2025 | ga | - | - | 128000 | 8000 |
| cohere | command-light | deprecated | 0.3 | 0.6 | 4000 | 4000 |
| cohere | command-r-03-2024 | deprecated | 0.5 | 1.5 | 128000 | 4000 |
| cohere | command-r-08-2024 | ga | - | - | 128000 | 4000 |
| cohere | command-r-plus-04-2024 | deprecated | 3.0 | 15.0 | 128000 | 4000 |
| cohere | command-r-plus-08-2024 | ga | 2.5 | 10.0 | 128000 | 4000 |
| cohere | command-r7b-12-2024 | ga | 0.0375 | 0.15 | 128000 | 4000 |
| cohere | tiny-aya-global | ga | - | - | 8000 | 8000 |
| deepseek | deepseek-v4-flash | ga | 0.14 | 0.28 | 1000000 | 384000 |
| deepseek | deepseek-v4-pro | ga | 0.435 | 0.87 | 1000000 | 384000 |
| fireworks | deepseek-v4-flash | ga | 0.14 | 0.28 | - | - |
| fireworks | deepseek-v4-pro | ga | 1.74 | 3.48 | - | - |
| fireworks | glm-5.1 | ga | 1.4 | 4.4 | - | - |
| fireworks | glm-5.1-fast | ga | 2.8 | 8.8 | - | - |
| fireworks | glm-5.2 | ga | 1.4 | 4.4 | - | - |
| fireworks | glm-5.2-fast | ga | 2.1 | 6.6 | - | - |
| fireworks | kimi-k2.6 | ga | 0.95 | 4.0 | - | - |
| fireworks | kimi-k2.6-fast | ga | 2.0 | 8.0 | - | - |
| fireworks | kimi-k2.7-code | ga | 0.95 | 4.0 | - | - |
| fireworks | kimi-k2.7-code-fast | ga | 1.9 | 8.0 | - | - |
| fireworks | llama-v3p3-70b-instruct | ga | 0.9 | 0.9 | 131072 | - |
| fireworks | minimax-m2.7 | ga | 0.3 | 1.2 | - | - |
| fireworks | minimax-m3 | ga | 0.3 | 1.2 | - | - |
| fireworks | openai-gpt-oss-120b | ga | 0.15 | 0.6 | - | - |
| fireworks | openai-gpt-oss-20b | ga | 0.07 | 0.3 | - | - |
| fireworks | qwen-3.7-plus | ga | 0.4 | 1.6 | - | - |
| fireworks | qwen2p5-vl-32b-instruct | ga | 0.9 | 0.9 | 128000 | - |
| google | gemini-2.5-flash | ga | 0.3 | 2.5 | 1048576 | - |
| google | gemini-2.5-flash-lite | ga | 0.1 | 0.4 | - | - |
| google | gemini-2.5-flash-lite-preview-09-2025 | preview | 0.1 | 0.4 | - | - |
| google | gemini-2.5-flash-native-audio-preview-12-2025 | preview | 0.5 | 2.0 | - | - |
| google | gemini-2.5-flash-preview-tts | preview | 0.5 | 10.0 | - | - |
| google | gemini-2.5-pro | ga | 1.25 | 10.0 | - | - |
| google | gemini-3-flash-preview | preview | 0.5 | 3.0 | - | - |
| google | gemini-3.1-flash-lite | ga | 0.25 | 1.5 | - | - |
| google | gemini-3.1-flash-live-preview | preview | 0.75 | 4.5 | - | - |
| google | gemini-3.1-pro-preview | preview | 2.0 | 12.0 | - | - |
| groq | llama-3.1-8b-instant | ga | 0.05 | 0.08 | 131072 | 131072 |
| groq | llama-3.3-70b-versatile | ga | 0.59 | 0.79 | 131072 | 32768 |
| groq | openai/gpt-oss-120b | ga | 0.15 | 0.6 | 131072 | 65536 |
| groq | openai/gpt-oss-20b | ga | 0.075 | 0.3 | 131072 | 65536 |
| minimax | minimax-m2 | ga | 0.3 | 1.2 | - | - |
| minimax | minimax-m2.1 | ga | 0.3 | 1.2 | - | - |
| minimax | minimax-m2.5 | ga | 0.3 | 1.2 | - | - |
| minimax | minimax-m2.7 | ga | 0.3 | 1.2 | - | - |
| minimax | minimax-m3 | ga | 0.3 | 1.2 | - | - |
| mistral | codestral-latest | ga | 0.3 | 0.9 | - | - |
| mistral | devstral-medium-latest | ga | 0.4 | 2.0 | - | - |
| mistral | devstral-small-latest | ga | 0.1 | 0.3 | - | - |
| mistral | magistral-medium-latest | ga | 2.0 | 5.0 | - | - |
| mistral | mistral-large-latest | ga | 0.5 | 1.5 | - | - |
| mistral | mistral-medium-latest | ga | 1.5 | 7.5 | - | - |
| mistral | mistral-small-latest | ga | 0.15 | 0.6 | - | - |
| mistral | voxtral-small-latest | ga | 0.1 | 0.4 | - | - |
| moonshot | kimi-k2.5 | ga | 0.6 | 3.0 | 256000 | - |
| moonshot | kimi-k2.6 | ga | 0.95 | 4.0 | 256000 | - |
| moonshot | kimi-k2.7-code | ga | 0.95 | 4.0 | 256000 | - |
| openai | gpt-5.4 | ga | 2.5 | 15.0 | 1050000 | 128000 |
| openai | gpt-5.5 | ga | 5.0 | 30.0 | 1050000 | 128000 |
| openai | gpt-5.5-pro | ga | 30.0 | 180.0 | 1050000 | 128000 |
| perplexity | perplexity/sonar | ga | 0.25 | 2.5 | - | - |
| perplexity | sonar-pro | ga | 3.0 | 15.0 | 200000 | - |
| perplexity | sonar-reasoning-pro | ga | 2.0 | 8.0 | 128000 | - |
| together | Qwen/Qwen2.5-7B-Instruct-Turbo | ga | 0.3 | 0.3 | 32768 | - |
| together | cogito-v2.1-671b | ga | 1.25 | 1.25 | - | - |
| together | deepseek-v4-pro | ga | 1.74 | 3.48 | - | - |
| together | gemma-3n-e4b-instruct | ga | 0.06 | 0.12 | - | - |
| together | gemma-4-31b | ga | 0.39 | 0.97 | - | - |
| together | gemma-4-31b-it-pearl | ga | 0.28 | 0.86 | - | - |
| together | glm-5.1 | ga | 1.4 | 4.4 | - | - |
| together | glm-5.2 | ga | 1.4 | 4.4 | - | - |
| together | gpt-oss-120b | ga | 0.15 | 0.6 | - | - |
| together | gpt-oss-20b | ga | 0.05 | 0.2 | - | - |
| together | kimi-k2.6 | ga | 1.2 | 4.5 | - | - |
| together | kimi-k2.7-code | ga | 0.95 | 4.0 | - | - |
| together | lfm2-24b-a2b | ga | 0.03 | 0.12 | - | - |
| together | llama-3.3-70b | ga | 1.04 | 1.04 | - | - |
| together | minimax-m2.5 | ga | 0.3 | 1.2 | - | - |
| together | minimax-m2.7 | ga | 0.3 | 1.2 | - | - |
| together | minimax-m3 | ga | 0.3 | 1.2 | - | - |
| together | nvidia-nemotron-3-ultra | ga | 0.6 | 3.6 | - | - |
| together | qwen3-235b-a22b-fp8-throughput | ga | 0.2 | 0.6 | - | - |
| together | qwen3.5-397b-a17b | ga | 0.6 | 3.6 | - | - |
| together | qwen3.5-9b | ga | 0.17 | 0.25 | - | - |
| together | qwen3.6-plus | ga | 0.5 | 3.0 | - | - |
| together | qwen3.7-max | ga | 1.25 | 3.75 | - | - |
| together | qwen3.7-plus | ga | 0.32 | 1.28 | - | - |
| together | rnj-1-instruct | ga | 0.15 | 0.15 | - | - |
| xai | grok-4.20-0309-non-reasoning | ga | 1.25 | 2.5 | 1000000 | - |
| xai | grok-4.20-0309-reasoning | ga | 1.25 | 2.5 | 1000000 | - |
| xai | grok-4.20-multi-agent-0309 | ga | 1.25 | 2.5 | 1000000 | - |
| xai | grok-4.3 | ga | 1.25 | 2.5 | 1000000 | - |
| xai | grok-build-0.1 | ga | 1.0 | 2.0 | 256000 | - |
| zhipu | glm-4-32b-0414-128k | ga | 0.1 | 0.1 | - | - |
| zhipu | glm-4.5 | ga | 0.6 | 2.2 | - | - |
| zhipu | glm-4.5-air | ga | 0.2 | 1.1 | - | - |
| zhipu | glm-4.5-airx | ga | 1.1 | 4.5 | - | - |
| zhipu | glm-4.5-x | ga | 2.2 | 8.9 | - | - |
| zhipu | glm-4.6 | ga | 0.6 | 2.2 | - | - |
| zhipu | glm-4.7 | ga | 0.6 | 2.2 | - | - |
| zhipu | glm-4.7-flashx | ga | 0.07 | 0.4 | - | - |
| zhipu | glm-5 | ga | 1.0 | 3.2 | - | - |
| zhipu | glm-5-turbo | ga | 1.2 | 4.0 | - | - |
| zhipu | glm-5.1 | ga | 1.4 | 4.4 | - | - |
| zhipu | glm-5.2 | ga | 1.4 | 4.4 | - | - |