ai-models.json
|
{ "backends": [ { "id": "gemini", "label": "Google Gemini" }, { "id": "claude", "label": "Anthropic Claude" }, { "id": "groq", "label": "Groq" }, { "id": "openai", "label": "OpenAI" }, { "id": "ollama", "label": "Ollama (Local)", "local": true } ], "models": [ { "id": "gemini-2.5-flash", "apiModelId": "gemini-2.5-flash", "label": "Gemini 2.5 Flash", "backend": "gemini" }, { "id": "gemini-2.5-pro", "apiModelId": "gemini-2.5-pro", "label": "Gemini 2.5 Pro", "backend": "gemini" }, { "id": "gemini-2.0-flash", "apiModelId": "gemini-2.0-flash", "label": "Gemini 2.0 Flash", "backend": "gemini" }, { "id": "gemini-2.0-flash-001", "apiModelId": "gemini-2.0-flash-001", "label": "Gemini 2.0 Flash 001", "backend": "gemini" }, { "id": "gemini-2.0-flash-lite-001", "apiModelId": "gemini-2.0-flash-lite-001", "label": "Gemini 2.0 Flash-Lite 001", "backend": "gemini" }, { "id": "gemini-2.0-flash-lite", "apiModelId": "gemini-2.0-flash-lite", "label": "Gemini 2.0 Flash-Lite", "backend": "gemini" }, { "id": "gemini-2.5-flash-preview-tts", "apiModelId": "gemini-2.5-flash-preview-tts", "label": "Gemini 2.5 Flash Preview TTS", "backend": "gemini" }, { "id": "gemini-2.5-pro-preview-tts", "apiModelId": "gemini-2.5-pro-preview-tts", "label": "Gemini 2.5 Pro Preview TTS", "backend": "gemini" }, { "id": "gemma-4-26b-a4b-it", "apiModelId": "gemma-4-26b-a4b-it", "label": "Gemma 4 26B A4B IT", "backend": "gemini" }, { "id": "gemma-4-31b-it", "apiModelId": "gemma-4-31b-it", "label": "Gemma 4 31B IT", "backend": "gemini" }, { "id": "gemini-flash-latest", "apiModelId": "gemini-flash-latest", "label": "Gemini Flash Latest", "backend": "gemini" }, { "id": "gemini-flash-lite-latest", "apiModelId": "gemini-flash-lite-latest", "label": "Gemini Flash-Lite Latest", "backend": "gemini" }, { "id": "gemini-pro-latest", "apiModelId": "gemini-pro-latest", "label": "Gemini Pro Latest", "backend": "gemini" }, { "id": "gemini-2.5-flash-lite", "apiModelId": "gemini-2.5-flash-lite", "label": "Gemini 2.5 Flash-Lite", "backend": "gemini" }, { "id": "gemini-2.5-flash-image", "apiModelId": "gemini-2.5-flash-image", "label": "Nano Banana", "backend": "gemini" }, { "id": "gemini-3-pro-preview", "apiModelId": "gemini-3-pro-preview", "label": "Gemini 3 Pro Preview", "backend": "gemini" }, { "id": "gemini-3-flash-preview", "apiModelId": "gemini-3-flash-preview", "label": "Gemini 3 Flash Preview", "backend": "gemini" }, { "id": "gemini-3.1-pro-preview", "apiModelId": "gemini-3.1-pro-preview", "label": "Gemini 3.1 Pro Preview", "backend": "gemini" }, { "id": "gemini-3.1-pro-preview-customtools", "apiModelId": "gemini-3.1-pro-preview-customtools", "label": "Gemini 3.1 Pro Preview Custom Tools", "backend": "gemini" }, { "id": "gemini-3.1-flash-lite-preview", "apiModelId": "gemini-3.1-flash-lite-preview", "label": "Gemini 3.1 Flash Lite Preview", "backend": "gemini" }, { "id": "gemini-3.1-flash-lite", "apiModelId": "gemini-3.1-flash-lite", "label": "Gemini 3.1 Flash Lite", "backend": "gemini" }, { "id": "gemini-3-pro-image-preview", "apiModelId": "gemini-3-pro-image-preview", "label": "Nano Banana Pro", "backend": "gemini" }, { "id": "gemini-3-pro-image", "apiModelId": "gemini-3-pro-image", "label": "Nano Banana Pro", "backend": "gemini" }, { "id": "nano-banana-pro-preview", "apiModelId": "nano-banana-pro-preview", "label": "Nano Banana Pro", "backend": "gemini" }, { "id": "gemini-3.1-flash-image-preview", "apiModelId": "gemini-3.1-flash-image-preview", "label": "Nano Banana 2", "backend": "gemini" }, { "id": "gemini-3.1-flash-image", "apiModelId": "gemini-3.1-flash-image", "label": "Nano Banana 2", "backend": "gemini" }, { "id": "gemini-3.5-flash", "apiModelId": "gemini-3.5-flash", "label": "Gemini 3.5 Flash", "backend": "gemini" }, { "id": "lyria-3-clip-preview", "apiModelId": "lyria-3-clip-preview", "label": "Lyria 3 Clip Preview", "backend": "gemini" }, { "id": "lyria-3-pro-preview", "apiModelId": "lyria-3-pro-preview", "label": "Lyria 3 Pro Preview", "backend": "gemini" }, { "id": "gemini-3.1-flash-tts-preview", "apiModelId": "gemini-3.1-flash-tts-preview", "label": "Gemini 3.1 Flash TTS Preview", "backend": "gemini" }, { "id": "gemini-robotics-er-1.5-preview", "apiModelId": "gemini-robotics-er-1.5-preview", "label": "Gemini Robotics-ER 1.5 Preview", "backend": "gemini" }, { "id": "gemini-robotics-er-1.6-preview", "apiModelId": "gemini-robotics-er-1.6-preview", "label": "Gemini Robotics-ER 1.6 Preview", "backend": "gemini" }, { "id": "gemini-2.5-computer-use-preview-10-2025", "apiModelId": "gemini-2.5-computer-use-preview-10-2025", "label": "Gemini 2.5 Computer Use Preview 10-2025", "backend": "gemini" }, { "id": "antigravity-preview-05-2026", "apiModelId": "antigravity-preview-05-2026", "label": "Antigravity Agent Preview", "backend": "gemini" }, { "id": "deep-research-max-preview-04-2026", "apiModelId": "deep-research-max-preview-04-2026", "label": "Deep Research Max Preview (Apr-21-2026)", "backend": "gemini" }, { "id": "deep-research-preview-04-2026", "apiModelId": "deep-research-preview-04-2026", "label": "Deep Research Preview (Apr-21-2026)", "backend": "gemini" }, { "id": "deep-research-pro-preview-12-2025", "apiModelId": "deep-research-pro-preview-12-2025", "label": "Deep Research Pro Preview (Dec-12-2025)", "backend": "gemini" }, { "id": "claude-opus-4", "apiModelId": "claude-opus-4-20250514", "label": "Opus 4", "backend": "claude" }, { "id": "claude-sonnet-4", "apiModelId": "claude-sonnet-4-20250514", "label": "Sonnet 4", "backend": "claude" }, { "id": "claude-haiku-4-5", "apiModelId": "claude-haiku-4-5-20251001", "label": "Haiku 4.5", "backend": "claude" }, { "id": "claude-sonnet-4-5", "apiModelId": "claude-sonnet-4-5", "label": "Sonnet 4.5 (alias)", "backend": "claude" }, { "id": "claude-sonnet-4-6", "apiModelId": "claude-sonnet-4-6", "label": "Sonnet 4.6 (alias)", "backend": "claude" }, { "id": "claude-opus-4-6", "apiModelId": "claude-opus-4-6", "label": "Opus 4.6 (alias)", "backend": "claude" }, { "id": "groq-openai-gpt-oss-20b", "apiModelId": "openai/gpt-oss-20b", "label": "Openai/Gpt Oss 20b", "backend": "groq" }, { "id": "groq-canopylabs-orpheus-arabic-saudi", "apiModelId": "canopylabs/orpheus-arabic-saudi", "label": "Canopylabs/Orpheus Arabic Saudi", "backend": "groq" }, { "id": "groq-groq-compound-mini", "apiModelId": "groq/compound-mini", "label": "Groq/Compound Mini", "backend": "groq" }, { "id": "groq-groq-compound", "apiModelId": "groq/compound", "label": "Groq/Compound", "backend": "groq" }, { "id": "groq-llama-3.1-8b-instant", "apiModelId": "llama-3.1-8b-instant", "label": "Llama 3.1 8b Instant", "backend": "groq" }, { "id": "groq-llama-4-scout-17b-16e", "apiModelId": "meta-llama/llama-4-scout-17b-16e-instruct", "label": "Llama 4 Scout 17b 16e Instruct", "backend": "groq" }, { "id": "groq-llama-3.3-70b-versatile", "apiModelId": "llama-3.3-70b-versatile", "label": "Llama 3.3 70b Versatile", "backend": "groq" }, { "id": "groq-canopylabs-orpheus-v1-english", "apiModelId": "canopylabs/orpheus-v1-english", "label": "Canopylabs/Orpheus V1 English", "backend": "groq" }, { "id": "groq-allam-2-7b", "apiModelId": "allam-2-7b", "label": "Allam 2 7b", "backend": "groq" }, { "id": "groq-openai-gpt-oss-120b", "apiModelId": "openai/gpt-oss-120b", "label": "Openai/Gpt Oss 120b", "backend": "groq" }, { "id": "groq-qwen-qwen3-32b", "apiModelId": "qwen/qwen3-32b", "label": "Qwen/Qwen3 32b", "backend": "groq" }, { "id": "openai-gpt-5.5", "apiModelId": "gpt-5.5", "label": "GPT-5.5", "backend": "openai" }, { "id": "openai-gpt-5.5-pro", "apiModelId": "gpt-5.5-pro", "label": "GPT-5.5 Pro", "backend": "openai" }, { "id": "ollama-gemma4-e4b-it-q4-k-m", "apiModelId": "gemma4:e4b-it-q4_K_M", "label": "gemma4:e4b-it-q4_K_M (8.0B) Q4_K_M", "backend": "ollama" } ], "defaults": { "gemini": "gemini-3.1-flash-lite", "claude": "claude-sonnet-4-6", "groq": "groq-openai-gpt-oss-120b", "ollama": "ollama-gemma4-e4b-it-q4-k-m" }, "fallbackChains": { "gemini-3.1-pro-preview": [ "gemini-2.5-pro", "gemini-2.5-flash" ], "gemini-3-flash-preview": [ "gemini-2.5-flash", "groq-llama-3.3-70b-versatile" ], "gemini-3.1-flash-lite": [ "gemini-2.5-flash-lite", "groq-llama-3.1-8b-instant" ], "gemini-flash-lite-latest": [ "gemini-2.5-flash-lite", "groq-llama-3.1-8b-instant" ], "gemini-2.5-pro": [ "gemini-2.5-flash", "groq-llama-3.3-70b-versatile" ], "gemini-2.5-flash": [ "gemini-2.5-flash-lite", "groq-llama-3.3-70b-versatile" ], "gemini-2.5-flash-lite": [ "groq-llama-3.1-8b-instant" ], "claude-opus-4-7": [ "claude-sonnet-4-6", "gemini-2.5-pro" ], "claude-sonnet-4-6": [ "claude-haiku-4-5", "gemini-2.5-flash" ], "claude-haiku-4-5": [ "gemini-2.5-flash-lite", "groq-llama-3.1-8b-instant" ], "groq-llama-3.3-70b-versatile": [ "groq-llama-3.1-8b-instant", "gemini-2.5-flash" ], "groq-llama-4-scout-17b-16e": [ "groq-llama-3.3-70b-versatile", "gemini-2.5-flash" ], "groq-openai-gpt-oss-120b": [ "groq-llama-3.3-70b-versatile", "gemini-2.5-flash" ], "openai-gpt-5.5": [ "gemini-2.5-flash", "groq-llama-3.3-70b-versatile" ] }, "contextWindows": { "gemini": 1048576, "claude": 1048576, "groq": 131072, "openai": 131072, "ollama": 131072 }, "pricing": { "_comment": "USD per 1M tokens. cachedInputPer1M is the reduced rate for cache-hit input tokens. Updated 2026-05-03.", "gemini-3.1-pro-preview": { "inputPer1M": 3, "outputPer1M": 15 }, "gemini-3-flash-preview": { "inputPer1M": 0.75, "outputPer1M": 3 }, "gemini-flash-lite-latest": { "inputPer1M": 0.375, "outputPer1M": 1.5 }, "gemini-2.5-pro": { "inputPer1M": 1.25, "outputPer1M": 10, "cachedInputPer1M": 0.3125 }, "gemini-2.5-flash": { "inputPer1M": 0.3, "outputPer1M": 2.5, "cachedInputPer1M": 0.075 }, "gemini-2.5-flash-lite": { "inputPer1M": 0.1, "outputPer1M": 0.4, "cachedInputPer1M": 0.025 }, "gemini-2.0-flash": { "inputPer1M": 0.1, "outputPer1M": 0.4, "cachedInputPer1M": 0.025 }, "gemini-2.0-flash-lite": { "inputPer1M": 0.075, "outputPer1M": 0.3, "cachedInputPer1M": 0.01875 }, "claude-opus-4-7": { "inputPer1M": 5, "outputPer1M": 25, "cachedInputPer1M": 0.5 }, "claude-sonnet-4-6": { "inputPer1M": 3, "outputPer1M": 15, "cachedInputPer1M": 0.3 }, "claude-opus-4-6": { "inputPer1M": 5, "outputPer1M": 25, "cachedInputPer1M": 0.5 }, "claude-sonnet-4-5": { "inputPer1M": 3, "outputPer1M": 15, "cachedInputPer1M": 0.3 }, "claude-haiku-4-5": { "inputPer1M": 1, "outputPer1M": 5, "cachedInputPer1M": 0.1 }, "groq-llama-3.3-70b-versatile": { "inputPer1M": 0.59, "outputPer1M": 0.79 }, "groq-llama-3.1-8b-instant": { "inputPer1M": 0.05, "outputPer1M": 0.08 }, "groq-llama-4-scout-17b-16e": { "inputPer1M": 0.11, "outputPer1M": 0.34 }, "groq-openai-gpt-oss-120b": { "inputPer1M": 0.15, "outputPer1M": 0.6 }, "groq-openai-gpt-oss-20b": { "inputPer1M": 0.075, "outputPer1M": 0.3 }, "openai-gpt-5.5": { "inputPer1M": 2, "outputPer1M": 8 }, "openai-gpt-5.5-pro": { "inputPer1M": 10, "outputPer1M": 40 } }, "lastRefreshed": "2026-06-01T16:32:15.840Z" } |