ai-models.json

{
  "backends": [
    {
      "id": "gemini",
      "label": "Google Gemini"
    },
    {
      "id": "claude",
      "label": "Anthropic Claude"
    },
    {
      "id": "groq",
      "label": "Groq"
    },
    {
      "id": "openai",
      "label": "OpenAI"
    }
  ],
  "models": [
    {
      "id": "gemini-2.5-flash",
      "apiModelId": "gemini-2.5-flash",
      "label": "Gemini 2.5 Flash",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.5-pro",
      "apiModelId": "gemini-2.5-pro",
      "label": "Gemini 2.5 Pro",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.0-flash",
      "apiModelId": "gemini-2.0-flash",
      "label": "Gemini 2.0 Flash",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.0-flash-001",
      "apiModelId": "gemini-2.0-flash-001",
      "label": "Gemini 2.0 Flash 001",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.0-flash-lite-001",
      "apiModelId": "gemini-2.0-flash-lite-001",
      "label": "Gemini 2.0 Flash-Lite 001",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.0-flash-lite",
      "apiModelId": "gemini-2.0-flash-lite",
      "label": "Gemini 2.0 Flash-Lite",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.5-flash-preview-tts",
      "apiModelId": "gemini-2.5-flash-preview-tts",
      "label": "Gemini 2.5 Flash Preview TTS",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.5-pro-preview-tts",
      "apiModelId": "gemini-2.5-pro-preview-tts",
      "label": "Gemini 2.5 Pro Preview TTS",
      "backend": "gemini"
    },
    {
      "id": "gemma-3-1b-it",
      "apiModelId": "gemma-3-1b-it",
      "label": "Gemma 3 1B",
      "backend": "gemini"
    },
    {
      "id": "gemma-3-4b-it",
      "apiModelId": "gemma-3-4b-it",
      "label": "Gemma 3 4B",
      "backend": "gemini"
    },
    {
      "id": "gemma-3-12b-it",
      "apiModelId": "gemma-3-12b-it",
      "label": "Gemma 3 12B",
      "backend": "gemini"
    },
    {
      "id": "gemma-3-27b-it",
      "apiModelId": "gemma-3-27b-it",
      "label": "Gemma 3 27B",
      "backend": "gemini"
    },
    {
      "id": "gemma-3n-e4b-it",
      "apiModelId": "gemma-3n-e4b-it",
      "label": "Gemma 3n E4B",
      "backend": "gemini"
    },
    {
      "id": "gemma-3n-e2b-it",
      "apiModelId": "gemma-3n-e2b-it",
      "label": "Gemma 3n E2B",
      "backend": "gemini"
    },
    {
      "id": "gemini-flash-latest",
      "apiModelId": "gemini-flash-latest",
      "label": "Gemini Flash Latest",
      "backend": "gemini"
    },
    {
      "id": "gemini-flash-lite-latest",
      "apiModelId": "gemini-flash-lite-latest",
      "label": "Gemini Flash-Lite Latest",
      "backend": "gemini"
    },
    {
      "id": "gemini-pro-latest",
      "apiModelId": "gemini-pro-latest",
      "label": "Gemini Pro Latest",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.5-flash-lite",
      "apiModelId": "gemini-2.5-flash-lite",
      "label": "Gemini 2.5 Flash-Lite",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.5-flash-image",
      "apiModelId": "gemini-2.5-flash-image",
      "label": "Nano Banana",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.5-flash-lite-preview-09-2025",
      "apiModelId": "gemini-2.5-flash-lite-preview-09-2025",
      "label": "Gemini 2.5 Flash-Lite Preview Sep 2025",
      "backend": "gemini"
    },
    {
      "id": "gemini-3-pro-preview",
      "apiModelId": "gemini-3.1-pro-preview",
      "label": "Gemini 3 Pro Preview (redirects to 3.1)",
      "backend": "gemini"
    },
    {
      "id": "gemini-3-flash-preview",
      "apiModelId": "gemini-3-flash-preview",
      "label": "Gemini 3 Flash Preview",
      "backend": "gemini"
    },
    {
      "id": "gemini-3.1-pro-preview",
      "apiModelId": "gemini-3.1-pro-preview",
      "label": "Gemini 3.1 Pro Preview",
      "backend": "gemini"
    },
    {
      "id": "gemini-3.1-pro-preview-customtools",
      "apiModelId": "gemini-3.1-pro-preview-customtools",
      "label": "Gemini 3.1 Pro Preview Custom Tools",
      "backend": "gemini"
    },
    {
      "id": "gemini-3.1-flash-lite-preview",
      "apiModelId": "gemini-3.1-flash-lite-preview",
      "label": "Gemini 3.1 Flash-Lite Preview",
      "backend": "gemini"
    },
    {
      "id": "gemini-3-pro-image-preview",
      "apiModelId": "gemini-3-pro-image-preview",
      "label": "Nano Banana Pro",
      "backend": "gemini"
    },
    {
      "id": "nano-banana-pro-preview",
      "apiModelId": "nano-banana-pro-preview",
      "label": "Nano Banana Pro Preview",
      "backend": "gemini"
    },
    {
      "id": "gemini-3.1-flash-image-preview",
      "apiModelId": "gemini-3.1-flash-image-preview",
      "label": "Nano Banana 2",
      "backend": "gemini"
    },
    {
      "id": "lyria-3-clip-preview",
      "apiModelId": "lyria-3-clip-preview",
      "label": "Lyria 3 Clip Preview",
      "backend": "gemini"
    },
    {
      "id": "lyria-3-pro-preview",
      "apiModelId": "lyria-3-pro-preview",
      "label": "Lyria 3 Pro Preview",
      "backend": "gemini"
    },
    {
      "id": "gemini-robotics-er-1.5-preview",
      "apiModelId": "gemini-robotics-er-1.5-preview",
      "label": "Gemini Robotics-ER 1.5 Preview",
      "backend": "gemini"
    },
    {
      "id": "gemini-2.5-computer-use-preview-10-2025",
      "apiModelId": "gemini-2.5-computer-use-preview-10-2025",
      "label": "Gemini 2.5 Computer Use Preview Oct 2025",
      "backend": "gemini"
    },
    {
      "id": "deep-research-pro-preview-12-2025",
      "apiModelId": "deep-research-pro-preview-12-2025",
      "label": "Deep Research Pro Preview (Dec 2025)",
      "backend": "gemini"
    },
    {
      "id": "claude-opus-4-7",
      "apiModelId": "claude-opus-4-7",
      "label": "Opus 4.7 (flagship)",
      "backend": "claude"
    },
    {
      "id": "claude-sonnet-4-6",
      "apiModelId": "claude-sonnet-4-6",
      "label": "Sonnet 4.6",
      "backend": "claude"
    },
    {
      "id": "claude-haiku-4-5",
      "apiModelId": "claude-haiku-4-5-20251001",
      "label": "Haiku 4.5",
      "backend": "claude"
    },
    {
      "id": "claude-opus-4-6",
      "apiModelId": "claude-opus-4-6",
      "label": "Opus 4.6 (legacy)",
      "backend": "claude"
    },
    {
      "id": "claude-sonnet-4-5",
      "apiModelId": "claude-sonnet-4-5",
      "label": "Sonnet 4.5 (legacy)",
      "backend": "claude"
    },
    {
      "id": "groq-allam-2-7b",
      "apiModelId": "allam-2-7b",
      "label": "ALLaM 2 7B",
      "backend": "groq"
    },
    {
      "id": "groq-openai-gpt-oss-120b",
      "apiModelId": "openai/gpt-oss-120b",
      "label": "OpenAI/GPT-OSS 120B",
      "backend": "groq"
    },
    {
      "id": "groq-qwen-qwen3-32b",
      "apiModelId": "qwen/qwen3-32b",
      "label": "Qwen/Qwen3 32B",
      "backend": "groq"
    },
    {
      "id": "groq-llama-4-scout-17b-16e",
      "apiModelId": "meta-llama/llama-4-scout-17b-16e-instruct",
      "label": "Llama 4 Scout 17B 16E Instruct",
      "backend": "groq"
    },
    {
      "id": "groq-llama-3.1-8b-instant",
      "apiModelId": "llama-3.1-8b-instant",
      "label": "Llama 3.1 8B Instant",
      "backend": "groq"
    },
    {
      "id": "groq-llama-3.3-70b-versatile",
      "apiModelId": "llama-3.3-70b-versatile",
      "label": "Llama 3.3 70B Versatile",
      "backend": "groq"
    },
    {
      "id": "groq-moonshotai-kimi-k2-instruct-0905",
      "apiModelId": "moonshotai/kimi-k2-instruct-0905",
      "label": "Moonshot AI/Kimi K2 Instruct 0905",
      "backend": "groq"
    },
    {
      "id": "groq-moonshotai-kimi-k2",
      "apiModelId": "moonshotai/kimi-k2-instruct",
      "label": "Moonshot AI/Kimi K2 Instruct",
      "backend": "groq"
    },
    {
      "id": "groq-groq-compound",
      "apiModelId": "groq/compound",
      "label": "Groq/Compound",
      "backend": "groq"
    },
    {
      "id": "groq-groq-compound-mini",
      "apiModelId": "groq/compound-mini",
      "label": "Groq/Compound Mini",
      "backend": "groq"
    },
    {
      "id": "groq-canopylabs-orpheus-v1-english",
      "apiModelId": "canopylabs/orpheus-v1-english",
      "label": "Canopy Labs/Orpheus V1 English",
      "backend": "groq"
    },
    {
      "id": "groq-canopylabs-orpheus-arabic-saudi",
      "apiModelId": "canopylabs/orpheus-arabic-saudi",
      "label": "Canopy Labs/Orpheus Arabic Saudi",
      "backend": "groq"
    },
    {
      "id": "groq-openai-gpt-oss-20b",
      "apiModelId": "openai/gpt-oss-20b",
      "label": "OpenAI/GPT-OSS 20B",
      "backend": "groq"
    },
    {
      "id": "openai-gpt-5.5",
      "apiModelId": "gpt-5.5",
      "label": "GPT-5.5",
      "backend": "openai"
    },
    {
      "id": "openai-gpt-5.5-pro",
      "apiModelId": "gpt-5.5-pro",
      "label": "GPT-5.5 Pro",
      "backend": "openai"
    }
  ],
  "defaults": {
    "gemini": "gemini-3.1-flash-lite-preview",
    "claude": "claude-sonnet-4-6",
    "groq": "groq-openai-gpt-oss-120b"
  },
  "fallbackChains": {
    "gemini-3.1-pro-preview": ["gemini-2.5-pro", "gemini-2.5-flash"],
    "gemini-3-flash-preview": ["gemini-2.5-flash", "groq-llama-3.3-70b-versatile"],
    "gemini-3.1-flash-lite-preview": ["gemini-2.5-flash-lite", "groq-llama-3.1-8b-instant"],
    "gemini-2.5-pro": ["gemini-2.5-flash", "groq-llama-3.3-70b-versatile"],
    "gemini-2.5-flash": ["gemini-2.5-flash-lite", "groq-llama-3.3-70b-versatile"],
    "gemini-2.5-flash-lite": ["groq-llama-3.1-8b-instant"],
    "claude-opus-4-7": ["claude-sonnet-4-6", "gemini-2.5-pro"],
    "claude-sonnet-4-6": ["claude-haiku-4-5", "gemini-2.5-flash"],
    "claude-haiku-4-5": ["gemini-2.5-flash-lite", "groq-llama-3.1-8b-instant"],
    "groq-llama-3.3-70b-versatile": ["groq-llama-3.1-8b-instant", "gemini-2.5-flash"],
    "groq-llama-4-scout-17b-16e": ["groq-llama-3.3-70b-versatile", "gemini-2.5-flash"],
    "groq-openai-gpt-oss-120b": ["groq-llama-3.3-70b-versatile", "gemini-2.5-flash"],
    "openai-gpt-5.5": ["gemini-2.5-flash", "groq-llama-3.3-70b-versatile"]
  },
  "contextWindows": {
    "gemini": 1048576,
    "claude": 1048576,
    "groq": 131072,
    "openai": 131072
  },
  "pricing": {
    "_comment": "USD per 1M tokens. cachedInputPer1M is optional: when present it is the reduced rate for cache-hit input tokens; entries without it list no cached rate. Updated 2026-05-03.",
    "gemini-3.1-pro-preview": { "inputPer1M": 3.00, "outputPer1M": 15.00 },
    "gemini-3-flash-preview": { "inputPer1M": 0.75, "outputPer1M": 3.00 },
    "gemini-3.1-flash-lite-preview": { "inputPer1M": 0.375, "outputPer1M": 1.50 },
    "gemini-2.5-pro": { "inputPer1M": 1.25, "outputPer1M": 10.00, "cachedInputPer1M": 0.3125 },
    "gemini-2.5-flash": { "inputPer1M": 0.30, "outputPer1M": 2.50, "cachedInputPer1M": 0.075 },
    "gemini-2.5-flash-lite": { "inputPer1M": 0.10, "outputPer1M": 0.40, "cachedInputPer1M": 0.025 },
    "gemini-2.0-flash": { "inputPer1M": 0.10, "outputPer1M": 0.40, "cachedInputPer1M": 0.025 },
    "gemini-2.0-flash-lite": { "inputPer1M": 0.075, "outputPer1M": 0.30, "cachedInputPer1M": 0.01875 },
    "claude-opus-4-7": { "inputPer1M": 5.00, "outputPer1M": 25.00, "cachedInputPer1M": 0.50 },
    "claude-sonnet-4-6": { "inputPer1M": 3.00, "outputPer1M": 15.00, "cachedInputPer1M": 0.30 },
    "claude-opus-4-6": { "inputPer1M": 5.00, "outputPer1M": 25.00, "cachedInputPer1M": 0.50 },
    "claude-sonnet-4-5": { "inputPer1M": 3.00, "outputPer1M": 15.00, "cachedInputPer1M": 0.30 },
    "claude-haiku-4-5": { "inputPer1M": 1.00, "outputPer1M": 5.00, "cachedInputPer1M": 0.10 },
    "groq-llama-3.3-70b-versatile": { "inputPer1M": 0.59, "outputPer1M": 0.79 },
    "groq-llama-3.1-8b-instant": { "inputPer1M": 0.05, "outputPer1M": 0.08 },
    "groq-llama-4-scout-17b-16e": { "inputPer1M": 0.11, "outputPer1M": 0.34 },
    "groq-openai-gpt-oss-120b": { "inputPer1M": 0.15, "outputPer1M": 0.60 },
    "groq-openai-gpt-oss-20b": { "inputPer1M": 0.075, "outputPer1M": 0.30 },
    "openai-gpt-5.5": { "inputPer1M": 2.00, "outputPer1M": 8.00 },
    "openai-gpt-5.5-pro": { "inputPer1M": 10.00, "outputPer1M": 40.00 }
  },
  "lastRefreshed": "2026-05-03T10:30:00.000Z"
}