{
  "$schema": "./models.schema.json",
  "updated": "2026-06-07",
  "models": [
    {
      "id": "anthropic/claude-opus-4.7",
      "provider": "Anthropic",
      "family": "Claude Opus",
      "version": "4.7",
      "released": "2026-04-15",
      "ctx": 1000000,
      "modality": [
        "text",
        "vision",
        "tool"
      ],
      "status": "current",
      "delta": "+0.3",
      "url": "https://www.anthropic.com/news",
      "notes": "Long-context reasoning improvements; better tool use under uncertainty; reduced sycophancy."
    },
    {
      "id": "anthropic/claude-sonnet-4.5",
      "provider": "Anthropic",
      "family": "Claude Sonnet",
      "version": "4.5",
      "released": "2026-03-20",
      "ctx": 1000000,
      "modality": [
        "text",
        "vision",
        "tool"
      ],
      "status": "current",
      "delta": "+0.1",
      "url": "https://www.anthropic.com/news",
      "notes": "Speed/cost-optimized; near-Opus reasoning on most benchmarks."
    },
    {
      "id": "anthropic/claude-haiku-4",
      "provider": "Anthropic",
      "family": "Claude Haiku",
      "version": "4",
      "released": "2026-02-10",
      "ctx": 500000,
      "modality": [
        "text",
        "vision"
      ],
      "status": "current",
      "delta": "—",
      "url": "https://www.anthropic.com/news",
      "notes": "Sub-second latency; agent workflows; budget tier."
    },
    {
      "id": "openai/gpt-5.5",
      "provider": "OpenAI",
      "family": "GPT",
      "version": "5.5",
      "released": "2026-05-01",
      "ctx": 400000,
      "modality": [
        "text",
        "vision",
        "audio",
        "tool"
      ],
      "status": "current",
      "delta": "+0.5",
      "url": "https://openai.com/blog",
      "notes": "Unified reasoning model; auto-router replaces o-series picker."
    },
    {
      "id": "openai/gpt-5",
      "provider": "OpenAI",
      "family": "GPT",
      "version": "5.0",
      "released": "2025-12-12",
      "ctx": 400000,
      "modality": [
        "text",
        "vision",
        "tool"
      ],
      "status": "stable",
      "delta": "—",
      "url": "https://openai.com/blog",
      "notes": "Initial GPT-5 launch; replaced o3/o4-mini routing."
    },
    {
      "id": "openai/o4-mini",
      "provider": "OpenAI",
      "family": "o-series",
      "version": "4-mini",
      "released": "2025-09-18",
      "ctx": 200000,
      "modality": [
        "text",
        "tool"
      ],
      "status": "legacy",
      "delta": "—",
      "url": "https://openai.com/blog",
      "notes": "Reasoning-tuned mini; superseded by GPT-5 auto-router."
    },
    {
      "id": "google/gemini-3-pro",
      "provider": "Google DeepMind",
      "family": "Gemini",
      "version": "3 Pro",
      "released": "2026-04-22",
      "ctx": 2000000,
      "modality": [
        "text",
        "vision",
        "audio",
        "video",
        "tool"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://deepmind.google/discover/blog/",
      "notes": "2M token context; native video understanding; Deep Think mode."
    },
    {
      "id": "google/gemini-3-flash",
      "provider": "Google DeepMind",
      "family": "Gemini",
      "version": "3 Flash",
      "released": "2026-04-22",
      "ctx": 1000000,
      "modality": [
        "text",
        "vision",
        "audio"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://deepmind.google/discover/blog/",
      "notes": "High-throughput tier; multimodal at low latency."
    },
    {
      "id": "google/gemini-3-nano",
      "provider": "Google DeepMind",
      "family": "Gemini",
      "version": "3 Nano",
      "released": "2026-04-22",
      "ctx": 128000,
      "modality": [
        "text",
        "vision"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://deepmind.google/discover/blog/",
      "notes": "On-device tier; ships with newer Pixel/Android devices."
    },
    {
      "id": "xai/grok-4.3",
      "provider": "xAI",
      "family": "Grok",
      "version": "4.3",
      "released": "2026-05-15",
      "ctx": 256000,
      "modality": [
        "text",
        "vision",
        "tool"
      ],
      "status": "current",
      "delta": "+0.3",
      "url": "https://x.ai/blog",
      "notes": "Real-time X integration; agent improvements; faster tool loops."
    },
    {
      "id": "xai/grok-4-heavy",
      "provider": "xAI",
      "family": "Grok",
      "version": "4 Heavy",
      "released": "2025-11-30",
      "ctx": 256000,
      "modality": [
        "text",
        "vision",
        "tool"
      ],
      "status": "stable",
      "delta": "—",
      "url": "https://x.ai/blog",
      "notes": "Multi-agent reasoning tier (premium plus)."
    },
    {
      "id": "meta/llama-4-maverick",
      "provider": "Meta",
      "family": "Llama",
      "version": "4 Maverick",
      "released": "2025-10-01",
      "ctx": 1000000,
      "modality": [
        "text",
        "vision"
      ],
      "status": "current",
      "delta": "—",
      "url": "https://ai.meta.com/blog/",
      "notes": "MoE; 17B active / 400B total; instruction-tuned flagship open weights."
    },
    {
      "id": "meta/llama-4-scout",
      "provider": "Meta",
      "family": "Llama",
      "version": "4 Scout",
      "released": "2025-10-01",
      "ctx": 10000000,
      "modality": [
        "text",
        "vision"
      ],
      "status": "current",
      "delta": "—",
      "url": "https://ai.meta.com/blog/",
      "notes": "10M token context; MoE 17B active / 109B total."
    },
    {
      "id": "meta/llama-4-behemoth",
      "provider": "Meta",
      "family": "Llama",
      "version": "4 Behemoth",
      "released": "2025-12-15",
      "ctx": 1000000,
      "modality": [
        "text",
        "vision"
      ],
      "status": "current",
      "delta": "—",
      "url": "https://ai.meta.com/blog/",
      "notes": "2T total params; teacher model; not open-weight (yet)."
    },
    {
      "id": "mistral/mistral-large-3",
      "provider": "Mistral",
      "family": "Mistral",
      "version": "Large 3",
      "released": "2026-01-22",
      "ctx": 256000,
      "modality": [
        "text",
        "vision",
        "tool"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://mistral.ai/news/",
      "notes": "Improved multilingual capabilities; function-calling parity with frontier models."
    },
    {
      "id": "mistral/codestral-25",
      "provider": "Mistral",
      "family": "Codestral",
      "version": "25",
      "released": "2025-08-14",
      "ctx": 256000,
      "modality": [
        "text"
      ],
      "status": "current",
      "delta": "—",
      "url": "https://mistral.ai/news/",
      "notes": "Code-specialized; 80+ languages; FIM optimized."
    },
    {
      "id": "deepseek/deepseek-v4",
      "provider": "DeepSeek",
      "family": "DeepSeek",
      "version": "V4",
      "released": "2026-02-28",
      "ctx": 128000,
      "modality": [
        "text",
        "tool"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://api-docs.deepseek.com",
      "notes": "MoE architecture refinements; aggressive pricing remains."
    },
    {
      "id": "deepseek/deepseek-r2",
      "provider": "DeepSeek",
      "family": "DeepSeek-R (reasoning)",
      "version": "R2",
      "released": "2026-03-15",
      "ctx": 128000,
      "modality": [
        "text"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://api-docs.deepseek.com",
      "notes": "Chain-of-thought reasoning successor to R1; open weights."
    },
    {
      "id": "alibaba/qwen-3-max",
      "provider": "Alibaba",
      "family": "Qwen",
      "version": "3 Max",
      "released": "2026-01-10",
      "ctx": 1000000,
      "modality": [
        "text",
        "vision",
        "audio"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://qwenlm.github.io/blog/",
      "notes": "Massively multilingual; strong code; competitive with frontier closed models."
    },
    {
      "id": "alibaba/qwen-3-coder",
      "provider": "Alibaba",
      "family": "Qwen",
      "version": "3 Coder",
      "released": "2026-02-20",
      "ctx": 256000,
      "modality": [
        "text"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://qwenlm.github.io/blog/",
      "notes": "Agent-tuned coder model; open weights."
    },
    {
      "id": "cohere/command-r-plus-3",
      "provider": "Cohere",
      "family": "Command",
      "version": "R+ 3",
      "released": "2026-03-05",
      "ctx": 256000,
      "modality": [
        "text",
        "tool"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://cohere.com/blog",
      "notes": "RAG-specialized; tool-use leader at this tier."
    },
    {
      "id": "nousresearch/hermes-5",
      "provider": "Nous Research",
      "family": "Hermes",
      "version": "5",
      "released": "2026-04-10",
      "ctx": 256000,
      "modality": [
        "text",
        "tool"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://nousresearch.com",
      "notes": "Open-source agent model; trained on real tool-call traces."
    },
    {
      "id": "perplexity/sonar-pro-2",
      "provider": "Perplexity",
      "family": "Sonar",
      "version": "Pro 2",
      "released": "2026-04-01",
      "ctx": 200000,
      "modality": [
        "text",
        "tool"
      ],
      "status": "current",
      "delta": "+1.0",
      "url": "https://perplexity.ai/hub",
      "notes": "Search-grounded; web-native answers; citations first-class."
    },
    {
      "id": "01ai/yi-large-2",
      "provider": "01.AI",
      "family": "Yi",
      "version": "Large 2",
      "released": "2025-11-12",
      "ctx": 200000,
      "modality": [
        "text"
      ],
      "status": "current",
      "delta": "—",
      "url": "https://01.ai",
      "notes": "Bilingual leader (en/zh); strong reasoning at mid-tier price."
    }
  ]
}