{
  "lastUpdated": "2026-04-26",
  "currency": "USD",
  "unit": "per_million_tokens",
  "note": "Prices are best-effort manual snapshots from each provider's pricing page. Verify before invoicing. See /pricing-changelog/ for change history.",
  "models": [
    {
      "slug": "claude-opus",
      "displayName": "Claude Opus 4.7",
      "provider": "anthropic",
      "family": "claude",
      "apiId": "claude-opus-4-7",
      "contextWindow": 200000,
      "input": 15.00,
      "output": 75.00,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "api",
      "confidence": "exact",
      "notes": "Pricing from anthropic.com/pricing"
    },
    {
      "slug": "claude-sonnet",
      "displayName": "Claude Sonnet 4.6",
      "provider": "anthropic",
      "family": "claude",
      "apiId": "claude-sonnet-4-6",
      "contextWindow": 200000,
      "input": 3.00,
      "output": 15.00,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "api",
      "confidence": "exact",
      "notes": "Pricing from anthropic.com/pricing"
    },
    {
      "slug": "claude-haiku",
      "displayName": "Claude Haiku 4.5",
      "provider": "anthropic",
      "family": "claude",
      "apiId": "claude-haiku-4-5-20251001",
      "contextWindow": 200000,
      "input": 0.80,
      "output": 4.00,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "api",
      "confidence": "exact",
      "notes": "Pricing from anthropic.com/pricing"
    },
    {
      "slug": "gpt-4o",
      "displayName": "GPT-4o",
      "provider": "openai",
      "family": "gpt",
      "apiId": "gpt-4o-2024-08-06",
      "contextWindow": 128000,
      "input": 2.50,
      "output": 10.00,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-tiktoken-o200k",
      "confidence": "exact",
      "notes": "Pricing from openai.com/api/pricing"
    },
    {
      "slug": "gpt-4o-mini",
      "displayName": "GPT-4o mini",
      "provider": "openai",
      "family": "gpt",
      "apiId": "gpt-4o-mini",
      "contextWindow": 128000,
      "input": 0.15,
      "output": 0.60,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-tiktoken-o200k",
      "confidence": "exact",
      "notes": "Pricing from openai.com/api/pricing"
    },
    {
      "slug": "gpt-4-turbo",
      "displayName": "GPT-4 Turbo",
      "provider": "openai",
      "family": "gpt",
      "apiId": "gpt-4-turbo-2024-04-09",
      "contextWindow": 128000,
      "input": 10.00,
      "output": 30.00,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-tiktoken-cl100k",
      "confidence": "exact",
      "notes": "Pricing from openai.com/api/pricing"
    },
    {
      "slug": "gemini-2-5-pro",
      "displayName": "Gemini 2.5 Pro",
      "provider": "google",
      "family": "gemini",
      "apiId": "gemini-2.5-pro",
      "contextWindow": 2000000,
      "input": 1.25,
      "output": 10.00,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "api",
      "confidence": "exact",
      "notes": "Pricing from ai.google.dev/pricing — input rate for ≤200k context"
    },
    {
      "slug": "gemini-2-5-flash",
      "displayName": "Gemini 2.5 Flash",
      "provider": "google",
      "family": "gemini",
      "apiId": "gemini-2.5-flash",
      "contextWindow": 1000000,
      "input": 0.075,
      "output": 0.30,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "api",
      "confidence": "exact",
      "notes": "Pricing from ai.google.dev/pricing"
    },
    {
      "slug": "llama-3-1-405b",
      "displayName": "Llama 3.1 405B",
      "provider": "meta",
      "family": "llama",
      "apiId": "meta-llama/llama-3.1-405b-instruct",
      "contextWindow": 128000,
      "input": 3.50,
      "output": 3.50,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-bpe-llama",
      "confidence": "approx-3pct",
      "notes": "Indicative pricing via Together.ai; tokenizer ≈±3% vs reference"
    },
    {
      "slug": "llama-3-1-70b",
      "displayName": "Llama 3.1 70B",
      "provider": "meta",
      "family": "llama",
      "apiId": "meta-llama/llama-3.1-70b-instruct",
      "contextWindow": 128000,
      "input": 0.59,
      "output": 0.79,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-bpe-llama",
      "confidence": "approx-3pct",
      "notes": "Indicative pricing via Together.ai; tokenizer ≈±3% vs reference"
    },
    {
      "slug": "llama-3-1-8b",
      "displayName": "Llama 3.1 8B",
      "provider": "meta",
      "family": "llama",
      "apiId": "meta-llama/llama-3.1-8b-instruct",
      "contextWindow": 128000,
      "input": 0.18,
      "output": 0.18,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-bpe-llama",
      "confidence": "approx-3pct",
      "notes": "Indicative pricing via Together.ai; tokenizer ≈±3% vs reference"
    },
    {
      "slug": "mistral-large",
      "displayName": "Mistral Large",
      "provider": "mistral",
      "family": "mistral",
      "apiId": "mistral-large-latest",
      "contextWindow": 128000,
      "input": 2.00,
      "output": 6.00,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-bpe-mistral",
      "confidence": "approx-3pct",
      "notes": "Pricing from mistral.ai/pricing; tokenizer ≈±3% vs reference"
    },
    {
      "slug": "deepseek-v3",
      "displayName": "DeepSeek V3",
      "provider": "deepseek",
      "family": "deepseek",
      "apiId": "deepseek-chat",
      "contextWindow": 128000,
      "input": 0.27,
      "output": 1.10,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-bpe-deepseek",
      "confidence": "approx-3pct",
      "notes": "Pricing from api-docs.deepseek.com; tokenizer ≈±3% vs reference"
    },
    {
      "slug": "qwen-2-5-72b",
      "displayName": "Qwen 2.5 72B",
      "provider": "alibaba",
      "family": "qwen",
      "apiId": "qwen2.5-72b-instruct",
      "contextWindow": 131072,
      "input": 0.90,
      "output": 0.90,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-bpe-qwen",
      "confidence": "approx-3pct",
      "notes": "Indicative pricing via Together.ai; tokenizer ≈±3% vs reference"
    },
    {
      "slug": "qwen-2-5-coder",
      "displayName": "Qwen 2.5 Coder 32B",
      "provider": "alibaba",
      "family": "qwen",
      "apiId": "qwen2.5-coder-32b-instruct",
      "contextWindow": 131072,
      "input": 0.80,
      "output": 0.80,
      "deprecated": false,
      "deprecatedAt": null,
      "tokenizerStrategy": "browser-bpe-qwen",
      "confidence": "approx-3pct",
      "notes": "Indicative pricing via Together.ai; tokenizer ≈±3% vs reference"
    }
  ]
}
