<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <title>AI Frontier Model Tracker - New Releases</title>
    <description>New frontier AI model releases tracked by DemandSphere. Benchmarks, pricing, and capabilities from OpenAI, Anthropic, Google, xAI, Meta, DeepSeek, and more.</description>
    <link>https://www.demandsphere.com/research/ai-frontier-model-tracker/releases/</link>
    <atom:link href="https://www.demandsphere.com/research/ai-frontier-model-tracker/releases/feed.xml" rel="self" type="application/rss+xml"/>
    <language>en-us</language>
    <lastBuildDate>Sun, 12 Apr 2026 18:29:31 +0000</lastBuildDate>
    <copyright>CC BY-NC 4.0 DemandSphere, Inc.</copyright>
    
    
    
    <item>
      <title>Muse Spark (Meta) - Reasoning</title>
      <description>First model from Meta Superintelligence Labs. 89.5% GPQA Diamond, 50.2% HLE (Contemplating mode). Natively multimodal with visual chain of thought and multi-agent orchestration. 262K context. Free at meta.ai. #1 on HealthBench Hard (42.8) and CharXiv Reasoning (86.4). Context: 262K tokens.</description>
      <link>https://ai.meta.com/blog/introducing-muse-spark-msl/</link>
      <guid isPermaLink="false">ds-tracker-muse-spark-2026-04-08</guid>
      <pubDate>Wed, 08 Apr 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>Meta</category>
    </item>
    
    
    <item>
      <title>Gemma 4 26B-A4B (Google) - General</title>
      <description>MoE - 3.8B active / 25.2B total. Near 31B performance at a fraction of the compute. Apache 2.0. Context: 256K tokens. Open weights.</description>
      <link>https://ai.google.dev/gemma/docs/core/model_card_4</link>
      <guid isPermaLink="false">ds-tracker-ge4-26-2026-04-02</guid>
      <pubDate>Thu, 02 Apr 2026 00:00:00 +0000</pubDate>
      <category>General</category>
      <category>Open</category>
      <category>Google</category>
    </item>
    
    
    <item>
      <title>Gemma 4 31B (Google) - General</title>
      <description>Strongest open Gemma model. 85.2% MMLU-Pro, 84.3% GPQA Diamond. Hybrid attention with sliding window. Apache 2.0. Context: 256K tokens. Open weights.</description>
      <link>https://ai.google.dev/gemma/docs/core/model_card_4</link>
      <guid isPermaLink="false">ds-tracker-ge4-31-2026-04-02</guid>
      <pubDate>Thu, 02 Apr 2026 00:00:00 +0000</pubDate>
      <category>General</category>
      <category>Open</category>
      <category>Google</category>
    </item>
    
    
    <item>
      <title>MiniMax M2.7 (MiniMax) - Reasoning</title>
      <description>MiniMax March 2026 flagship. Self-evolving agentic model. 56.2% SWE-Pro. 205K context with automatic caching. $0.30/$1.20 per 1M tokens. Context: 205K tokens. Pricing: $0.30/M input, $1.20/M output.</description>
      <link>https://openrouter.ai/minimax/minimax-m2.7</link>
      <guid isPermaLink="false">ds-tracker-mm27-2026-03-18</guid>
      <pubDate>Wed, 18 Mar 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>MiniMax</category>
    </item>
    
    
    <item>
      <title>GPT-5.4 Mini (OpenAI) - Reasoning</title>
      <description>Cost-efficient reasoning model. 400K context. Near GPT-5.4 Standard performance at 70% lower cost. Multimodal with computer use support. Context: 400K tokens. Pricing: $0.75/M input, $4.50/M output.</description>
      <link>https://openai.com/index/introducing-gpt-5-4-mini-and-nano/</link>
      <guid isPermaLink="false">ds-tracker-gpt-54m-2026-03-17</guid>
      <pubDate>Tue, 17 Mar 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>OpenAI</category>
    </item>
    
    
    <item>
      <title>Grok 4.20 (xAI) - Reasoning</title>
      <description>xAI current flagship as of March 31, 2026. 2M token context window. Four-agent collaborative variant available. Reasoning on/off toggle. $2/$6 per 1M tokens. Context: 2000K tokens. Pricing: $2/M input, $6/M output.</description>
      <link>https://docs.x.ai/developers/models</link>
      <guid isPermaLink="false">ds-tracker-grok420-2026-03-10</guid>
      <pubDate>Tue, 10 Mar 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>xAI</category>
    </item>
    
    
    <item>
      <title>GPT-5.4 (OpenAI) - Reasoning</title>
      <description>OpenAI March 2026 flagship. First model with native Computer Use API (75% OSWorld, above human baseline of 72.4%). 1M context in Codex/API. 33% fewer hallucinations vs GPT-5.2. 83% GDPval. GPT-5.2 retires June 5, 2026. Context: 1050K tokens. Pricing: $2.50/M input, $15/M output.</description>
      <link>https://openai.com/index/introducing-gpt-5-4/</link>
      <guid isPermaLink="false">ds-tracker-gpt-54-2026-03-05</guid>
      <pubDate>Thu, 05 Mar 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>OpenAI</category>
    </item>
    
    
    <item>
      <title>Gemini 3.1 Pro (Google) - Reasoning</title>
      <description>First model to break 1500 LMArena Elo. 94.3% GPQA Diamond. 41% HLE - highest published score. Deep Think mode. 1M context. $4/$18 per 1M input/output tokens for context above 200K tokens. Context: 1000K tokens. Pricing: $2/M input, $12/M output.</description>
      <link>https://ai.google.dev/gemini-api/docs/models</link>
      <guid isPermaLink="false">ds-tracker-g3p-2026-02-19</guid>
      <pubDate>Thu, 19 Feb 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>Google</category>
    </item>
    
    
    <item>
      <title>Claude Sonnet 4.6 (Anthropic) - General</title>
      <description>Current production Sonnet. Frontier coding and agent performance. Top Arena-Code Elo for everyday use. Context: 1000K tokens. Pricing: $3/M input, $15/M output.</description>
      <link>https://docs.anthropic.com/en/docs/about-claude/models</link>
      <guid isPermaLink="false">ds-tracker-cs46-2026-02-17</guid>
      <pubDate>Tue, 17 Feb 2026 00:00:00 +0000</pubDate>
      <category>General</category>
      <category>Closed</category>
      <category>Anthropic</category>
    </item>
    
    
    <item>
      <title>Qwen3.5 397B-A17B (Alibaba/Qwen) - Reasoning</title>
      <description>MoE - 17B active / 397B total. 88.4% GPQA Diamond. 201 languages. Extensible to 1M context. Apache 2.0. Context: 262K tokens. Pricing: $0.60/M input, $3.60/M output. Open weights.</description>
      <link>https://qwen.ai/blog/qwen3.5</link>
      <guid isPermaLink="false">ds-tracker-qw35-2026-02-16</guid>
      <pubDate>Mon, 16 Feb 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Open</category>
      <category>Alibaba/Qwen</category>
    </item>
    
    
    <item>
      <title>MiniMax M2.5 (MiniMax) - Reasoning</title>
      <description>229B MoE / 10B active. 80.2% SWE-bench. 0.6 points behind Claude Opus 4.6. Most-used open model on OpenRouter. Context: 205K tokens. Pricing: $0.30/M input, $2.40/M output. Open weights.</description>
      <link>https://www.minimax.io/news/minimax-m25</link>
      <guid isPermaLink="false">ds-tracker-mm25-2026-02-12</guid>
      <pubDate>Thu, 12 Feb 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Open</category>
      <category>MiniMax</category>
    </item>
    
    
    <item>
      <title>Claude Opus 4.6 (Anthropic) - Reasoning</title>
      <description>Arena Code Elo 1548. 80.8% SWE-bench. 89.11% MMLU-Pro (vals.ai). Leads for coding and nuanced writing. Context: 1000K tokens. Pricing: $5/M input, $25/M output.</description>
      <link>https://docs.anthropic.com/en/docs/about-claude/models</link>
      <guid isPermaLink="false">ds-tracker-co46-2026-02-05</guid>
      <pubDate>Thu, 05 Feb 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>Anthropic</category>
    </item>
    
    
    <item>
      <title>Kimi K2.5 (Moonshot AI) - Reasoning</title>
      <description>Multimodal K2 with native vision and video. Agent Swarm: up to 100 parallel sub-agents. Modified MIT. Context: 262K tokens. Pricing: $0.60/M input, $2.50/M output. Open weights.</description>
      <link>https://kimi.ai</link>
      <guid isPermaLink="false">ds-tracker-kk25-2026-01-27</guid>
      <pubDate>Tue, 27 Jan 2026 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Open</category>
      <category>Moonshot AI</category>
    </item>
    
    
    <item>
      <title>Gemini 3 Flash (Google) - General</title>
      <description>Budget champion - 78% SWE-bench, 90.4% GPQA Diamond, 99.7% AIME 2025. Best value among Dec 2025 frontier models. Context: 1000K tokens. Pricing: $0.50/M input, $3/M output.</description>
      <link>https://ai.google.dev/gemini-api/docs/models</link>
      <guid isPermaLink="false">ds-tracker-g3f-2025-12-17</guid>
      <pubDate>Wed, 17 Dec 2025 00:00:00 +0000</pubDate>
      <category>General</category>
      <category>Closed</category>
      <category>Google</category>
    </item>
    
    
    <item>
      <title>DeepSeek V3.2 (DeepSeek) - General</title>
      <description>685B MoE / 37B active. DeepSeek Sparse Attention: 70% long-context cost reduction. MIT license. Context: 128K tokens. Pricing: $0.28/M input, $0.42/M output. Open weights.</description>
      <link>https://deepseek.com</link>
      <guid isPermaLink="false">ds-tracker-dsv32-2025-12-01</guid>
      <pubDate>Mon, 01 Dec 2025 00:00:00 +0000</pubDate>
      <category>General</category>
      <category>Open</category>
      <category>DeepSeek</category>
    </item>
    
    
    <item>
      <title>Claude Opus 4.5 (Anthropic) - Reasoning</title>
      <description>80.9% SWE-bench (record Nov 2025). 89.5% MMLU-Pro. Long-horizon agentic tasks. Extended thinking mode. Context: 200K tokens. Pricing: $5/M input, $25/M output.</description>
      <link>https://docs.anthropic.com/en/docs/about-claude/models</link>
      <guid isPermaLink="false">ds-tracker-co45-2025-11-24</guid>
      <pubDate>Mon, 24 Nov 2025 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>Anthropic</category>
    </item>
    
    
    <item>
      <title>Grok 4.1 Fast (xAI) - Reasoning</title>
      <description>Grok 4 capabilities at dramatically lower cost ($0.20/$0.50). #2 LMArena Elo Dec 2025. Leads EQ-Bench for creative. Real-time X data. Context: 2000K tokens. Pricing: $0.20/M input, $0.50/M output.</description>
      <link>https://docs.x.ai/docs/models</link>
      <guid isPermaLink="false">ds-tracker-grok41-2025-11-19</guid>
      <pubDate>Wed, 19 Nov 2025 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>xAI</category>
    </item>
    
    
    <item>
      <title>Claude Haiku 4.5 (Anthropic) - General</title>
      <description>Fastest efficient Anthropic model. First Haiku with extended thinking and computer use. 73.3% SWE-bench. Context: 200K tokens. Pricing: $1/M input, $5/M output.</description>
      <link>https://docs.anthropic.com/en/docs/about-claude/models</link>
      <guid isPermaLink="false">ds-tracker-ch45-2025-10-15</guid>
      <pubDate>Wed, 15 Oct 2025 00:00:00 +0000</pubDate>
      <category>General</category>
      <category>Closed</category>
      <category>Anthropic</category>
    </item>
    
    
    <item>
      <title>Claude Sonnet 4.5 (Anthropic) - General</title>
      <description>Leading coding model. 77.2% SWE-bench Verified. 30+ hour autonomous task operation. Computer use, extended thinking. Context: 200K tokens. Pricing: $3/M input, $15/M output.</description>
      <link>https://docs.anthropic.com/en/docs/about-claude/models</link>
      <guid isPermaLink="false">ds-tracker-cs45-2025-09-29</guid>
      <pubDate>Mon, 29 Sep 2025 00:00:00 +0000</pubDate>
      <category>General</category>
      <category>Closed</category>
      <category>Anthropic</category>
    </item>
    
    
    <item>
      <title>Hermes 4 405B (Nous Research) - Reasoning</title>
      <description>96.3% MATH-500, 81.9% AIME&apos;24, 70.5% GPQA Diamond. Trained with DataForge + Atropos RL on 192 B200 GPUs. Llama 3.1 license. Context: 131K tokens. Pricing: $1/M input, $3/M output. Open weights.</description>
      <link>https://huggingface.co/NousResearch/Hermes-4-405B</link>
      <guid isPermaLink="false">ds-tracker-h4-405-2025-08-26</guid>
      <pubDate>Tue, 26 Aug 2025 00:00:00 +0000</pubDate>
      <category>Reasoning</category>
      <category>Open</category>
      <category>Nous Research</category>
    </item>
    
  </channel>
</rss>
