<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel metadata: feed identity, self-referencing Atom link, and build information. -->
    <title>AI Frontier Model Tracker - New Releases</title>
    <link>https://www.demandsphere.com/research/demandsphere-radar/ai-frontier-model-tracker/releases/</link>
    <description>New frontier AI model releases tracked by DemandSphere. Benchmarks, pricing, and capabilities from OpenAI, Anthropic, Google, xAI, Meta, DeepSeek, and more.</description>
    <language>en-us</language>
    <copyright>CC BY-NC 4.0 DemandSphere, Inc.</copyright>
    <lastBuildDate>Sat, 16 May 2026 13:56:11 +0000</lastBuildDate>
    <atom:link rel="self"
               type="application/rss+xml"
               href="https://www.demandsphere.com/research/demandsphere-radar/ai-frontier-model-tracker/releases/feed.xml"/>
    
    
    
    <!-- Release entry: Grok 4.3 (xAI), dated 2026-05-06.
         NOTE(review): the description gives two different context sizes
         ("1M context" and "Context: 2000K tokens"). Confirm the correct figure
         against the vendor's published specification and fix whichever is wrong. -->
    <item>
      <title>Grok 4.3 (xAI) - Reasoning</title>
      <link>https://piunikaweb.com/2026/04/17/xai-grok-4-3-beta-supergrok-heavy/</link>
      <description>1M context. Three reasoning intensity levels. $1.25/$2.50 per 1M tokens. GA May 6 (beta Apr 17). Context: 2000K tokens. Pricing: $1.25/M input, $2.50/M output.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>xAI</category>
      <guid isPermaLink="false">ds-tracker-grok43-2026-05-06</guid>
      <pubDate>Wed, 06 May 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: GPT-5.5 Instant (OpenAI), dated 2026-05-05. -->
    <item>
      <title>GPT-5.5 Instant (OpenAI) - Reasoning</title>
      <link>https://openai.com/index/gpt-5-5-instant/</link>
      <description>New ChatGPT default, replacing GPT-5.3 Instant. 52.5% fewer hallucinations on high-stakes prompts (medicine, law, finance). 81.2 AIME 2025 (vs 65.4 prior). Vision supported. API alias: chat-latest.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>OpenAI</category>
      <guid isPermaLink="false">ds-tracker-gpt-55i-2026-05-05</guid>
      <pubDate>Tue, 05 May 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Mistral Medium 3.5 (Mistral AI), dated 2026-04-29.
         Prices in the "Pricing:" suffix use two decimals so they match the
         "$1.50/$7.50" figures earlier in the same description. -->
    <item>
      <title>Mistral Medium 3.5 (Mistral AI) - Dense</title>
      <link>https://mistral.ai/news/vibe-remote-agents-mistral-medium-3-5</link>
      <description>128B dense model. 256K context. Open weights (modified MIT). Strong coding and agentic capabilities. 77.6% SWE-Bench Verified. $1.50/$7.50 per 1M tokens. Context: 256K tokens. Pricing: $1.50/M input, $7.50/M output. Open weights.</description>
      <category>Dense</category>
      <category>Open</category>
      <category>Mistral AI</category>
      <guid isPermaLink="false">ds-tracker-mis-med35-2026-04-29</guid>
      <pubDate>Wed, 29 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: DeepSeek V4 Flash (DeepSeek), dated 2026-04-24. -->
    <item>
      <title>DeepSeek V4 Flash (DeepSeek) - Reasoning</title>
      <link>https://huggingface.co/deepseek-ai/DeepSeek-V4-Flash</link>
      <description>284B MoE / 13B active. MIT license. Same hybrid attention as V4-Pro. 88.1% GPQA Diamond, 91.6% LiveCodeBench. 1M context. $0.14/$0.28 per 1M tokens - 96% cheaper than GPT-5.4 output. Context: 1000K tokens. Pricing: $0.14/M input, $0.28/M output. Open weights.</description>
      <category>Reasoning</category>
      <category>Open</category>
      <category>DeepSeek</category>
      <guid isPermaLink="false">ds-tracker-dsv4f-2026-04-24</guid>
      <pubDate>Fri, 24 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: DeepSeek V4 Pro (DeepSeek), dated 2026-04-24. -->
    <item>
      <title>DeepSeek V4 Pro (DeepSeek) - Reasoning</title>
      <link>https://huggingface.co/deepseek-ai/DeepSeek-V4-Pro</link>
      <description>1.6T MoE / 49B active. MIT license. Trained on 32T+ tokens. Hybrid Attention (CSA+HCA): 27% inference FLOPs and 10% KV cache vs V3 at 1M tokens. 90.1% GPQA Diamond, 80.6% SWE-bench Verified, 93.5% LiveCodeBench (SOTA), 37.7% HLE. Three reasoning modes (non-think, high, max). Context: 1000K tokens. Pricing: $1.74/M input, $3.48/M output. Open weights.</description>
      <category>Reasoning</category>
      <category>Open</category>
      <category>DeepSeek</category>
      <guid isPermaLink="false">ds-tracker-dsv4p-2026-04-24</guid>
      <pubDate>Fri, 24 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: GPT-5.5 Pro (OpenAI), dated 2026-04-24. -->
    <item>
      <title>GPT-5.5 Pro (OpenAI) - Reasoning</title>
      <link>https://openai.com/index/introducing-gpt-5-5/</link>
      <description>Higher-accuracy variant of GPT-5.5 with extended compute. $30/$180 per 1M tokens. Context: 1000K tokens. Pricing: $30/M input, $180/M output.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>OpenAI</category>
      <guid isPermaLink="false">ds-tracker-gpt-55p-2026-04-24</guid>
      <pubDate>Fri, 24 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Hy3 Preview (Tencent), dated 2026-04-23.
         The description previously contained the sentence "Open weights." twice;
         only the trailing occurrence is kept, matching how other open-weight
         entries in this feed end. -->
    <item>
      <title>Hy3 Preview (Tencent) - Reasoning</title>
      <link>https://huggingface.co/tencent/Hy3-preview</link>
      <description>295B MoE / 21B active. 87.2% GPQA Diamond, 74.4% SWE-bench Verified. Hybrid fast/slow thinking. 256K context. Tencent Hy Community License. Context: 256K tokens. Open weights.</description>
      <category>Reasoning</category>
      <category>Open</category>
      <category>Tencent</category>
      <guid isPermaLink="false">ds-tracker-hy3-2026-04-23</guid>
      <pubDate>Thu, 23 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: GPT-5.5 (OpenAI), dated 2026-04-23. -->
    <item>
      <title>GPT-5.5 (OpenAI) - Reasoning</title>
      <link>https://openai.com/index/introducing-gpt-5-5/</link>
      <description>OpenAI&apos;s most capable model. Stronger coding, agentic tasks, and research. $5/$30 per 1M tokens. 1M context. Context: 1000K tokens. Pricing: $5/M input, $30/M output.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>OpenAI</category>
      <guid isPermaLink="false">ds-tracker-gpt-55-2026-04-23</guid>
      <pubDate>Thu, 23 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Qwen3.6-27B (Alibaba/Qwen), dated 2026-04-22. -->
    <item>
      <title>Qwen3.6-27B (Alibaba/Qwen) - Reasoning</title>
      <link>https://huggingface.co/Qwen/Qwen3.6-27B</link>
      <description>Dense 27B open-weight vision model. Apache 2.0. Hybrid Gated DeltaNet + Gated Attention. 87.8% GPQA Diamond, 77.2% SWE-bench, 83.9% LiveCodeBench v6. 262K native context (1M extended). Thinking preservation across turns. Context: 262K tokens. Open weights.</description>
      <category>Reasoning</category>
      <category>Open</category>
      <category>Alibaba/Qwen</category>
      <guid isPermaLink="false">ds-tracker-qw36-27b-2026-04-22</guid>
      <pubDate>Wed, 22 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Qwen3.6-Max-Preview (Alibaba/Qwen), dated 2026-04-20. -->
    <item>
      <title>Qwen3.6-Max-Preview (Alibaba/Qwen) - Reasoning</title>
      <link>https://cntechpost.com/2026/04/20/alibaba-releases-qwen3-6-max-preview-stronger-instruction-following-capabilities/</link>
      <description>Most powerful Qwen model. Top scores on 6 programming benchmarks. Enhanced agent coding, world knowledge, instruction following vs Qwen3.6-Plus. Free preview on Bailian. Context: 256K tokens.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>Alibaba/Qwen</category>
      <guid isPermaLink="false">ds-tracker-qw36-max-2026-04-20</guid>
      <pubDate>Mon, 20 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: GPT-Rosalind (OpenAI), dated 2026-04-16. -->
    <item>
      <title>GPT-Rosalind (OpenAI) - Reasoning</title>
      <link>https://openai.com/index/introducing-gpt-rosalind/</link>
      <description>First domain-specific OpenAI model. Life sciences: genomics, protein engineering, drug discovery. Research preview for qualified US enterprise customers. Partners: Amgen, Moderna, Allen Institute, Thermo Fisher.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>OpenAI</category>
      <guid isPermaLink="false">ds-tracker-gpt-ros-2026-04-16</guid>
      <pubDate>Thu, 16 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Claude Opus 4.7 (Anthropic), dated 2026-04-16. -->
    <item>
      <title>Claude Opus 4.7 (Anthropic) - Reasoning</title>
      <link>https://www.anthropic.com/news/claude-opus-4-7</link>
      <description>#1 SWE-bench Verified (87.6%). #1 SWE-bench Pro (64.3%). 94.2% GPQA Diamond. High-res vision (3.75MP). New xhigh effort level. Agentic task budgets. $5/$25 per 1M tokens. Context: 1000K tokens. Pricing: $5/M input, $25/M output.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>Anthropic</category>
      <guid isPermaLink="false">ds-tracker-co47-2026-04-16</guid>
      <pubDate>Thu, 16 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Qwen3.6 35B-A3B (Alibaba/Qwen), dated 2026-04-16. -->
    <item>
      <title>Qwen3.6 35B-A3B (Alibaba/Qwen) - Reasoning</title>
      <link>https://qwen.ai/blog?id=qwen3.6-35b-a3b</link>
      <description>MoE - 3B active / 35B total, 256 experts. Runs on a laptop. 73.4% SWE-bench Verified. Natively multimodal. Extensible to 1M context. Apache 2.0. Context: 262K tokens. Open weights.</description>
      <category>Reasoning</category>
      <category>Open</category>
      <category>Alibaba/Qwen</category>
      <guid isPermaLink="false">ds-tracker-qw36-35b-2026-04-16</guid>
      <pubDate>Thu, 16 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Kimi K2.6 (Moonshot AI), dated 2026-04-13.
         Prices are written with two decimals for consistency with the
         fractional dollar amounts used by other entries in this feed. -->
    <item>
      <title>Kimi K2.6 (Moonshot AI) - Reasoning</title>
      <link>https://www.kimi.com/code</link>
      <description>1T MoE / 32B active. Four variants: Instant, Thinking, Agent, Agent Swarm (300 sub-agents, 4K coordinated steps). Open-weight, Modified MIT. 262K context. Context: 262K tokens. Pricing: $0.60/M input, $2.50/M output. Open weights.</description>
      <category>Reasoning</category>
      <category>Open</category>
      <category>Moonshot AI</category>
      <guid isPermaLink="false">ds-tracker-kk26-2026-04-13</guid>
      <pubDate>Mon, 13 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Muse Spark (Meta), dated 2026-04-08. -->
    <item>
      <title>Muse Spark (Meta) - Reasoning</title>
      <link>https://ai.meta.com/blog/introducing-muse-spark-msl/</link>
      <description>First model from Meta Superintelligence Labs. 89.5% GPQA Diamond, 50.2% HLE (Contemplating mode). Natively multimodal with visual chain of thought and multi-agent orchestration. 262K context. Free at meta.ai. #1 on HealthBench Hard (42.8) and CharXiv Reasoning (86.4). Context: 262K tokens.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>Meta</category>
      <guid isPermaLink="false">ds-tracker-muse-spark-2026-04-08</guid>
      <pubDate>Wed, 08 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: GLM-5.1 (Zhipu AI), dated 2026-04-07.
         Prices are written with two decimals for consistency with the
         fractional dollar amounts used by other entries in this feed. -->
    <item>
      <title>GLM-5.1 (Zhipu AI) - Reasoning</title>
      <link>https://docs.z.ai/release-notes/new-released</link>
      <description>754B MoE / 40B active. #1 SWE-Bench Pro (58.4%), beating GPT-5.4 (57.7%) and Opus 4.6 (57.3%). 8-hour autonomous coding loops. MIT license. Context: 200K tokens. Pricing: $1.40/M input, $4.40/M output. Open weights.</description>
      <category>Reasoning</category>
      <category>Open</category>
      <category>Zhipu AI</category>
      <guid isPermaLink="false">ds-tracker-glm51-2026-04-07</guid>
      <pubDate>Tue, 07 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Qwen3.6-Plus (Alibaba/Qwen), dated 2026-04-02. -->
    <item>
      <title>Qwen3.6-Plus (Alibaba/Qwen) - Reasoning</title>
      <link>https://qwen.ai/blog?id=qwen3.6</link>
      <description>Proprietary flagship. 1M native context, 65K output tokens. 78.8% SWE-bench Verified. Always-on chain-of-thought. Native function calling and tool use. Context: 1000K tokens. Pricing: $0.29/M input, $1.65/M output.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>Alibaba/Qwen</category>
      <guid isPermaLink="false">ds-tracker-qw36-2026-04-02</guid>
      <pubDate>Thu, 02 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Gemma 4 26B-A4B (Google), dated 2026-04-02. -->
    <item>
      <title>Gemma 4 26B-A4B (Google) - General</title>
      <link>https://ai.google.dev/gemma/docs/core/model_card_4</link>
      <description>MoE - 3.8B active / 25.2B total. Near 31B performance at a fraction of the compute. Apache 2.0. Context: 256K tokens. Open weights.</description>
      <category>General</category>
      <category>Open</category>
      <category>Google</category>
      <guid isPermaLink="false">ds-tracker-ge4-26-2026-04-02</guid>
      <pubDate>Thu, 02 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: Gemma 4 31B (Google), dated 2026-04-02. -->
    <item>
      <title>Gemma 4 31B (Google) - General</title>
      <link>https://ai.google.dev/gemma/docs/core/model_card_4</link>
      <description>Strongest open Gemma model. 85.2% MMLU-Pro, 84.3% GPQA Diamond. Hybrid attention with sliding window. Apache 2.0. Context: 256K tokens. Open weights.</description>
      <category>General</category>
      <category>Open</category>
      <category>Google</category>
      <guid isPermaLink="false">ds-tracker-ge4-31-2026-04-02</guid>
      <pubDate>Thu, 02 Apr 2026 00:00:00 +0000</pubDate>
    </item>
    
    
    <!-- Release entry: MiniMax M2.7 (MiniMax), dated 2026-03-18.
         Prices in the "Pricing:" suffix use two decimals so they match the
         "$0.30/$1.20" figures earlier in the same description. -->
    <item>
      <title>MiniMax M2.7 (MiniMax) - Reasoning</title>
      <link>https://openrouter.ai/minimax/minimax-m2.7</link>
      <description>MiniMax March 2026 flagship. Self-evolving agentic model. 56.2% SWE-Pro. 205K context with automatic caching. $0.30/$1.20 per 1M tokens. Context: 205K tokens. Pricing: $0.30/M input, $1.20/M output.</description>
      <category>Reasoning</category>
      <category>Closed</category>
      <category>MiniMax</category>
      <guid isPermaLink="false">ds-tracker-mm27-2026-03-18</guid>
      <pubDate>Wed, 18 Mar 2026 00:00:00 +0000</pubDate>
    </item>
    
  </channel>
</rss>
