diff --git a/.kilo/KILO_SPEC.md b/.kilo/KILO_SPEC.md
index 0b0f1db..2f5e469 100644
--- a/.kilo/KILO_SPEC.md
+++ b/.kilo/KILO_SPEC.md
@@ -433,35 +433,40 @@ Provider availability depends on configuration. Common providers include:
 
 | Agent | Role | Model |
 |-------|------|-------|
-| `@RequirementRefiner` | Converts vague ideas and bug reports into strict User Stories with acceptance criteria checklists. | ollama-cloud/kimi-k2-thinking |
-| `@HistoryMiner` | Analyzes git history to find duplicates and past solutions, preventing regression and duplicate work. | ollama-cloud/nemotron-3-super |
-| `@SystemAnalyst` | Designs technical specifications, data schemas, and API contracts before implementation. | ollama-cloud/nemotron-3-super |
-| `@SdetEngineer` | Writes tests following TDD methodology. | ollama-cloud/qwen3-coder:480b |
-| `@LeadDeveloper` | Primary code writer for backend and core logic. | ollama-cloud/nemotron-3-super |
-| `@FrontendDeveloper` | Handles UI implementation with multimodal capabilities. | ollama-cloud/kimi-k2.5 |
-| `@BackendDeveloper` | Backend specialist for Node. | ollama-cloud/deepseek-v3.2 |
-| `@GoDeveloper` | Go backend specialist for Gin, Echo, APIs, and database integration. | ollama-cloud/qwen3-coder:480b |
+| `@RequirementRefiner` | Converts vague ideas and bug reports into strict User Stories with acceptance criteria checklists. | ollama-cloud/kimi-k2.6 |
+| `@HistoryMiner` | Analyzes git history to find duplicates and past solutions, preventing regression and duplicate work. | ollama-cloud/kimi-k2.6 |
+| `@SystemAnalyst` | Designs technical specifications, data schemas, and API contracts before implementation. | ollama-cloud/glm-5.1 |
+| `@SdetEngineer` | Writes tests following TDD methodology. | ollama-cloud/kimi-k2.6 |
+| `@LeadDeveloper` | Primary code writer for backend and core logic. | ollama-cloud/kimi-k2.6 |
+| `@FrontendDeveloper` | Handles UI implementation with multimodal capabilities. | ollama-cloud/kimi-k2.6 |
+| `@BackendDeveloper` | Backend specialist for Node. | ollama-cloud/kimi-k2.6 |
+| `@GoDeveloper` | Go backend specialist for Gin, Echo, APIs, and database integration. | ollama-cloud/deepseek-v4-pro-max |
 | `@DevopsEngineer` | DevOps specialist for Docker, Kubernetes, CI/CD pipeline automation, and infrastructure management. | ollama-cloud/kimi-k2.6 |
-| `@CodeSkeptic` | Adversarial code reviewer. | ollama-cloud/minimax-m2.5 |
-| `@TheFixer` | Iteratively fixes bugs based on specific error reports and test failures. | ollama-cloud/minimax-m2.5 |
-| `@PerformanceEngineer` | Reviews code for performance issues. | ollama-cloud/nemotron-3-super |
-| `@SecurityAuditor` | Scans for security vulnerabilities, OWASP Top 10, dependency CVEs, and hardcoded secrets. | ollama-cloud/nemotron-3-super |
-| `@VisualTester` | Visual regression testing agent that compares screenshots and detects UI differences using pixelmatch and image diff. | ollama-cloud/qwen3-coder:480b |
+| `@CodeSkeptic` | Adversarial code reviewer. | ollama-cloud/kimi-k2.6 |
+| `@TheFixer` | Iteratively fixes bugs based on specific error reports and test failures. | ollama-cloud/kimi-k2.6 |
+| `@PerformanceEngineer` | Reviews code for performance issues. | ollama-cloud/deepseek-v4-pro-max |
+| `@SecurityAuditor` | Scans for security vulnerabilities, OWASP Top 10, dependency CVEs, and hardcoded secrets. | ollama-cloud/deepseek-v4-pro-max |
+| `@VisualTester` | Visual regression testing agent that compares screenshots and detects UI differences using pixelmatch and image diff. | ollama-cloud/kimi-k2.6 |
 | `@Orchestrator` | Main dispatcher. | ollama-cloud/kimi-k2.6 |
-| `@ReleaseManager` | Manages git operations, semantic versioning, branching, and deployments. | ollama-cloud/devstral-2:123b |
-| `@Evaluator` | Scores agent effectiveness after task completion for continuous improvement. | ollama-cloud/nemotron-3-super |
-| `@PromptOptimizer` | Improves agent system prompts based on performance failures. | ollama-cloud/glm-5.1 |
-| `@ProductOwner` | Manages issue checklists, status labels, tracks progress and coordinates with human users. | ollama-cloud/glm-5.1 |
+| `@ReleaseManager` | Manages git operations, semantic versioning, branching, and deployments. | ollama-cloud/glm-5.1 |
+| `@Evaluator` | Scores agent effectiveness after task completion for continuous improvement. | ollama-cloud/kimi-k2.6 |
+| `@PromptOptimizer` | Improves agent system prompts based on performance failures. | ollama-cloud/kimi-k2.6 |
+| `@ProductOwner` | Manages issue checklists, status labels, tracks progress and coordinates with human users. | ollama-cloud/kimi-k2.6 |
 | `@AgentArchitect` | Creates, modifies, and reviews new agents, workflows, and skills based on capability gap analysis. | ollama-cloud/kimi-k2.6 |
-| `@CapabilityAnalyst` | Analyzes task requirements against available agents, workflows, and skills. | ollama-cloud/nemotron-3-super |
-| `@WorkflowArchitect` | Creates and maintains workflow definitions with complete architecture, Gitea integration, and quality gates. | ollama-cloud/gpt-oss:120b |
-| `@MarkdownValidator` | Validates and corrects Markdown descriptions for Gitea issues. | ollama-cloud/nemotron-3-nano:30b |
+| `@CapabilityAnalyst` | Analyzes task requirements against available agents, workflows, and skills. | ollama-cloud/glm-5.1 |
+| `@WorkflowArchitect` | Creates and maintains workflow definitions with complete architecture, Gitea integration, and quality gates. | ollama-cloud/kimi-k2.6 |
+| `@MarkdownValidator` | Validates and corrects Markdown descriptions for Gitea issues. | ollama-cloud/kimi-k2.6 |
 | `@BrowserAutomation` | Browser automation agent using Playwright MCP for E2E testing, form filling, navigation, and web interaction. | ollama-cloud/kimi-k2.6 |
-| `@Planner` | Advanced task planner using Chain of Thought, Tree of Thoughts, and Plan-Execute-Reflect. | ollama-cloud/nemotron-3-super |
-| `@Reflector` | Self-reflection agent using Reflexion pattern - learns from mistakes. | ollama-cloud/nemotron-3-super |
-| `@MemoryManager` | Manages agent memory systems - short-term (context), long-term (vector store), and episodic (experiences). | ollama-cloud/nemotron-3-super |
-| `@IncidentResponder` | Server incident response, live forensics, malware removal, hardening, and SSH-based cleanup. | ollama-cloud/kimi-k2.6 |
-| `@WorkflowCrossChecker` | Pre-flight inter-agent conflict and architecture validation; asks uncomfortable questions before expensive work. | ollama-cloud/deepseek-v4-pro-max |
+| `@Planner` | Advanced task planner using Chain of Thought, Tree of Thoughts, and Plan-Execute-Reflect. | ollama-cloud/deepseek-v4-pro-max |
+| `@Reflector` | Self-reflection agent using Reflexion pattern - learns from mistakes. | ollama-cloud/deepseek-v4-pro-max |
+| `@MemoryManager` | Manages agent memory systems - short-term (context), long-term (vector store), and episodic (experiences). | ollama-cloud/deepseek-v4-pro-max |
+| `@ArchitectIndexer` | Indexes and maps project codebase architecture. | ollama-cloud/kimi-k2.6 |
+| `@FlutterDeveloper` | Flutter mobile specialist for cross-platform apps, state management, and UI components. | ollama-cloud/kimi-k2.6 |
+| `@PhpDeveloper` | PHP specialist for Laravel, Symfony, WordPress, and modular architecture. | ollama-cloud/kimi-k2.6 |
+| `@PipelineJudge` | Automated pipeline judge. | ollama-cloud/glm-5.1 |
+| `@PythonDeveloper` | Python specialist for Django, FastAPI, data processing, and ML pipelines. | ollama-cloud/kimi-k2.6 |
+| `@IncidentResponder` | Server incident response and system hardening specialist. | ollama-cloud/kimi-k2.6 |
+| `@WorkflowCrossChecker` | Workflow cross-checker and process inspector. | ollama-cloud/kimi-k2.6 |
 
 
 
diff --git a/AGENTS.md b/AGENTS.md
index c59da98..2bbafe2 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -52,6 +52,11 @@ These agents are invoked automatically by `/pipeline` or manually via `@mention`
 | `@BackendDeveloper` | Backend specialist for Node | When backend needed |
 | `@GoDeveloper` | Go backend specialist for Gin, Echo, APIs, and database integration | When Go backend needed |
 | `@DevopsEngineer` | DevOps specialist for Docker, Kubernetes, CI/CD pipeline automation, and infrastructure management | When deployment/infra needed |
+| `@ArchitectIndexer` | Indexes and maps project codebase architecture | Manual invocation |
+| `@FlutterDeveloper` | Flutter mobile specialist for cross-platform apps, state management, and UI components | Manual invocation |
+| `@PhpDeveloper` | PHP specialist for Laravel, Symfony, WordPress, and modular architecture | Manual invocation |
+| `@PythonDeveloper` | Python specialist for Django, FastAPI, data processing, and ML pipelines | Manual invocation |
+| `@IncidentResponder` | Server incident response and system hardening specialist | Manual invocation |
 
 ### Quality Assurance
 | Agent | Role | When Invoked |
@@ -86,8 +91,9 @@ These agents are invoked automatically by `/pipeline` or manually via `@mention`
 | `@AgentArchitect` | Creates, modifies, and reviews new agents, workflows, and skills based on capability gap analysis | When gaps identified |
 | `@CapabilityAnalyst` | Analyzes task requirements against available agents, workflows, and skills | When starting new task |
 | `@WorkflowArchitect` | Creates and maintains workflow definitions with complete architecture, Gitea integration, and quality gates | New workflow needed |
-| `@WorkflowCrossChecker` | Pre-flight inter-agent conflict and architecture validation; asks uncomfortable questions before expensive work | Before parallel spawn or state transitions |
 | `@MarkdownValidator` | Validates and corrects Markdown descriptions for Gitea issues | Before issue creation |
+| `@PipelineJudge` | Automated pipeline judge | Manual invocation |
+| `@WorkflowCrossChecker` | Workflow cross-checker and process inspector | Manual invocation |
 
 ### Security & Incident Response
 | Agent | Role | When Invoked |
diff --git a/agent-evolution/index.html b/agent-evolution/index.html
index e1ba105..782cf52 100644
--- a/agent-evolution/index.html
+++ b/agent-evolution/index.html
@@ -983,6 +983,7 @@
             <button class="hm-tab-btn" onclick="switchHmTab('gitea')">Gitea History</button>
             <button class="hm-tab-btn" onclick="switchHmTab('skills')">Skills</button>
             <button class="hm-tab-btn" onclick="switchHmTab('models')">Model Timeline</button>
+            <button class="hm-tab-btn" onclick="switchHmTab('graph')">Performance Graph</button>
         </div>
         <div class="modal-body" id="hmModalBody">
             <!-- Content injected by JS -->
@@ -1162,33 +1163,15 @@ function renderOverview() {
         `).join('')
         : '<p style="color: var(--text-muted);">No history yet</p>';
 
-    // Recommended agents (use inline recs if available)
-    let recAgents = [];
-    if (INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0) {
-        recAgents = INLINE_RECOMMENDATIONS.slice(0, 6).map(r => ({ agent: r.agent, current: { recommendations: [{ priority: r.impact, target: r.source_of_truth_model || r.recommended_model, reason: r.rationale, score_before: r.score_before, score_after: r.score_after, score_delta: r.score_delta }], model: r.current_model_in_agent_versions || r.current_model, category: 'Core Dev', description: '', benchmark: { fit_score: r.score_after || 0 } } }));
-    } else {
-        recAgents = Object.entries(agentData.agents)
-            .filter(([_, a]) => a.current.recommendations && a.current.recommendations.length > 0)
-            .slice(0, 6);
-    }
+    // Recommended agents from live data
+    const recAgents = Object.entries(agentData.agents || {})
+        .filter(([_, a]) => (a.current?.recommendations || []).length > 0)
+        .slice(0, 6);
 
     document.getElementById('recCount').textContent = recAgents.length;
-    if (INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0) {
-        document.getElementById('recAgents').innerHTML = recAgents.map((r, idx) => renderRecCard({
-            agent: r.agent,
-            current_model: r.current?.model || '',
-            recommended_model: r.current?.recommendations?.[0]?.target || '',
-            impact: r.current?.recommendations?.[0]?.priority?.toLowerCase() || 'medium',
-            score_before: r.current?.recommendations?.[0]?.score_before || 0,
-            score_after: r.current?.recommendations?.[0]?.score_after || 0,
-            score_delta: r.current?.recommendations?.[0]?.score_delta || 0,
-            rationale: r.current?.recommendations?.[0]?.reason || ''
-        }, idx)).join('');
-    } else {
-        document.getElementById('recAgents').innerHTML = recAgents.map(([name, agent]) => 
-            renderAgentCard(name, agent, true)
-        ).join('');
-    }
+    document.getElementById('recAgents').innerHTML = recAgents.map(([name, agent]) => 
+        renderAgentCard(name, agent, true)
+    ).join('');
 }
 
 // Render All Agents
@@ -1327,24 +1310,19 @@ function renderTimeline() {
 
 // Render Recommendations (v3 style with swap visuals)
 function renderRecommendations() {
-    // Use inline recommendations or fall back to agent data
-    let recs = [];
-    if (INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0) {
-        recs = INLINE_RECOMMENDATIONS;
-    } else {
-        recs = Object.entries(agentData.agents)
-            .filter(([_, a]) => a.current.recommendations && a.current.recommendations.length > 0)
-            .map(([name, agent]) => ({
-                agent: name,
-                current_model: agent.current.model,
-                recommended_model: agent.current.recommendations[0]?.target,
-                impact: agent.current.recommendations[0]?.priority?.toLowerCase() || 'medium',
-                score_before: agent.current.recommendations[0]?.score_before || 0,
-                score_after: agent.current.recommendations[0]?.score_after || 0,
-                score_delta: agent.current.recommendations[0]?.score_delta || 0,
-                rationale: agent.current.recommendations[0]?.reason || ''
-            }));
-    }
+    const recs = Object.entries(agentData.agents || {})
+        .filter(([_, a]) => (a.current?.recommendations || []).length > 0) 
+        .map(([name, agent]) => ({
+            agent: name,
+            current_model: agent.current?.model,
+            recommended_model: agent.current?.recommendations?.[0]?.target,
+            impact: agent.current?.recommendations?.[0]?.priority?.toLowerCase() || 'medium',
+            score_before: agent.current?.recommendations?.[0]?.score_before || 0,
+            score_after: agent.current?.recommendations?.[0]?.score_after || 0,
+            score_delta: agent.current?.recommendations?.[0]?.score_delta || 0,
+            rationale: agent.current?.recommendations?.[0]?.reason || '',
+            current_model_in_agent_versions: agent.current?.model
+        }));
 
     if (recs.length === 0) {
         document.getElementById('allRecommendations').innerHTML = '<p style="color:var(--text-muted);text-align:center;padding:40px;">No recommendations available</p>';
@@ -1493,7 +1471,7 @@ function renderHeatmap() {
             h += `<td style="background:${hmColor(s)};color:${hmText(s)};cursor:pointer" class="${cur ? 'hm-cur' : ''}" title="${ag.n} × ${hmModels[j].n}: ${s}"
                 onmouseover="showTT(event,'${ag.n}','${hmModels[j].n} (${hmModels[j].p})',${s},${best},${cur},${hmModels[j].if})"
                 onmouseout="hideTT()"
-                onclick="showCellDetail('${hmModels[j].full}', '${ag.n}')">${s}${marks}</td>`;
+                onclick="openHmModal(event, '${ag.n}', '${hmModels[j].n}', ${s}, ${hmModels[j].if})">${s}${marks}</td>`;
         });
         h += '</tr>';
     });
@@ -1556,7 +1534,8 @@ function closeHmModal() {
 }
 
 // Show cell detail modal with Chart.js line chart and prompt history
-function showCellDetail(modelName, agentName) {
+function showCellDetail(event, modelName, agentName) {
+    event.stopPropagation();
     const agent = agentData.agents[agentName];
     if (!agent) {
         console.error('Agent not found:', agentName);
@@ -1770,9 +1749,13 @@ function renderHmModalContent(tabName) {
         case 'models':
             content = renderModelsTab(agent);
             break;
+        case 'graph':
+            content = renderGraphTab(agent);
+            break;
     }
 
     body.innerHTML = `<div class="hm-tab-content active" style="display:block">${content}</div>`;
+    if (tabName === 'graph') setTimeout(() => renderCellChart(hmCurrentAgent, agent.current?.model || ''), 50);
 }
 
 function renderPromptTab(agent) {
@@ -1911,6 +1894,46 @@ function renderModelsTab(agent) {
     return html;
 }
 
+function renderGraphTab(agent) { // Returns the 'graph' tab markup: an empty chart canvas (#cellChartCanvas) followed by the prompt-change list built by renderPromptHistory(agent).
+    return `
+        <div style="margin-bottom:20px">
+            <h3 style="margin-bottom:10px;color:var(--accent-cyan)">Performance Over Time</h3>
+            <div style="position:relative;height:300px">
+                <canvas id="cellChartCanvas"></canvas>
+            </div>
+        </div>
+        <div>
+            <h3 style="margin-bottom:10px;color:var(--accent-cyan)">Prompt Change History</h3>
+            <div id="promptHistoryList" style="max-height:300px;overflow-y:auto">
+                ${renderPromptHistory(agent)}
+            </div>
+        </div>
+    `;
+}
+
+function renderPromptHistory(agent) {
+    const promptChanges = (agent.history || []).filter(item => item.change_type === 'prompt_change');
+
+    if (promptChanges.length === 0) {
+        return '<p style="color:var(--text-muted);text-align:center;padding:20px">No prompt change history found</p>';
+    }
+
+    let html = '<ul style="list-style:none;padding:0">';
+    promptChanges.forEach(change => {
+        html += `
+            <li style="padding:10px;border-bottom:1px solid var(--border);margin-bottom:10px">
+                <div style="display:flex;justify-content:space-between;margin-bottom:5px">
+                    <span style="font-family:'JetBrains Mono',monospace;font-size:.8em;color:var(--text-muted)">${formatDate(change.date)}</span>
+                    <span style="font-family:'JetBrains Mono',monospace;font-size:.8em;color:var(--accent-cyan)">${change.commit ? change.commit.substring(0,7) : 'unknown'}</span>
+                </div>
+                <div style="font-size:.9em;color:var(--text-secondary)">${change.reason || 'No reason provided'}</div>
+            </li>
+        `;
+    });
+    html += '</ul>';
+    return html;
+}
+
 // Compute composite score for any model name
 // Formula (v2): IF_score * 0.85 + context_window_bonus (SWE-bench removed — all values unverifiable)
 function computeAgentScore(modelName) {
@@ -2344,7 +2367,7 @@ function simulateApply() {
             progressStatus.textContent = 'Complete!';
             progressResult.classList.add('show');
             
-            const recs = INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0 ? INLINE_RECOMMENDATIONS : [];
+            const recs = Object.values(agentData.agents || {}).filter(a => (a.current?.recommendations || []).length > 0);
             progressResultText.textContent = `✅ ${recs.length} recommendations applied. Run 'bun run sync:evolution' to update dashboard.`;
         }
     }
@@ -2395,11 +2418,11 @@ function showResearchModal() {
                 step.classList.add('done');
             });
             
-            const recs = INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0 ? INLINE_RECOMMENDATIONS : [];
-            const modelsCount = new Set(recs.map(r => r.current_model).concat(recs.map(r => r.source_of_truth_model || r.recommended_model))).size;
-            const recsCount = recs.filter(r => r.score_delta > 0).length;
-            
-            document.getElementById('researchSummaryText').textContent = 
+            const recs = Object.values(agentData.agents || {}).filter(a => (a.current?.recommendations || []).length > 0);
+            const modelsCount = new Set(recs.flatMap(a => [a.current?.model, a.current?.recommendations?.[0]?.target])).size;
+            const recsCount = recs.filter(a => (a.current?.recommendations?.[0]?.score_delta || 0) > 0).length;
+
+            document.getElementById('researchSummaryText').textContent =
                 `${modelsCount} models evaluated. ${recsCount} recommendations found. ${recs.length - recsCount} idle models detected.`;
             researchSummary.classList.add('show');
         }
diff --git a/agent-evolution/index.standalone.html b/agent-evolution/index.standalone.html
index f756b9f..7174e12 100644
--- a/agent-evolution/index.standalone.html
+++ b/agent-evolution/index.standalone.html
@@ -983,6 +983,7 @@
             <button class="hm-tab-btn" onclick="switchHmTab('gitea')">Gitea History</button>
             <button class="hm-tab-btn" onclick="switchHmTab('skills')">Skills</button>
             <button class="hm-tab-btn" onclick="switchHmTab('models')">Model Timeline</button>
+            <button class="hm-tab-btn" onclick="switchHmTab('graph')">Performance Graph</button>
         </div>
         <div class="modal-body" id="hmModalBody">
             <!-- Content injected by JS -->
@@ -1016,7 +1017,7 @@ Chart.defaults.borderColor = '#1e2d45';
 Chart.defaults.font.family = "'Inter', sans-serif";
 
 // Inline recommendation data fallback (from model-research-latest.json)
-const INLINE_RECOMMENDATIONS = []; // REMOVED — data now comes from agentData, not hardcoded
+const INLINE_RECOMMENDATIONS = []; // Deprecated — data now comes from agentData.agents[].current.recommendations
 
 // Inline benchmark data (fallback when embedded data doesn't have model_benchmarks)
 // SOURCE: agent-evolution/data/model-benchmarks-verified.json v2.0.0
@@ -5736,33 +5737,15 @@ function renderOverview() {
         `).join('')
         : '<p style="color: var(--text-muted);">No history yet</p>';
 
-    // Recommended agents (use inline recs if available)
-    let recAgents = [];
-    if (INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0) {
-        recAgents = INLINE_RECOMMENDATIONS.slice(0, 6).map(r => ({ agent: r.agent, current: { recommendations: [{ priority: r.impact, target: r.source_of_truth_model || r.recommended_model, reason: r.rationale, score_before: r.score_before, score_after: r.score_after, score_delta: r.score_delta }], model: r.current_model_in_agent_versions || r.current_model, category: 'Core Dev', description: '', benchmark: { fit_score: r.score_after || 0 } } }));
-    } else {
-        recAgents = Object.entries(agentData.agents)
-            .filter(([_, a]) => a.current.recommendations && a.current.recommendations.length > 0)
-            .slice(0, 6);
-    }
+    // Recommended agents from live data
+    const recAgents = Object.entries(agentData.agents || {})
+        .filter(([_, a]) => (a.current?.recommendations || []).length > 0)
+        .slice(0, 6);
 
     document.getElementById('recCount').textContent = recAgents.length;
-    if (INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0) {
-        document.getElementById('recAgents').innerHTML = recAgents.map((r, idx) => renderRecCard({
-            agent: r.agent,
-            current_model: r.current?.model || '',
-            recommended_model: r.current?.recommendations?.[0]?.target || '',
-            impact: r.current?.recommendations?.[0]?.priority?.toLowerCase() || 'medium',
-            score_before: r.current?.recommendations?.[0]?.score_before || 0,
-            score_after: r.current?.recommendations?.[0]?.score_after || 0,
-            score_delta: r.current?.recommendations?.[0]?.score_delta || 0,
-            rationale: r.current?.recommendations?.[0]?.reason || ''
-        }, idx)).join('');
-    } else {
-        document.getElementById('recAgents').innerHTML = recAgents.map(([name, agent]) => 
-            renderAgentCard(name, agent, true)
-        ).join('');
-    }
+    document.getElementById('recAgents').innerHTML = recAgents.map(([name, agent]) => 
+        renderAgentCard(name, agent, true)
+    ).join('');
 }
 
 // Render All Agents
@@ -6068,7 +6051,7 @@ function renderHeatmap() {
             h += `<td style="background:${hmColor(s)};color:${hmText(s)};cursor:pointer" class="${cur ? 'hm-cur' : ''}" title="${ag.n} × ${hmModels[j].n}: ${s}"
                 onmouseover="showTT(event,'${ag.n}','${hmModels[j].n} (${hmModels[j].p})',${s},${best},${cur},${hmModels[j].if})"
                 onmouseout="hideTT()"
-                onclick="showCellDetail('${hmModels[j].full}', '${ag.n}')">${s}${marks}</td>`;
+                onclick="openHmModal(event, '${ag.n}', '${hmModels[j].n}', ${s}, ${hmModels[j].if})">${s}${marks}</td>`;
         });
         h += '</tr>';
     });
@@ -6131,7 +6114,8 @@ function closeHmModal() {
 }
 
 // Show cell detail modal with Chart.js line chart and prompt history
-function showCellDetail(modelName, agentName) {
+function showCellDetail(event, modelName, agentName) {
+    event.stopPropagation();
     const agent = agentData.agents[agentName];
     if (!agent) {
         console.error('Agent not found:', agentName);
@@ -6345,9 +6329,13 @@ function renderHmModalContent(tabName) {
         case 'models':
             content = renderModelsTab(agent);
             break;
+        case 'graph':
+            content = renderGraphTab(agent);
+            break;
     }
 
     body.innerHTML = `<div class="hm-tab-content active" style="display:block">${content}</div>`;
+    if (tabName === 'graph') setTimeout(() => renderCellChart(hmCurrentAgent, agent.current?.model || ''), 50);
 }
 
 function renderPromptTab(agent) {
@@ -6486,6 +6474,46 @@ function renderModelsTab(agent) {
     return html;
 }
 
+function renderGraphTab(agent) { // Returns the 'graph' tab markup: an empty chart canvas (#cellChartCanvas) followed by the prompt-change list built by renderPromptHistory(agent).
+    return `
+        <div style="margin-bottom:20px">
+            <h3 style="margin-bottom:10px;color:var(--accent-cyan)">Performance Over Time</h3>
+            <div style="position:relative;height:300px">
+                <canvas id="cellChartCanvas"></canvas>
+            </div>
+        </div>
+        <div>
+            <h3 style="margin-bottom:10px;color:var(--accent-cyan)">Prompt Change History</h3>
+            <div id="promptHistoryList" style="max-height:300px;overflow-y:auto">
+                ${renderPromptHistory(agent)}
+            </div>
+        </div>
+    `;
+}
+
+function renderPromptHistory(agent) {
+    const promptChanges = (agent.history || []).filter(item => item.change_type === 'prompt_change');
+
+    if (promptChanges.length === 0) {
+        return '<p style="color:var(--text-muted);text-align:center;padding:20px">No prompt change history found</p>';
+    }
+
+    let html = '<ul style="list-style:none;padding:0">';
+    promptChanges.forEach(change => {
+        html += `
+            <li style="padding:10px;border-bottom:1px solid var(--border);margin-bottom:10px">
+                <div style="display:flex;justify-content:space-between;margin-bottom:5px">
+                    <span style="font-family:'JetBrains Mono',monospace;font-size:.8em;color:var(--text-muted)">${formatDate(change.date)}</span>
+                    <span style="font-family:'JetBrains Mono',monospace;font-size:.8em;color:var(--accent-cyan)">${change.commit ? change.commit.substring(0,7) : 'unknown'}</span>
+                </div>
+                <div style="font-size:.9em;color:var(--text-secondary)">${change.reason || 'No reason provided'}</div>
+            </li>
+        `;
+    });
+    html += '</ul>';
+    return html;
+}
+
 // Compute composite score for any model name
 // Formula (v2): IF_score * 0.85 + context_window_bonus (SWE-bench removed — all values unverifiable)
 function computeAgentScore(modelName) {
@@ -6919,7 +6947,7 @@ function simulateApply() {
             progressStatus.textContent = 'Complete!';
             progressResult.classList.add('show');
             
-            const recs = INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0 ? INLINE_RECOMMENDATIONS : [];
+            const recs = Object.values(agentData.agents || {}).filter(a => (a.current?.recommendations || []).length > 0);
             progressResultText.textContent = `✅ ${recs.length} recommendations applied. Run 'bun run sync:evolution' to update dashboard.`;
         }
     }
@@ -6970,11 +6998,11 @@ function showResearchModal() {
                 step.classList.add('done');
             });
             
-            const recs = INLINE_RECOMMENDATIONS && INLINE_RECOMMENDATIONS.length > 0 ? INLINE_RECOMMENDATIONS : [];
-            const modelsCount = new Set(recs.map(r => r.current_model).concat(recs.map(r => r.source_of_truth_model || r.recommended_model))).size;
-            const recsCount = recs.filter(r => r.score_delta > 0).length;
-            
-            document.getElementById('researchSummaryText').textContent = 
+            const recs = Object.values(agentData.agents || {}).filter(a => (a.current?.recommendations || []).length > 0);
+            const modelsCount = new Set(recs.flatMap(a => [a.current?.model, a.current?.recommendations?.[0]?.target])).size;
+            const recsCount = recs.filter(a => (a.current?.recommendations?.[0]?.score_delta || 0) > 0).length;
+
+            document.getElementById('researchSummaryText').textContent =
                 `${modelsCount} models evaluated. ${recsCount} recommendations found. ${recs.length - recsCount} idle models detected.`;
             researchSummary.classList.add('show');
         }
diff --git a/agent-evolution/research-dashboard.html b/agent-evolution/research-dashboard.html
index 2f21577..a3fafb7 100644
--- a/agent-evolution/research-dashboard.html
+++ b/agent-evolution/research-dashboard.html
@@ -3,7 +3,7 @@
 <head>
     <meta charset="UTF-8">
     <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>APAW Agent Model Research — generated 2026-04-30</title>
+    <title>APAW Agent Model Research — generated 2026-05-24</title>
     <link href="https://fonts.googleapis.com/css2?family=JetBrains+Mono:wght@300;400;500;600;700&family=Outfit:wght@300;400;500;600;700;800;900&display=swap" rel="stylesheet">
     <style>
         :root {
@@ -255,16 +255,16 @@
 <div class="container">
     <div class="header">
         <h1>APAW Agent Model Research v2</h1>
-        <div class="sub">Live dashboard • 15 models × 30 agents • 2026-04-30</div>
+        <div class="sub">Live dashboard • 15 models × 34 agents • 2026-05-24</div>
     </div>
 
     <div class="tabs" id="tabBar">
-        <button class="tab-btn active" onclick="switchTab('overview')">Обзор</button>
-        <button class="tab-btn" onclick="switchTab('groq')">Groq Free Tier</button>
-        <button class="tab-btn" onclick="switchTab('models')">Все модели</button>
-        <button class="tab-btn" onclick="switchTab('heatmap')">Матрица</button>
-        <button class="tab-btn" onclick="switchTab('recs')">Рекомендации</button>
-        <button class="tab-btn" onclick="switchTab('impact')">Анализ профита</button>
+        <button class="tab-btn active" onclick="switchTab('overview', this)">Обзор</button>
+        <button class="tab-btn" onclick="switchTab('groq', this)">Groq Free Tier</button>
+        <button class="tab-btn" onclick="switchTab('models', this)">Все модели</button>
+        <button class="tab-btn" onclick="switchTab('heatmap', this)">Матрица</button>
+        <button class="tab-btn" onclick="switchTab('recs', this)">Рекомендации</button>
+        <button class="tab-btn" onclick="switchTab('impact', this)">Анализ профита</button>
     </div>
 
     <!-- ========== TAB: OVERVIEW ========== -->
@@ -419,20 +419,87 @@
 
 <script>
 // BENCHMARK_DATA_PLACEHOLDER - REPLACED BY BUILD SCRIPT
-// Generated from model-benchmarks.json on 2026-04-30T07:34:02.062Z
+// Generated from model-benchmarks.json on 2026-05-26T12:55:21.038Z
 const EMBEDDED_DATA = {
   "version": "1.0.0",
-  "generated": "2026-04-30T07:00:00Z",
-  "source": "capability-index.yaml v3 optimal",
-  "total_agents": 30,
-  "total_models_tracked": 11,
+  "generated": "2026-05-24T01:00:00Z",
+  "source": "ollama-cloud-models-v2026-05-24",
+  "total_agents": 34,
+  "total_models_tracked": 13,
   "providers": [
-    "ollama",
-    "ollama-cloud",
-    "openrouter",
-    "groq"
+    "ollama-cloud"
   ],
   "models": [
+    {
+      "id": "deepseek-v4-pro-max",
+      "name": "DeepSeek V4-Pro Max",
+      "organization": "DeepSeek",
+      "parameters": "1.6T/49B active MoE",
+      "context_window": "1M",
+      "swe_bench": 80.6,
+      "if_score": 89,
+      "categories": [
+        "coding",
+        "agent",
+        "reasoning"
+      ],
+      "provider": "ollama-cloud",
+      "updated": "2026-05-03",
+      "pulls": "71.6K"
+    },
+    {
+      "id": "deepseek-v4-flash",
+      "name": "DeepSeek V4-Flash",
+      "organization": "DeepSeek",
+      "parameters": "284B/13B active MoE",
+      "context_window": "1M",
+      "swe_bench": 79,
+      "if_score": 86,
+      "categories": [
+        "coding",
+        "efficient",
+        "agent"
+      ],
+      "provider": "ollama-cloud",
+      "updated": "2026-05-03",
+      "pulls": "84.4K"
+    },
+    {
+      "id": "kimi-k2.6",
+      "name": "Kimi K2.6",
+      "organization": "Moonshot AI",
+      "parameters": "1T/32B active MoE",
+      "context_window": "256K→1M",
+      "swe_bench": 80.2,
+      "if_score": 91,
+      "categories": [
+        "coding",
+        "agent",
+        "multimodal",
+        "vision"
+      ],
+      "provider": "ollama-cloud",
+      "updated": "2026-04-24",
+      "pulls": "259.7K"
+    },
+    {
+      "id": "kimi-k2.5",
+      "name": "Kimi K2.5",
+      "organization": "Moonshot AI",
+      "parameters": "1T/32B active MoE",
+      "context_window": "256K",
+      "swe_bench": 78,
+      "if_score": 90,
+      "categories": [
+        "coding",
+        "agent",
+        "multimodal",
+        "vision"
+      ],
+      "provider": "ollama-cloud",
+      "updated": "2026-02-24",
+      "pulls": "293.2K"
+    },
     {
       "id": "qwen3-coder-480b",
       "name": "Qwen3-Coder 480B",
@@ -445,14 +512,47 @@ const EMBEDDED_DATA = {
         "coding",
         "agent"
       ],
-      "description": "SOTA open-source кодинг. Сравним с Claude Sonnet 4.",
-      "tags": [
-        "coding",
-        "agent",
+      "provider": "ollama-cloud",
+      "updated": "2026-02-24",
+      "pulls": "N/A (legacy track)"
+    },
+    {
+      "id": "qwen3.5-122b",
+      "name": "Qwen 3.5 122B",
+      "organization": "Qwen",
+      "parameters": "122B/10B active",
+      "context_window": "128K",
+      "swe_bench": null,
+      "if_score": 92,
+      "categories": [
+        "reasoning",
+        "efficient",
+        "vision",
         "tools"
       ],
-      "openrouter": false,
-      "provider": "ollama"
+      "provider": "ollama-cloud",
+      "updated": "2026-05-22",
+      "pulls": "12.4M"
+    },
+    {
+      "id": "gemma4-27b",
+      "name": "Gemma 4 (27B)",
+      "organization": "Google",
+      "parameters": "27B",
+      "context_window": "128K",
+      "swe_bench": null,
+      "if_score": 85,
+      "categories": [
+        "coding",
+        "agent",
+        "reasoning",
+        "vision",
+        "audio"
+      ],
+      "provider": "ollama-cloud",
+      "updated": "2026-05-22",
+      "pulls": "10.1M",
+      "note": "Updated 2 days ago. Frontier-level performance at each size."
     },
     {
       "id": "minimax-m2.5",
@@ -466,13 +566,9 @@ const EMBEDDED_DATA = {
         "coding",
         "agent"
       ],
-      "description": "Лидер SWE-bench 80.2%. Полный lifecycle разработки.",
-      "tags": [
-        "coding",
-        "agent"
-      ],
-      "openrouter": false,
-      "provider": "ollama"
+      "provider": "ollama-cloud",
+      "updated": "2026-02-24",
+      "pulls": "2.2M"
     },
     {
       "id": "minimax-m2.7",
@@ -487,85 +583,42 @@ const EMBEDDED_DATA = {
         "agent",
         "efficient"
       ],
-      "description": "Самообучаемая. 56.2% SWE-Pro. 100 TPS. $0.30/M.",
-      "tags": [
-        "coding",
-        "agent",
-        "self-evolving"
-      ],
-      "openrouter": false,
-      "provider": "ollama"
+      "provider": "ollama-cloud",
+      "updated": "2026-03-24",
+      "pulls": "2.2M"
     },
     {
-      "id": "deepseek-v4-pro-max",
-      "name": "DeepSeek V4-Pro",
-      "organization": "DeepSeek",
-      "parameters": "1.6T/49B active MoE",
-      "context_window": "1M",
-      "swe_bench": 80.6,
-      "if_score": 89,
+      "id": "glm-5.1",
+      "name": "GLM-5.1",
+      "organization": "Z.ai",
+      "parameters": "744B/40B active",
+      "context_window": "128K",
+      "swe_bench": null,
+      "if_score": 90,
       "categories": [
-        "coding",
-        "agent",
-        "reasoning"
-      ],
-      "description": "SWE-V 80.6, LiveCodeBench 93.5(#1!), Terminal-Bench 67.9, Codeforces 3206, 1M ctx, 27% FLOPs vs V3.2. MIT.",
-      "tags": [
-        "coding",
-        "agent",
-        "thinking",
-        "tools"
-      ],
-      "openrouter": false,
-      "provider": "ollama-cloud"
-    },
-    {
-      "id": "deepseek-v4-flash",
-      "name": "DeepSeek V4-Pro",
-      "organization": "DeepSeek",
-      "parameters": "284B/13B active MoE",
-      "context_window": "1M",
-      "swe_bench": 79,
-      "if_score": 86,
-      "categories": [
-        "coding",
-        "efficient",
+        "reasoning",
         "agent"
       ],
-      "description": "SWE-V ~79%, Flash Max = Pro уровень reasoning. 13B active = ультрабыстрый. 1M ctx. FP4+FP8. MIT.",
-      "tags": [
-        "coding",
-        "efficient",
-        "agent",
-        "thinking"
-      ],
-      "openrouter": false,
-      "provider": "ollama-cloud"
+      "provider": "ollama-cloud",
+      "updated": "2026-04-24",
+      "pulls": "2.2M",
+      "note": "Next-gen flagship. SWE-Bench Pro SOTA."
     },
     {
-      "id": "kimi-k2-6",
-      "name": "Kimi K2.6",
-      "organization": "Moonshot AI",
-      "parameters": "1T/32B active MoE",
-      "context_window": "256K",
-      "swe_bench": 80.2,
-      "if_score": 91,
+      "id": "glm-5",
+      "name": "GLM-5",
+      "organization": "Z.ai",
+      "parameters": "744B/40B active",
+      "context_window": "128K",
+      "swe_bench": null,
+      "if_score": 90,
       "categories": [
-        "coding",
-        "agent",
-        "multimodal"
+        "reasoning",
+        "agent"
       ],
-      "description": "SWE-Pro 58.6(#1!), SWE-V 80.2, Terminal-Bench 66.7, HLE 54.0(#1!), BrowseComp 83.2. 13h autonomous. 300 sub-agent swarm. Modified MIT.",
-      "tags": [
-        "coding",
-        "agent",
-        "swarm",
-        "vision",
-        "thinking",
-        "tools"
-      ],
-      "openrouter": false,
-      "provider": "ollama-cloud"
+      "provider": "ollama-cloud",
+      "updated": "2026-02-24",
+      "pulls": "2.3M"
     },
     {
       "id": "nemotron-3-super",
@@ -580,1563 +633,853 @@ const EMBEDDED_DATA = {
         "reasoning",
         "efficient"
       ],
-      "description": "SWE-bench 60.5%. RULER@1M 91.75%! Но IF ниже — Mamba-layers иногда «теряют» инструкции в длинных промптах.",
-      "tags": [
-        "agent",
-        "1M-ctx",
-        "thinking"
-      ],
-      "openrouter": false,
-      "provider": "ollama"
+      "provider": "ollama-cloud",
+      "updated": "2026-03-24",
+      "pulls": "2.4M"
     },
     {
-      "id": "glm-5.1",
-      "name": "GLM-5",
-      "organization": "Z.ai",
-      "parameters": "744B/40B active",
+      "id": "nemotron-3-nano",
+      "name": "Nemotron 3 Nano",
+      "organization": "NVIDIA",
+      "parameters": "30B/4B",
       "context_window": "128K",
       "swe_bench": null,
-      "if_score": 90,
+      "if_score": 68,
       "categories": [
-        "reasoning",
-        "agent"
+        "agent",
+        "efficient"
       ],
-      "description": "Мощный reasoning. Arena ELO 1451. Отличный instruction following (IFEval ~90+).",
-      "tags": [
-        "reasoning",
-        "agent"
-      ],
-      "openrouter": false,
-      "provider": "ollama"
+      "provider": "ollama-cloud",
+      "updated": "2026-03-24",
+      "pulls": "453K"
     },
     {
-      "id": "deepseek-v4",
-      "name": "DeepSeek V4-Pro",
-      "organization": "DeepSeek",
-      "parameters": "Large MoE",
+      "id": "devstral-2",
+      "name": "Devstral 2",
+      "organization": "Mistral / Devstral",
+      "parameters": "123B",
+      "context_window": "128K",
+      "swe_bench": null,
+      "if_score": 80,
+      "categories": [
+        "coding",
+        "agent"
+      ],
+      "provider": "ollama-cloud",
+      "updated": "2026-02-24",
+      "pulls": "223.2K"
+    },
+    {
+      "id": "devstral-small-2",
+      "name": "Devstral Small 2",
+      "organization": "Mistral / Devstral",
+      "parameters": "24B",
       "context_window": "128K",
       "swe_bench": null,
       "if_score": 75,
-      "categories": [
-        "reasoning"
-      ],
-      "description": "Хороший reasoning, но IF нестабилен — иногда игнорирует формат вывода.",
-      "tags": [
-        "reasoning"
-      ],
-      "openrouter": false,
-      "provider": "ollama"
-    },
-    {
-      "id": "qwen3-5-122b",
-      "name": "Qwen 3.5 122B",
-      "organization": "Qwen",
-      "parameters": "122B/10B active",
-      "context_window": "128K",
-      "swe_bench": null,
-      "if_score": 92,
-      "categories": [
-        "reasoning",
-        "efficient"
-      ],
-      "description": "IFEval 92.6%! Лучший IF среди open-source. Multimodal. Thinking.",
-      "tags": [
-        "vision",
-        "thinking",
-        "tools"
-      ],
-      "openrouter": false,
-      "provider": "ollama"
-    },
-    {
-      "id": "qwen3-coder-next",
-      "name": "Qwen3-Coder-Next",
-      "organization": "Qwen",
-      "parameters": "80B/3B active",
-      "context_window": "128K",
-      "swe_bench": 70,
-      "if_score": 84,
       "categories": [
         "coding",
-        "efficient"
+        "agent"
       ],
-      "description": "70% SWE-bench с 3B active! Хороший IF для кодинга.",
-      "tags": [
-        "coding",
-        "efficient",
-        "tools"
-      ],
-      "openrouter": false,
-      "provider": "ollama"
-    },
-    {
-      "id": "cogito-2-1-671b",
-      "name": "Cogito 2.1 671B",
-      "organization": "Cognitive",
-      "parameters": "671B MoE",
-      "context_window": "128K",
-      "swe_bench": null,
-      "if_score": 76,
-      "categories": [
-        "reasoning"
-      ],
-      "description": "MIT лицензия. 671B total. IF неплохой, но уступает GLM/Qwen.",
-      "tags": [
-        "reasoning"
-      ],
-      "openrouter": false,
-      "provider": "ollama"
-    },
-    {
-      "id": "qwen3-6-plus",
-      "name": "Qwen 3.6 Plus",
-      "organization": "Qwen",
-      "parameters": "Hybrid MoE",
-      "context_window": "1M",
-      "swe_bench": 78.8,
-      "if_score": 91,
-      "categories": [
-        "coding",
-        "agent",
-        "reasoning"
-      ],
-      "description": "FREE на OpenRouter! 1M контекст. Always-on CoT. Превосходный IF — наследник Qwen 3.5 (92.6%).",
-      "tags": [
-        "coding",
-        "agent",
-        "1M-ctx",
-        "free"
-      ],
-      "openrouter": true,
-      "provider": "openrouter"
-    },
-    {
-      "id": "step-3-5-flash",
-      "name": "Step 3.5 Flash",
-      "organization": "StepFun",
-      "parameters": "MoE",
-      "context_window": "128K",
-      "swe_bench": null,
-      "if_score": 79,
-      "categories": [
-        "efficient"
-      ],
-      "description": "Бесплатна на OpenRouter. IF средний.",
-      "tags": [
-        "efficient",
-        "free"
-      ],
-      "openrouter": true,
-      "provider": "openrouter"
-    },
-    {
-      "id": "deepseek-r1",
-      "name": "DeepSeek R1",
-      "organization": "DeepSeek",
-      "parameters": "671B MoE",
-      "context_window": "128K",
-      "swe_bench": null,
-      "if_score": 73,
-      "categories": [
-        "reasoning"
-      ],
-      "description": "Мощные reasoning-цепочки. Но IF слабый — часто генерирует лишний reasoning вместо ответа.",
-      "tags": [
-        "reasoning",
-        "thinking",
-        "free"
-      ],
-      "openrouter": true,
-      "provider": "openrouter"
-    }
-  ],
-  "groq_models": [
-    {
-      "id": "openai/gpt-oss-20b",
-      "rpm": 30,
-      "rpd": "1K",
-      "tpm": "8K",
-      "tpd": "200K",
-      "speed": "1200+",
-      "use_case": "Ультра-быстрый fallback для лёгких ролей (markdown-validator)."
-    },
-    {
-      "id": "llama-3.1-8b-instant",
-      "rpm": 30,
-      "rpd": "14.4K",
-      "tpm": "6K",
-      "tpd": "500K",
-      "speed": "~800",
-      "use_case": "14.4K RPD! Самый высокий лимит. Для health-check / ping ролей."
-    },
-    {
-      "id": "groq/compound",
-      "rpm": 30,
-      "rpd": "250",
-      "tpm": "70K",
-      "tpd": "—",
-      "speed": "varies",
-      "use_case": "Мультимодельная агрегация. Для research-задач."
-    },
-    {
-      "id": "groq/compound-mini",
-      "rpm": 30,
-      "rpd": "250",
-      "tpm": "70K",
-      "tpd": "—",
-      "speed": "varies",
-      "use_case": "Лёгкая версия compound."
-    },
-    {
-      "id": "llama-prompt-guard-2",
-      "rpm": 30,
-      "rpd": "14.4K",
-      "tpm": "15K",
-      "tpd": "500K",
-      "speed": "~1K",
-      "use_case": "Security: входной фильтр для security-auditor (14.4K RPD!)."
+      "provider": "ollama-cloud",
+      "updated": "2026-02-24",
+      "pulls": "838.8K"
     }
   ],
+  "if_scores": {
+    "deepseek-v4-pro-max": 89,
+    "deepseek-v4-flash": 86,
+    "kimi-k2.6": 91,
+    "kimi-k2.5": 90,
+    "qwen3-coder-480b": 88,
+    "qwen3.5-122b": 92,
+    "gemma4-27b": 85,
+    "minimax-m2.5": 82,
+    "minimax-m2.7": 80,
+    "glm-5.1": 90,
+    "glm-5": 90,
+    "nemotron-3-super": 78,
+    "nemotron-3-nano": 68,
+    "devstral-2": 80,
+    "devstral-small-2": 75
+  },
   "agent_model_scores": [
     {
       "agent": "lead-developer",
       "current_model_index": 0,
-      "current_model_id": "qwen3-coder-480b",
-      "reasoning_effort": "H",
       "scores": {
         "qwen3-coder-480b": 92,
+        "deepseek-v4-pro-max": 88,
+        "deepseek-v4-flash": 85,
+        "kimi-k2.6": 90,
+        "kimi-k2.5": 88,
+        "qwen3.5-122b": 86,
+        "gemma4-27b": 83,
         "minimax-m2.5": 86,
         "minimax-m2.7": 82,
-        "nemotron-3-super": 70,
         "glm-5.1": 68,
-        "deepseek-v4-pro-max": 88,
-        "qwen3-5-122b": 66,
-        "qwen3-coder-next": 80,
-        "qwen3-6-plus": 88,
-        "kimi-k2-6": 90
+        "nemotron-3-super": 70,
+        "devstral-2": 84,
+        "devstral-small-2": 78
       }
     },
     {
       "agent": "frontend-developer",
-      "current_model_index": 1,
-      "current_model_id": "minimax-m2.5",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 86,
+        "deepseek-v4-pro-max": 82,
+        "deepseek-v4-flash": 80,
+        "kimi-k2.6": 86,
+        "kimi-k2.5": 84,
+        "qwen3.5-122b": 84,
+        "gemma4-27b": 85,
         "minimax-m2.5": 92,
         "minimax-m2.7": 88,
+        "glm-5.1": 56,
         "nemotron-3-super": 62,
-        "glm-5.1": 56,
-        "deepseek-v4-pro-max": 82,
-        "qwen3-5-122b": 60,
-        "qwen3-coder-next": 76,
-        "qwen3-6-plus": 88,
-        "kimi-k2-6": 86
-      }
-    },
-    {
-      "agent": "php-developer",
-      "current_model_index": 0,
-      "current_model_id": "qwen3-coder-480b",
-      "reasoning_effort": "H",
-      "scores": {
-        "qwen3-coder-480b": 87,
-        "minimax-m2.5": 76,
-        "minimax-m2.7": 72,
-        "nemotron-3-super": 64,
-        "glm-5.1": 56,
-        "deepseek-v4-pro-max": 74,
-        "qwen3-5-122b": 60,
-        "qwen3-coder-next": 76,
-        "qwen3-6-plus": 84,
-        "kimi-k2-6": 86
-      }
-    },
-    {
-      "agent": "python-developer",
-      "current_model_index": 0,
-      "current_model_id": "qwen3-coder-480b",
-      "reasoning_effort": "H",
-      "scores": {
-        "qwen3-coder-480b": 90,
-        "minimax-m2.5": 82,
-        "minimax-m2.7": 78,
-        "nemotron-3-super": 66,
-        "glm-5.1": 60,
-        "deepseek-v4-pro-max": 78,
-        "qwen3-5-122b": 64,
-        "qwen3-coder-next": 78,
-        "qwen3-6-plus": 88,
-        "kimi-k2-6": 88
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "backend-developer",
-      "current_model_index": 0,
-      "current_model_id": "qwen3-coder-480b",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 91,
+        "deepseek-v4-pro-max": 86,
+        "kimi-k2.6": 90,
+        "qwen3.5-122b": 85,
+        "gemma4-27b": 84,
         "minimax-m2.5": 84,
         "minimax-m2.7": 80,
-        "nemotron-3-super": 68,
         "glm-5.1": 63,
-        "deepseek-v4-pro-max": 86,
-        "qwen3-5-122b": 62,
-        "qwen3-coder-next": 78,
-        "qwen3-6-plus": 87,
-        "kimi-k2-6": 90
+        "nemotron-3-super": 68,
+        "devstral-2": 82,
+        "devstral-small-2": 76
       }
     },
     {
       "agent": "go-developer",
-      "current_model_index": 3,
-      "current_model_id": "deepseek-v4-pro-max",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 85,
+        "deepseek-v4-pro-max": 88,
+        "deepseek-v4-flash": 84,
+        "kimi-k2.6": 86,
+        "qwen3.5-122b": 80,
+        "gemma4-27b": 80,
         "minimax-m2.5": 78,
         "minimax-m2.7": 74,
-        "nemotron-3-super": 66,
         "glm-5.1": 58,
-        "deepseek-v4-pro-max": 88,
-        "qwen3-5-122b": 58,
-        "qwen3-coder-next": 74,
-        "qwen3-6-plus": 82,
-        "kimi-k2-6": 86
+        "nemotron-3-super": 66,
+        "devstral-2": 82,
+        "devstral-small-2": 74
       }
     },
     {
-      "agent": "flutter-developer",
-      "current_model_index": 0,
-      "current_model_id": "qwen3-coder-480b",
-      "reasoning_effort": "M",
+      "agent": "python-developer",
       "scores": {
-        "qwen3-coder-480b": 86,
-        "minimax-m2.5": 70,
-        "minimax-m2.7": 66,
-        "nemotron-3-super": 60,
-        "glm-5.1": 53,
+        "qwen3-coder-480b": 90,
         "deepseek-v4-pro-max": 78,
-        "qwen3-5-122b": 58,
-        "qwen3-coder-next": 74,
-        "qwen3-6-plus": 82,
-        "kimi-k2-6": 84
+        "kimi-k2.6": 88,
+        "qwen3.5-122b": 86,
+        "gemma4-27b": 82,
+        "minimax-m2.5": 82,
+        "minimax-m2.7": 78,
+        "glm-5.1": 60,
+        "nemotron-3-super": 66,
+        "devstral-2": 86,
+        "devstral-small-2": 80
+      }
+    },
+    {
+      "agent": "php-developer",
+      "scores": {
+        "qwen3-coder-480b": 87,
+        "deepseek-v4-pro-max": 74,
+        "kimi-k2.6": 86,
+        "qwen3.5-122b": 84,
+        "gemma4-27b": 82,
+        "minimax-m2.5": 76,
+        "minimax-m2.7": 72,
+        "glm-5.1": 56,
+        "nemotron-3-super": 64,
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "devops-engineer",
-      "current_model_index": -1,
-      "current_model_id": "kimi-k2.6",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 66,
+        "deepseek-v4-pro-max": 80,
+        "kimi-k2.6": 88,
+        "qwen3.5-122b": 75,
+        "gemma4-27b": 78,
         "minimax-m2.5": 53,
         "minimax-m2.7": 48,
-        "nemotron-3-super": 78,
         "glm-5.1": 75,
-        "deepseek-v4-pro-max": 86,
-        "qwen3-5-122b": 70,
-        "qwen3-coder-next": 54,
-        "qwen3-6-plus": 76,
-        "kimi-k2-6": 88
+        "nemotron-3-super": 78,
+        "devstral-2": 72,
+        "devstral-small-2": 68
       }
     },
     {
       "agent": "sdet-engineer",
-      "current_model_index": 0,
-      "current_model_id": "qwen3-coder-480b",
-      "reasoning_effort": "H",
       "scores": {
         "qwen3-coder-480b": 88,
+        "deepseek-v4-pro-max": 84,
+        "kimi-k2.6": 87,
+        "qwen3.5-122b": 86,
+        "gemma4-27b": 82,
         "minimax-m2.5": 84,
         "minimax-m2.7": 80,
-        "nemotron-3-super": 70,
         "glm-5.1": 63,
-        "deepseek-v4-pro-max": 84,
-        "qwen3-5-122b": 64,
-        "qwen3-coder-next": 78,
-        "qwen3-6-plus": 84,
-        "kimi-k2-6": 87
+        "nemotron-3-super": 70,
+        "devstral-2": 86,
+        "devstral-small-2": 80
       }
     },
     {
       "agent": "code-skeptic",
-      "current_model_index": 1,
-      "current_model_id": "minimax-m2.5",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 82,
+        "deepseek-v4-pro-max": 82,
+        "kimi-k2.6": 82,
+        "qwen3.5-122b": 80,
+        "gemma4-27b": 80,
         "minimax-m2.5": 85,
         "minimax-m2.7": 80,
-        "nemotron-3-super": 73,
         "glm-5.1": 72,
-        "deepseek-v4-pro-max": 82,
-        "qwen3-5-122b": 70,
-        "qwen3-coder-next": 72,
-        "qwen3-6-plus": 80,
-        "kimi-k2-6": 82
+        "nemotron-3-super": 73,
+        "devstral-2": 82,
+        "devstral-small-2": 76
       }
     },
     {
       "agent": "security-auditor",
-      "current_model_index": 3,
-      "current_model_id": "deepseek-v4-pro-max",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 76,
+        "deepseek-v4-pro-max": 80,
+        "kimi-k2.6": 80,
+        "qwen3.5-122b": 78,
+        "gemma4-27b": 78,
         "minimax-m2.5": 74,
         "minimax-m2.7": 68,
-        "nemotron-3-super": 76,
         "glm-5.1": 68,
-        "deepseek-v4-pro-max": 80,
-        "qwen3-5-122b": 72,
-        "qwen3-coder-next": 64,
-        "qwen3-6-plus": 75,
-        "kimi-k2-6": 80
+        "nemotron-3-super": 76,
+        "devstral-2": 78,
+        "devstral-small-2": 72
       }
     },
     {
       "agent": "performance-engineer",
-      "current_model_index": 3,
-      "current_model_id": "deepseek-v4-pro-max",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 78,
+        "deepseek-v4-pro-max": 84,
+        "kimi-k2.6": 82,
+        "qwen3.5-122b": 76,
+        "gemma4-27b": 76,
         "minimax-m2.5": 75,
         "minimax-m2.7": 70,
-        "nemotron-3-super": 78,
         "glm-5.1": 74,
-        "deepseek-v4-pro-max": 84,
-        "qwen3-5-122b": 70,
-        "qwen3-coder-next": 67,
-        "qwen3-6-plus": 76,
-        "kimi-k2-6": 82
+        "nemotron-3-super": 78,
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "the-fixer",
-      "current_model_index": -1,
-      "current_model_id": "kimi-k2.6",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 89,
+        "deepseek-v4-pro-max": 88,
+        "kimi-k2.6": 90,
+        "qwen3.5-122b": 86,
+        "gemma4-27b": 82,
         "minimax-m2.5": 88,
         "minimax-m2.7": 84,
-        "nemotron-3-super": 71,
         "glm-5.1": 64,
-        "deepseek-v4-pro-max": 88,
-        "qwen3-5-122b": 64,
-        "qwen3-coder-next": 82,
-        "qwen3-6-plus": 86,
-        "kimi-k2-6": 90
+        "nemotron-3-super": 71,
+        "devstral-2": 86,
+        "devstral-small-2": 82
       }
     },
     {
       "agent": "browser-automation",
-      "current_model_index": 0,
-      "current_model_id": "qwen3-coder-480b",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 87,
+        "deepseek-v4-pro-max": 82,
+        "kimi-k2.6": 86,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 84,
         "minimax-m2.5": 72,
         "minimax-m2.7": 68,
-        "nemotron-3-super": 61,
         "glm-5.1": 53,
-        "deepseek-v4-pro-max": 82,
-        "qwen3-5-122b": 56,
-        "qwen3-coder-next": 72,
-        "qwen3-6-plus": 82,
-        "kimi-k2-6": 86
+        "nemotron-3-super": 61,
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "visual-tester",
-      "current_model_index": 0,
-      "current_model_id": "qwen3-coder-480b",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 82,
+        "deepseek-v4-pro-max": 76,
+        "kimi-k2.6": 78,
+        "qwen3.5-122b": 76,
+        "gemma4-27b": 78,
         "minimax-m2.5": 68,
         "minimax-m2.7": 64,
-        "nemotron-3-super": 55,
         "glm-5.1": 48,
-        "deepseek-v4-pro-max": 76,
-        "qwen3-5-122b": 54,
-        "qwen3-coder-next": 66,
-        "qwen3-6-plus": 76,
-        "kimi-k2-6": 78
+        "nemotron-3-super": 55,
+        "devstral-2": 74,
+        "devstral-small-2": 68
       }
     },
     {
       "agent": "system-analyst",
-      "current_model_index": 7,
-      "current_model_id": "glm-5.1",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 70,
+        "deepseek-v4-pro-max": 88,
+        "kimi-k2.6": 86,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 82,
         "minimax-m2.5": 66,
         "minimax-m2.7": 63,
-        "nemotron-3-super": 74,
         "glm-5.1": 82,
-        "deepseek-v4-pro-max": 88,
-        "qwen3-5-122b": 76,
-        "qwen3-coder-next": 58,
-        "qwen3-6-plus": 80,
-        "kimi-k2-6": 86
+        "nemotron-3-super": 74,
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "capability-analyst",
-      "current_model_index": 7,
-      "current_model_id": "glm-5.1",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 72,
+        "deepseek-v4-pro-max": 82,
+        "kimi-k2.6": 82,
+        "qwen3.5-122b": 80,
+        "gemma4-27b": 80,
         "minimax-m2.5": 68,
         "minimax-m2.7": 66,
-        "nemotron-3-super": 76,
         "glm-5.1": 78,
-        "deepseek-v4-pro-max": 82,
-        "qwen3-5-122b": 75,
-        "qwen3-coder-next": 60,
-        "qwen3-6-plus": 79,
-        "kimi-k2-6": 82
+        "nemotron-3-super": 76,
+        "devstral-2": 78,
+        "devstral-small-2": 72
       }
     },
     {
       "agent": "orchestrator",
-      "current_model_index": -1,
-      "current_model_id": "kimi-k2.6",
-      "reasoning_effort": "H",
       "scores": {
         "qwen3-coder-480b": 74,
+        "deepseek-v4-pro-max": 86,
+        "kimi-k2.6": 92,
+        "qwen3.5-122b": 84,
+        "gemma4-27b": 82,
         "minimax-m2.5": 70,
         "minimax-m2.7": 68,
-        "nemotron-3-super": 80,
         "glm-5.1": 82,
-        "deepseek-v4-pro-max": 86,
-        "qwen3-5-122b": 78,
-        "qwen3-coder-next": 62,
-        "qwen3-6-plus": 84,
-        "kimi-k2-6": 92
+        "nemotron-3-super": 80,
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "release-manager",
-      "current_model_index": 7,
-      "current_model_id": "glm-5.1",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 72,
+        "deepseek-v4-pro-max": 78,
+        "kimi-k2.6": 78,
+        "qwen3.5-122b": 76,
+        "gemma4-27b": 76,
         "minimax-m2.5": 66,
         "minimax-m2.7": 64,
-        "nemotron-3-super": 74,
         "glm-5.1": 76,
-        "deepseek-v4-pro-max": 78,
-        "qwen3-5-122b": 72,
-        "qwen3-coder-next": 60,
-        "qwen3-6-plus": 76,
-        "kimi-k2-6": 78
+        "nemotron-3-super": 74,
+        "devstral-2": 76,
+        "devstral-small-2": 70
       }
     },
     {
       "agent": "evaluator",
-      "current_model_index": 7,
-      "current_model_id": "glm-5.1",
-      "reasoning_effort": "H",
       "scores": {
         "qwen3-coder-480b": 70,
+        "deepseek-v4-pro-max": 84,
+        "kimi-k2.6": 84,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 80,
         "minimax-m2.5": 73,
         "minimax-m2.7": 70,
-        "nemotron-3-super": 78,
         "glm-5.1": 78,
-        "deepseek-v4-pro-max": 84,
-        "qwen3-5-122b": 76,
-        "qwen3-coder-next": 58,
-        "qwen3-6-plus": 81,
-        "kimi-k2-6": 84
+        "nemotron-3-super": 78,
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "prompt-optimizer",
-      "current_model_index": -1,
-      "current_model_id": "qwen3.6-plus",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 76,
+        "deepseek-v4-pro-max": 80,
+        "kimi-k2.6": 82,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 80,
         "minimax-m2.5": 74,
         "minimax-m2.7": 72,
-        "nemotron-3-super": 76,
         "glm-5.1": 75,
-        "deepseek-v4-pro-max": 80,
-        "qwen3-5-122b": 74,
-        "qwen3-coder-next": 64,
-        "qwen3-6-plus": 83,
-        "kimi-k2-6": 82
+        "nemotron-3-super": 76,
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "product-owner",
-      "current_model_index": 7,
-      "current_model_id": "glm-5.1",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 60,
+        "deepseek-v4-pro-max": 76,
+        "kimi-k2.6": 76,
+        "qwen3.5-122b": 76,
+        "gemma4-27b": 76,
         "minimax-m2.5": 56,
         "minimax-m2.7": 54,
-        "nemotron-3-super": 74,
         "glm-5.1": 78,
-        "deepseek-v4-pro-max": 76,
-        "qwen3-5-122b": 74,
-        "qwen3-coder-next": 48,
-        "qwen3-6-plus": 78,
-        "kimi-k2-6": 76
+        "nemotron-3-super": 74,
+        "devstral-2": 76,
+        "devstral-small-2": 70
       }
     },
     {
       "agent": "pipeline-judge",
-      "current_model_index": 7,
-      "current_model_id": "glm-5.1",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 64,
+        "deepseek-v4-pro-max": 82,
+        "kimi-k2.6": 84,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 80,
         "minimax-m2.5": 68,
         "minimax-m2.7": 65,
-        "nemotron-3-super": 78,
         "glm-5.1": 76,
-        "deepseek-v4-pro-max": 82,
-        "qwen3-5-122b": 74,
-        "qwen3-coder-next": 56,
-        "qwen3-6-plus": 80,
-        "kimi-k2-6": 84
+        "nemotron-3-super": 78,
+        "devstral-2": 78,
+        "devstral-small-2": 72
       }
     },
     {
       "agent": "workflow-architect",
-      "current_model_index": 7,
-      "current_model_id": "glm-5.1",
-      "reasoning_effort": "H",
       "scores": {
         "qwen3-coder-480b": 68,
+        "deepseek-v4-pro-max": 80,
+        "kimi-k2.6": 82,
+        "qwen3.5-122b": 80,
+        "gemma4-27b": 80,
         "minimax-m2.5": 62,
         "minimax-m2.7": 60,
-        "nemotron-3-super": 76,
         "glm-5.1": 76,
-        "deepseek-v4-pro-max": 80,
-        "qwen3-5-122b": 72,
-        "qwen3-coder-next": 56,
-        "qwen3-6-plus": 80,
-        "kimi-k2-6": 82
+        "nemotron-3-super": 76,
+        "devstral-2": 78,
+        "devstral-small-2": 72
       }
     },
     {
       "agent": "markdown-validator",
-      "current_model_index": 3,
-      "current_model_id": "deepseek-v4-pro-max",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 43,
+        "deepseek-v4-pro-max": 68,
+        "kimi-k2.6": 56,
+        "qwen3.5-122b": 56,
+        "gemma4-27b": 60,
         "minimax-m2.5": 38,
         "minimax-m2.7": 36,
-        "nemotron-3-super": 52,
         "glm-5.1": 55,
-        "deepseek-v4-pro-max": 68,
-        "qwen3-5-122b": 56,
-        "qwen3-coder-next": 40,
-        "qwen3-6-plus": 50,
-        "kimi-k2-6": 56
+        "nemotron-3-super": 52,
+        "nemotron-3-nano": 70,
+        "devstral-2": 65,
+        "devstral-small-2": 62
       }
     },
     {
       "agent": "agent-architect",
-      "current_model_index": -1,
-      "current_model_id": "kimi-k2.6",
-      "reasoning_effort": "H",
       "scores": {
         "qwen3-coder-480b": 78,
+        "deepseek-v4-pro-max": 82,
+        "kimi-k2.6": 86,
+        "qwen3.5-122b": 80,
+        "gemma4-27b": 82,
         "minimax-m2.5": 72,
         "minimax-m2.7": 70,
-        "nemotron-3-super": 78,
         "glm-5.1": 76,
-        "deepseek-v4-pro-max": 82,
-        "qwen3-5-122b": 76,
-        "qwen3-coder-next": 66,
-        "qwen3-6-plus": 82,
-        "kimi-k2-6": 86
+        "nemotron-3-super": 78,
+        "devstral-2": 80,
+        "devstral-small-2": 74
       }
     },
     {
       "agent": "planner",
-      "current_model_index": 3,
-      "current_model_id": "deepseek-v4-pro-max",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 72,
+        "deepseek-v4-pro-max": 88,
+        "kimi-k2.6": 86,
+        "qwen3.5-122b": 86,
+        "gemma4-27b": 84,
         "minimax-m2.5": 68,
         "minimax-m2.7": 66,
-        "nemotron-3-super": 80,
         "glm-5.1": 78,
-        "deepseek-v4-pro-max": 88,
-        "qwen3-5-122b": 78,
-        "qwen3-coder-next": 60,
-        "qwen3-6-plus": 85,
-        "kimi-k2-6": 86
+        "nemotron-3-super": 80,
+        "devstral-2": 84,
+        "devstral-small-2": 78
       }
     },
     {
       "agent": "reflector",
-      "current_model_index": 3,
-      "current_model_id": "deepseek-v4-pro-max",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 68,
+        "deepseek-v4-pro-max": 84,
+        "kimi-k2.6": 80,
+        "qwen3.5-122b": 80,
+        "gemma4-27b": 80,
         "minimax-m2.5": 66,
         "minimax-m2.7": 64,
-        "nemotron-3-super": 78,
         "glm-5.1": 76,
-        "deepseek-v4-pro-max": 84,
-        "qwen3-5-122b": 76,
-        "qwen3-coder-next": 56,
-        "qwen3-6-plus": 82,
-        "kimi-k2-6": 80
+        "nemotron-3-super": 78,
+        "devstral-2": 82,
+        "devstral-small-2": 76
       }
     },
     {
       "agent": "memory-manager",
-      "current_model_index": -1,
-      "current_model_id": "qwen3.6-plus",
-      "reasoning_effort": "M",
       "scores": {
         "qwen3-coder-480b": 63,
+        "deepseek-v4-pro-max": 86,
+        "kimi-k2.6": 84,
+        "qwen3.5-122b": 85,
+        "gemma4-27b": 82,
         "minimax-m2.5": 58,
         "minimax-m2.7": 56,
-        "nemotron-3-super": 86,
         "glm-5.1": 72,
-        "deepseek-v4-pro-max": 86,
-        "qwen3-5-122b": 70,
-        "qwen3-coder-next": 50,
-        "qwen3-6-plus": 87,
-        "kimi-k2-6": 84
+        "nemotron-3-super": 86,
+        "devstral-2": 78,
+        "devstral-small-2": 72
       }
     },
     {
       "agent": "architect-indexer",
-      "current_model_index": 7,
-      "current_model_id": "glm-5.1",
-      "reasoning_effort": "H",
       "scores": {
         "qwen3-coder-480b": 70,
+        "deepseek-v4-pro-max": 78,
+        "kimi-k2.6": 84,
+        "qwen3.5-122b": 80,
+        "gemma4-27b": 80,
         "minimax-m2.5": 64,
         "minimax-m2.7": 62,
-        "nemotron-3-super": 74,
         "glm-5.1": 80,
+        "nemotron-3-super": 74,
+        "devstral-2": 78,
+        "devstral-small-2": 72
+      }
+    },
+    {
+      "agent": "flutter-developer",
+      "scores": {
+        "qwen3-coder-480b": 86,
         "deepseek-v4-pro-max": 78,
-        "qwen3-5-122b": 76,
-        "qwen3-coder-next": 58,
-        "qwen3-6-plus": 80,
-        "kimi-k2-6": 84
+        "kimi-k2.6": 84,
+        "qwen3.5-122b": 84,
+        "gemma4-27b": 84,
+        "minimax-m2.5": 70,
+        "minimax-m2.7": 66,
+        "glm-5.1": 53,
+        "nemotron-3-super": 60,
+        "devstral-2": 78,
+        "devstral-small-2": 74
       }
     }
   ],
-  "if_scores": {
-    "qwen3-coder-480b": 88,
-    "minimax-m2.5": 82,
-    "minimax-m2.7": 78,
-    "nemotron-3-super": 85,
-    "glm-5.1": 80,
-    "deepseek-v4-pro-max": 88,
-    "qwen3-5-122b": 86,
-    "qwen3-coder-next": 84,
-    "qwen3-6-plus": 90,
-    "kimi-k2-6": 91,
-    "deepseek-v4-flash": 86
-  },
   "agent_current_config": [
     {
       "agent": "lead-developer",
       "model": "ollama-cloud/qwen3-coder:480b",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 92,
+      "status": "optimal"
     },
     {
       "agent": "frontend-developer",
       "model": "ollama-cloud/minimax-m2.5",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
-    },
-    {
-      "agent": "php-developer",
-      "model": "ollama-cloud/qwen3-coder:480b",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
-    },
-    {
-      "agent": "python-developer",
-      "model": "ollama-cloud/qwen3-coder:480b",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 92,
+      "status": "optimal"
     },
     {
       "agent": "backend-developer",
       "model": "ollama-cloud/qwen3-coder:480b",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 91,
+      "status": "optimal"
     },
     {
       "agent": "go-developer",
       "model": "ollama-cloud/deepseek-v4-pro-max",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 88,
+      "status": "optimal"
+    },
+    {
+      "agent": "python-developer",
+      "model": "ollama-cloud/qwen3-coder:480b",
+      "fit_score": 90,
+      "status": "optimal"
+    },
+    {
+      "agent": "php-developer",
+      "model": "ollama-cloud/qwen3-coder:480b",
+      "fit_score": 87,
+      "status": "optimal"
     },
     {
       "agent": "flutter-developer",
       "model": "ollama-cloud/qwen3-coder:480b",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 86,
+      "status": "optimal"
     },
     {
       "agent": "devops-engineer",
       "model": "ollama-cloud/kimi-k2.6",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "nemotron",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 88,
+      "status": "optimal"
     },
     {
       "agent": "sdet-engineer",
       "model": "ollama-cloud/qwen3-coder:480b",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 88,
+      "status": "optimal"
     },
     {
       "agent": "code-skeptic",
       "model": "ollama-cloud/minimax-m2.5",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "minimax",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 85,
+      "status": "optimal"
     },
     {
       "agent": "security-auditor",
       "model": "ollama-cloud/deepseek-v4-pro-max",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "nemotron",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 80,
+      "status": "good"
     },
     {
       "agent": "performance-engineer",
       "model": "ollama-cloud/deepseek-v4-pro-max",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "nemotron",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 84,
+      "status": "optimal"
     },
     {
       "agent": "the-fixer",
       "model": "ollama-cloud/kimi-k2.6",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "minimax",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 90,
+      "status": "optimal"
     },
     {
       "agent": "browser-automation",
       "model": "ollama-cloud/qwen3-coder:480b",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 87,
+      "status": "optimal"
     },
     {
       "agent": "visual-tester",
       "model": "ollama-cloud/qwen3-coder:480b",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "qwen",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 82,
+      "status": "good"
     },
     {
       "agent": "system-analyst",
       "model": "ollama-cloud/glm-5.1",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 82,
+      "status": "good"
     },
     {
       "agent": "capability-analyst",
       "model": "ollama-cloud/glm-5.1",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 78,
+      "status": "good"
     },
     {
       "agent": "orchestrator",
       "model": "ollama-cloud/kimi-k2.6",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "kimi",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 92,
+      "status": "optimal"
     },
     {
       "agent": "release-manager",
       "model": "ollama-cloud/glm-5.1",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 76,
+      "status": "good"
     },
     {
       "agent": "evaluator",
       "model": "ollama-cloud/glm-5.1",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 78,
+      "status": "good"
     },
     {
       "agent": "prompt-optimizer",
-      "model": "ollama-cloud/qwen3.6-plus",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "model": "ollama-cloud/qwen3.5",
+      "fit_score": 82,
+      "status": "recommended"
     },
     {
       "agent": "product-owner",
       "model": "ollama-cloud/glm-5.1",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 78,
+      "status": "good"
     },
     {
       "agent": "pipeline-judge",
       "model": "ollama-cloud/glm-5.1",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 76,
+      "status": "good"
     },
     {
       "agent": "workflow-architect",
       "model": "ollama-cloud/glm-5.1",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 76,
+      "status": "good"
     },
     {
       "agent": "markdown-validator",
       "model": "ollama-cloud/deepseek-v4-pro-max",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "nemotron",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 68,
+      "status": "poor"
     },
     {
       "agent": "agent-architect",
       "model": "ollama-cloud/kimi-k2.6",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 86,
+      "status": "optimal"
     },
     {
       "agent": "planner",
       "model": "ollama-cloud/deepseek-v4-pro-max",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "nemotron",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 88,
+      "status": "optimal"
     },
     {
       "agent": "reflector",
       "model": "ollama-cloud/deepseek-v4-pro-max",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "nemotron",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 84,
+      "status": "optimal"
     },
     {
       "agent": "memory-manager",
-      "model": "ollama-cloud/qwen3.6-plus",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "nemotron",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "model": "ollama-cloud/qwen3.5",
+      "fit_score": 85,
+      "status": "recommended"
     },
     {
       "agent": "architect-indexer",
       "model": "ollama-cloud/glm-5.1",
-      "provider": "Ollama Cloud",
-      "category": "Process",
-      "badge_type": "glm",
-      "fit_score": 0,
-      "status": "good",
-      "previous_model": null
+      "fit_score": 80,
+      "status": "good"
     }
   ],
   "recommendations": [
     {
-      "agent": "[built-in] debug",
-      "from_model": "glm-5.1.1 (88)",
-      "from_provider": "Ollama",
-      "to_model": "V4-Pro Max (★90) / K2.6 (★90) RE:High",
-      "to_provider": "Ollama Cloud",
+      "agent": "prompt-optimizer",
+      "from_model": "ollama-cloud/qwen3.6-plus (openrouter)",
+      "to_model": "ollama-cloud/qwen3.5",
+      "reason": "Migrated to Ollama Cloud. IF 92, vision+tools+thinking. Same quality, no rate limits.",
       "impact": "high",
-      "quality_change": "+2%",
-      "speed_change": "~1x",
-      "context_change": "200K→1M",
-      "provider_change": "Ollama Cloud",
-      "rationale": "★ матрицы: V4-Pro=90 и K2.6=90 (TIE!), GLM-5.1=88. V4-Pro: LiveCodeBench 93.5(#1!), Terminal 67.9, 1M ctx для полного проекта. K2.6: 13h auto sessions. Оба лучше GLM-5.1. RE:High для debug."
+      "applied": false
     },
     {
-      "agent": "planner",
-      "from_model": "nemotron-3-super (80)",
-      "from_provider": "Ollama",
-      "to_model": "V4-Pro Max (★88) RE:High",
-      "to_provider": "Ollama Cloud",
+      "agent": "memory-manager",
+      "from_model": "ollama-cloud/qwen3.6-plus (openrouter)",
+      "to_model": "ollama-cloud/qwen3.5",
+      "reason": "Migrated to Ollama Cloud. Caveat: qwen3.5 has a 128K context window, not 1M. Larger-context alternatives: kimi-k2.6 (256K) or deepseek-v4 (1M). Matrix scores: qwen3.5=85 vs kimi-k2.6=84 vs deepseek=86.",
       "impact": "high",
-      "quality_change": "+10%",
-      "speed_change": "~1x",
-      "context_change": "1M",
-      "provider_change": "Ollama Cloud",
-      "rationale": "★ матрицы: V4-Pro=88(лучший!), K2.6=86, GLM-5.1=85, Nem=80. V4-Pro: GPQA 90.1 (reasoning), 1M ctx сохраняется (vs потеря при K2.6). RE:High для chain-of-thought planning."
+      "applied": false
     },
     {
-      "agent": "go-developer",
-      "from_model": "qwen3-coder:480b (85)",
-      "from_provider": "Ollama",
-      "to_model": "V4-Pro Max (★88) RE:Medium",
-      "to_provider": "Ollama Cloud",
+      "agent": "markdown-validator",
+      "from_model": "ollama-cloud/deepseek-v4-pro-max",
+      "to_model": "ollama-cloud/nemotron-3-nano",
+      "reason": "Markdown validator scores are lowest (68 max). Nemotron-3-Nano IF=68 but is tiny (4B/30B), extremely cheap. For lightweight validation tasks, nano is sufficient.",
       "impact": "medium",
-      "quality_change": "+4%",
-      "speed_change": "~1x",
-      "context_change": "256K→1M",
-      "provider_change": "Ollama Cloud",
-      "rationale": "★ матрицы: V4-Pro=88(лучший для Go!), K2.6=86, Qwen3Coder=85. DeepSeek модели традиционно сильны в Go/Rust. 1M ctx для крупных Go-проектов."
+      "applied": false
     },
     {
-      "agent": "history-miner",
-      "from_model": "nemotron-3-super (★85)",
-      "from_provider": "Ollama",
-      "to_model": "V4-Pro Max (86) + Nem fallback",
-      "to_provider": "Hybrid",
+      "agent": "markdown-validator",
+      "from_model": "ollama-cloud/deepseek-v4-pro-max",
+      "to_model": "ollama-cloud/gemma4-27b",
+      "reason": "Gemma 4 is newest (2 days), frontier at each size. Scores 60 for validator vs 70 for nemotron-3-nano, so nano is better for this role. But gemma4 is newer and more general.",
+      "impact": "low",
+      "applied": false
+    },
+    {
+      "agent": "system-analyst",
+      "from_model": "ollama-cloud/glm-5.1",
+      "to_model": "ollama-cloud/deepseek-v4-pro-max",
+      "reason": "Matrix: deepseek-v4-pro-max=88 vs glm-5.1=82. +6% quality, 1M context for architecture docs. GLM-5.1 still strong for standardization.",
       "impact": "medium",
-      "quality_change": "+1%",
-      "speed_change": "~1x",
-      "context_change": "1M",
-      "provider_change": "Ollama Cloud + Ollama",
-      "rationale": "V4-Pro=86 чуть лучше Nemotron=85. 1M ctx у обоих. MRCR 83.5 у V4-Pro — лучшее long-context retrieval. Nemotron как fallback (RULER 91.75%)."
+      "applied": false
     },
     {
-      "agent": "frontend-dev → M2.5",
-      "from_model": "qwen3-coder (90)",
-      "from_provider": "Ollama",
-      "to_model": "MiniMax M2.5 (★92) ✅",
-      "to_provider": "Ollama",
-      "impact": "low",
-      "quality_change": "+2%",
-      "speed_change": "=",
-      "context_change": "204K",
-      "provider_change": "Ollama",
-      "rationale": "Spec-writing, UI architect. APPLIED."
-    },
-    {
-      "agent": "devops → K2.6",
-      "from_model": "deepseek-v3.2",
-      "from_provider": "",
-      "to_model": "kimi-k2.6 ✅",
-      "to_provider": "Ollama Cloud",
-      "impact": "low",
-      "quality_change": "+35%",
-      "speed_change": "=",
-      "context_change": "256K",
-      "provider_change": "",
-      "rationale": "APPLIED."
-    },
-    {
-      "agent": "orchestrator",
-      "from_model": "glm-5.1.1 (★90)",
-      "from_provider": "Ollama",
-      "to_model": "K2.6 (★92) RE:Medium",
-      "to_provider": "Ollama Cloud",
+      "agent": "evaluator",
+      "from_model": "ollama-cloud/glm-5.1",
+      "to_model": "ollama-cloud/kimi-k2.6",
+      "reason": "Matrix: kimi-k2.6=84 vs glm-5.1=78. +6%. IF=91 for scoring accuracy. High reasoning needed.",
       "impact": "medium",
-      "quality_change": "+2%",
-      "speed_change": "~1x",
-      "context_change": "200K→256K",
-      "provider_change": "Ollama Cloud",
-      "rationale": "K2.6=92★ всё ещё лучший для orchestration. V4-Pro=86 слабее. 300 sub-agent swarm."
+      "applied": false
     },
     {
-      "agent": "the-fixer",
-      "from_model": "minimax-m2.5 (★88)",
-      "from_provider": "Ollama",
-      "to_model": "V4-Pro (★88) / K2.6 (★90)",
-      "to_provider": "Ollama Cloud",
+      "agent": "evaluator",
+      "from_model": "ollama-cloud/glm-5.1",
+      "to_model": "ollama-cloud/deepseek-v4-pro-max",
+      "reason": "Alternative to kimi-k2.6. deepseek-v4-pro-max=84 (same as kimi), but 1M context. Could be better for large evaluation tasks.",
       "impact": "medium",
-      "quality_change": "+2%",
-      "speed_change": "~1x",
-      "context_change": "128K→1M/256K",
-      "provider_change": "Ollama Cloud",
-      "rationale": "K2.6=90(лучший), V4-Pro=88=M2.5. M2.5 SWE-bench 80.2% стабильнее. Не срочно."
+      "applied": false
     },
     {
-      "agent": "Qwen3-Coder (7 coding)",
-      "from_model": "qwen3-coder",
-      "from_provider": "Ollama",
-      "to_model": "✅",
-      "to_provider": "",
+      "agent": "security-auditor",
+      "from_model": "ollama-cloud/deepseek-v4-pro-max",
+      "to_model": "ollama-cloud/kimi-k2.6",
+      "reason": "Matrix: both 80. But kimi-k2.6 has multimodal (vision) which could help with screenshot-based security analysis. Tie.",
       "impact": "low",
-      "quality_change": "=0%",
-      "speed_change": "=",
-      "context_change": "256K",
-      "provider_change": "Ollama",
-      "rationale": "lead=92★, backend=91★, python=90★."
+      "applied": false
     },
     {
-      "agent": "GLM-5.1 (12 agents)",
-      "from_model": "glm-5.1.1",
-      "from_provider": "Ollama",
-      "to_model": "✅",
-      "to_provider": "",
-      "impact": "low",
-      "quality_change": "=0%",
-      "speed_change": "=",
-      "context_change": "200K",
-      "provider_change": "",
-      "rationale": "orchestrator=90, system-analyst=90. SWE-Pro #1."
+      "agent": "gemma4-trial",
+      "from_model": "none",
+      "to_model": "ollama-cloud/gemma4-27b",
+      "reason": "Gemma 4 is brand new (2 days), 10.1M pulls, frontier at each size, vision+audio+thinking. Could be game-changer for frontend-dev, browser-automation, visual-tester.",
+      "impact": "high",
+      "applied": false,
+      "note": "Requires A/B test on frontend task."
     },
     {
-      "agent": "Kimi K2.6 (3 agents)",
-      "from_model": "kimi-k2.6",
-      "from_provider": "Ollama Cloud",
-      "to_model": "✅",
-      "to_provider": "",
-      "impact": "low",
-      "quality_change": "=0%",
-      "speed_change": "=",
-      "context_change": "256K",
-      "provider_change": "",
-      "rationale": "devops=88★, browser=86, agent-arch=86."
+      "agent": "qwen3.5-trial",
+      "from_model": "none",
+      "to_model": "ollama-cloud/qwen3.5-122b",
+      "reason": "Qwen 3.5 updated 2 days ago, 12.4M pulls, IF=92 (highest!), multimodal. Could replace GLM-5.1 for reasoning tasks and qwen3-coder for some coding tasks.",
+      "impact": "high",
+      "applied": false,
+      "note": "Requires A/B test on planner/evaluator tasks."
     }
   ],
-  "impact_data": [
+  "new_models_to_consider": [
     {
-      "category": "debug GLM5.1→V4-Pro/K2.6",
-      "before": 88,
-      "after": 90,
-      "delta": 2,
-      "notes": "LiveCodeBench 93.5, Terminal 67.9"
+      "id": "gemma4-27b",
+      "priority": "critical",
+      "rationale": "Updated 2 days ago. 10.1M pulls. Frontier-level at each size. Vision + audio + thinking + tools + cloud. Potentially replaces qwen3-coder for some tasks."
     },
     {
-      "category": "planner Nem→V4-Pro Max",
-      "before": 80,
-      "after": 88,
-      "delta": 8,
-      "notes": "★88! GPQA 90.1, 1M ctx"
+      "id": "qwen3.5-122b",
+      "priority": "critical",
+      "rationale": "Updated 2 days ago. 12.4M pulls. IF=92 highest among tracked. Multimodal. Could replace glm-5.1 for reasoning and compete with qwen3-coder for coding."
     },
     {
-      "category": "go-dev Coder→V4-Pro Max",
-      "before": 85,
-      "after": 88,
-      "delta": 3,
-      "notes": "★88! Go/Rust specialist, 1M ctx"
+      "id": "deepseek-v4-flash",
+      "priority": "medium",
+      "rationale": "Same family as pro-max but much faster (13B active vs 49B). Good for low-latency agents: code-skeptic, browser-automation."
     },
     {
-      "category": "history-miner →V4-Pro",
-      "before": 85,
-      "after": 86,
-      "delta": 1,
-      "notes": "MRCR 83.5, long-context"
-    },
-    {
-      "category": "orchestrator →K2.6 (next)",
-      "before": 90,
-      "after": 92,
-      "delta": 2,
-      "notes": "300 sub-agent swarm"
-    },
-    {
-      "category": "frontend → M2.5 ✅",
-      "before": 90,
-      "after": 92,
-      "delta": 2,
-      "notes": "Spec-writing, UI architect"
-    },
-    {
-      "category": "devops → K2.6 ✅",
-      "before": 65,
-      "after": 88,
-      "delta": 23,
-      "notes": "IF:65→91! Terminal 66.7"
-    },
-    {
-      "category": "Qwen3-Coder (7) ✅",
-      "before": 90,
-      "after": 90,
-      "delta": 0,
-      "notes": "SOTA coding"
-    },
-    {
-      "category": "GLM-5.1 (12) ✅",
-      "before": 87,
-      "after": 87,
-      "delta": 0,
-      "notes": "SWE-Pro #1"
-    },
-    {
-      "category": "Nemotron Super (6) ✅",
-      "before": 82,
-      "after": 82,
-      "delta": 0,
-      "notes": "1M ctx, RULER 91.75%"
+      "id": "devstral-2",
+      "priority": "medium",
+      "rationale": "123B model for tool use and codebase exploration. Could be strong for lead-developer on large projects."
     }
-  ],
-  "benchmark_comparison": {
-    "benchmarks": [
-      {
-        "name": "SWE-V",
-        "full_name": "SWE-Bench Verified",
-        "description": "GitHub issue resolution (500 tasks)",
-        "roles": "lead-dev, backend, fixer"
-      },
-      {
-        "name": "SWE-P",
-        "full_name": "SWE-Bench Pro",
-        "description": "Multi-lang, decontaminated (1865 tasks)",
-        "roles": "all coding agents"
-      },
-      {
-        "name": "T-Bench",
-        "full_name": "Terminal-Bench 2.0",
-        "description": "CLI/shell multi-step tasks",
-        "roles": "devops, planner, orchestrator"
-      },
-      {
-        "name": "LCB",
-        "full_name": "LiveCodeBench",
-        "description": "Code gen from specs (held-out)",
-        "roles": "sdet, go-dev, python-dev"
-      },
-      {
-        "name": "GPQA",
-        "full_name": "GPQA Diamond",
-        "description": "PhD-level reasoning",
-        "roles": "system-analyst, planner"
-      },
-      {
-        "name": "BComp",
-        "full_name": "BrowseComp",
-        "description": "Web research & synthesis",
-        "roles": "browser-auto, capability-analyst"
-      },
-      {
-        "name": "HLE",
-        "full_name": "Humanity Last Exam",
-        "description": "Frontier knowledge (with tools)",
-        "roles": "agent-architect, evaluator"
-      },
-      {
-        "name": "Ctx",
-        "full_name": "Context Window",
-        "description": "Max tokens in one pass",
-        "roles": "history-miner, memory-mgr"
-      },
-      {
-        "name": "$/M",
-        "full_name": "Cost per 1M input",
-        "description": "API pricing",
-        "roles": "all agents (ROI)"
-      }
-    ],
-    "closed_source_models": [
-      {
-        "name": "Claude Opus 4.7",
-        "organization": "Anthropic",
-        "scores": [
-          87.6,
-          64.3,
-          69.4,
-          null,
-          94.2,
-          79.3,
-          53,
-          "1M",
-          "$5"
-        ],
-        "color": "#c084fc",
-        "note": "#1 апрель 2026"
-      },
-      {
-        "name": "GPT-5.5",
-        "organization": "OpenAI",
-        "scores": [
-          null,
-          58.6,
-          82.7,
-          null,
-          null,
-          83.4,
-          57.2,
-          "1M",
-          "$5"
-        ],
-        "color": "#ff6b81",
-        "note": "Новейший, Terminal #1"
-      },
-      {
-        "name": "GPT-5.4",
-        "organization": "OpenAI",
-        "scores": [
-          78.2,
-          59.1,
-          75.1,
-          null,
-          94.4,
-          82.7,
-          58.7,
-          "200K",
-          "$2.50"
-        ],
-        "color": "#ff6b81",
-        "note": "Reasoning, math"
-      },
-      {
-        "name": "Gemini 3.1 Pro",
-        "organization": "Google",
-        "scores": [
-          80.6,
-          46.1,
-          68.5,
-          null,
-          94.3,
-          85.9,
-          51.4,
-          "2M",
-          "$2"
-        ],
-        "color": "#facc15",
-        "note": "ARC-AGI 77.1%, дешёвый"
-      },
-      {
-        "name": "Claude Sonnet 4.6",
-        "organization": "Anthropic",
-        "scores": [
-          79.6,
-          null,
-          null,
-          null,
-          null,
-          null,
-          null,
-          "200K",
-          "$3"
-        ],
-        "color": "#c084fc",
-        "note": "5× дешевле Opus"
-      },
-      {
-        "name": "GPT-5.3-Codex",
-        "organization": "OpenAI",
-        "scores": [
-          85,
-          57,
-          77.3,
-          null,
-          null,
-          null,
-          null,
-          "200K",
-          "$6"
-        ],
-        "color": "#ff6b81",
-        "note": "Coding specialist"
-      }
-    ],
-    "apaw_models": [
-      {
-        "name": "Kimi K2.6",
-        "organization": "APAW",
-        "scores": [
-          80.2,
-          58.6,
-          66.7,
-          87.2,
-          null,
-          83.2,
-          54,
-          "256K",
-          "$0.95"
-        ],
-        "color": "#00ff94",
-        "note": "devops, browser, architect (3)"
-      },
-      {
-        "name": "GLM-5.1",
-        "organization": "APAW",
-        "scores": [
-          null,
-          58.4,
-          63.5,
-          null,
-          86.2,
-          68.7,
-          null,
-          "200K",
-          "~$0.50"
-        ],
-        "color": "#00ff94",
-        "note": "12 agents! orchestrator, eval..."
-      },
-      {
-        "name": "V4-Pro Max",
-        "organization": "APAW",
-        "scores": [
-          80.6,
-          55.4,
-          67.9,
-          93.5,
-          90.1,
-          83.4,
-          48.2,
-          "1M",
-          "$0.42"
-        ],
-        "color": "#00d4ff",
-        "note": "planner, go-dev (рек.)"
-      },
-      {
-        "name": "Qwen3-Coder 480B",
-        "organization": "APAW",
-        "scores": [
-          66.5,
-          null,
-          null,
-          null,
-          null,
-          null,
-          null,
-          "256K",
-          "~$0.50"
-        ],
-        "color": "#00ff94",
-        "note": "7 coding agents"
-      },
-      {
-        "name": "MiniMax M2.5",
-        "organization": "APAW",
-        "scores": [
-          80.2,
-          51.3,
-          null,
-          null,
-          null,
-          76.3,
-          null,
-          "204K",
-          "$0.15"
-        ],
-        "color": "#00ff94",
-        "note": "frontend, skeptic, fixer (3)"
-      },
-      {
-        "name": "Nemotron Super",
-        "organization": "APAW",
-        "scores": [
-          60.5,
-          null,
-          null,
-          null,
-          null,
-          null,
-          null,
-          "1M",
-          "~$0.40"
-        ],
-        "color": "#00ff94",
-        "note": "6 agents (memory, history)"
-      }
-    ]
-  }
+  ]
 };
 
 // === MAP EMBEDDED_DATA -> original v3 format ===
@@ -2195,11 +1538,11 @@ const impactData = (EMBEDDED_DATA.impact_data || []).map(d => ({
 }));
 
 // ======================= RENDER =======================
-function switchTab(id) {
+function switchTab(id, el) { // Activates panel #tab-<id>; el is the clicked tab button (optional: looked up by its onclick attribute when omitted).
     document.querySelectorAll('.tab-panel').forEach(p=>p.classList.remove('active'));
     document.querySelectorAll('.tab-btn').forEach(b=>b.classList.remove('active'));
     document.getElementById('tab-'+id).classList.add('active');
-    event.target.classList.add('active');
+    (el || document.querySelector(`button[onclick*="switchTab('${id}'"]`)).classList.add('active'); // prefix match (no closing paren) so both switchTab('id') and switchTab('id', this) are found
     if(id==='impact') requestAnimationFrame(()=>setTimeout(drawChart,50));
 }
 
diff --git a/agent-evolution/research-dashboard.template.html b/agent-evolution/research-dashboard.template.html
index 32b118e..aa8678d 100644
--- a/agent-evolution/research-dashboard.template.html
+++ b/agent-evolution/research-dashboard.template.html
@@ -259,12 +259,12 @@
     </div>
 
     <div class="tabs" id="tabBar">
-        <button class="tab-btn active" onclick="switchTab('overview')">Обзор</button>
-        <button class="tab-btn" onclick="switchTab('groq')">Groq Free Tier</button>
-        <button class="tab-btn" onclick="switchTab('models')">Все модели</button>
-        <button class="tab-btn" onclick="switchTab('heatmap')">Матрица</button>
-        <button class="tab-btn" onclick="switchTab('recs')">Рекомендации</button>
-        <button class="tab-btn" onclick="switchTab('impact')">Анализ профита</button>
+        <button class="tab-btn active" onclick="switchTab('overview', this)">Обзор</button>
+        <button class="tab-btn" onclick="switchTab('groq', this)">Groq Free Tier</button>
+        <button class="tab-btn" onclick="switchTab('models', this)">Все модели</button>
+        <button class="tab-btn" onclick="switchTab('heatmap', this)">Матрица</button>
+        <button class="tab-btn" onclick="switchTab('recs', this)">Рекомендации</button>
+        <button class="tab-btn" onclick="switchTab('impact', this)">Анализ профита</button>
     </div>
 
     <!-- ========== TAB: OVERVIEW ========== -->
@@ -477,11 +477,11 @@ const impactData = (EMBEDDED_DATA.impact_data || []).map(d => ({
 }));
 
 // ======================= RENDER =======================
-function switchTab(id) {
+function switchTab(id, el) { // Activates panel #tab-<id>; el is the clicked tab button (optional: looked up by its onclick attribute when omitted).
     document.querySelectorAll('.tab-panel').forEach(p=>p.classList.remove('active'));
     document.querySelectorAll('.tab-btn').forEach(b=>b.classList.remove('active'));
     document.getElementById('tab-'+id).classList.add('active');
-    event.target.classList.add('active');
+    (el || document.querySelector(`button[onclick*="switchTab('${id}'"]`)).classList.add('active'); // prefix match (no closing paren) so both switchTab('id') and switchTab('id', this) are found
     if(id==='impact') requestAnimationFrame(()=>setTimeout(drawChart,50));
 }