diff --git a/.gitignore b/.gitignore
index 10dcd50..845da4e 100644
--- a/.gitignore
+++ b/.gitignore
@@ -40,6 +40,8 @@ __pycache__/
 agent-evolution/data/dashboard-data.json
 agent-evolution/data/state.json
 agent-evolution/data/model-benchmarks.json.bak
+*.db
+research-jobs.json
 landing/api/state.json
 landing/api/state.json.bak
 landing/api/dashboard-data.json
diff --git a/agent-evolution/api.py b/agent-evolution/api.py
new file mode 100644
index 0000000..6fd4b28
--- /dev/null
+++ b/agent-evolution/api.py
@@ -0,0 +1,491 @@
+"""
+Evolution Research API — FastAPI backend for agent-model evaluation jobs.
+
+Endpoints:
+  POST /api/research            → start background evaluation job
+  GET  /api/research/{id}       → job status & results
+  POST /api/research/cell       → evaluate single agent-model pair
+  GET  /api/real-fit-report     → serve real-fit-report.json (live from DB)
+  GET  /api/models              → list available models
+  GET  /api/evaluation/{agent}/{model} → detailed evaluation record
+  POST /api/evolve-agent/start  → start role-fit testing job (evolution-prompt + evolution-skeptic)
+"""
+
+import json
+import os
+import sqlite3
+import subprocess
+import time
+import uuid
+from datetime import datetime, timezone
+from pathlib import Path
+
+from fastapi import FastAPI, HTTPException
+from fastapi.responses import JSONResponse
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel
+
+app = FastAPI(title="Evolution Research API", version="1.1.0")
+# CORS policy: every origin, method and header is accepted.
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,  # NOTE(review): credentials together with a wildcard origin is very permissive — confirm intended
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# Filesystem locations, each overridable through the environment variable named in its os.environ.get() call.
+JOB_STATE_PATH = Path(os.environ.get("JOB_STATE_PATH", "/app/data/research-jobs.json"))  # job registry read/written by _load_jobs/_save_jobs
+REPORT_PATH = Path(os.environ.get("REPORT_PATH", "/app/data/real-fit-report.json"))  # static report JSON, served when no DB file exists
+META_PATH = Path(os.environ.get("META_PATH", "/app/kilo-meta.json"))  # agent metadata read by get_models
+EVOLUTION_PATH = Path(os.environ.get("EVOLUTION_PATH", "/app/data/evolution.json"))  # evolution data read by get_models
+ENGINE_PATH = Path(os.environ.get("ENGINE_PATH", "/app/scripts/real-fit-engine.py"))  # engine script; the worker re-reads the same env var itself
+DB_PATH = Path(os.environ.get("REAL_FIT_DB", REPORT_PATH.parent / "real-fit.db"))  # SQLite database; defaults to a file next to the report
+
+
+def _load_json(path: Path) -> dict:
+    """Return the JSON document stored at *path*, or ``{}`` when the file is absent."""
+    if not path.exists():
+        return {}
+    return json.loads(path.read_text(encoding="utf-8"))
+
+
+def _save_json(path: Path, data: dict) -> None:
+    """Write *data* to *path* as 2-space-indented JSON, creating parent directories; serialises first so a failure cannot truncate the file."""
+    path.parent.mkdir(parents=True, exist_ok=True)
+    path.write_text(json.dumps(data, indent=2), encoding="utf-8")
+
+
+def _load_jobs() -> dict:  # returns the job registry stored at JOB_STATE_PATH ({} when the file does not exist)
+    return _load_json(JOB_STATE_PATH)
+
+
+def _save_jobs(jobs: dict) -> None:  # overwrites the whole job registry at JOB_STATE_PATH with *jobs*
+    _save_json(JOB_STATE_PATH, jobs)
+
+
+class ResearchRequest(BaseModel):  # request body of POST /api/research
+    agent: str  # agent name, forwarded to the engine's --evaluate argument
+    models: list[str]  # model identifiers, comma-joined into the engine's --models argument
+
+
+class CellRequest(BaseModel):  # request body of POST /api/research/cell
+    agent: str  # agent name, forwarded to the engine's --evaluate argument
+    model: str  # single model identifier; stored on the job as a one-element models list
+
+
+class EvolveAgentRequest(BaseModel):  # request body of POST /api/evolve-agent/start
+    agent: str  # agent name, forwarded to the engine's --evaluate argument
+    models: list[str]  # model identifiers, comma-joined into the engine's --models argument
+
+
+def _spawn_engine_job(job_id: str, agent: str, models: list[str]) -> None:
+    """Start a background ``python3 -c`` worker that runs the engine for *agent* over *models* and records the outcome in the job-state file.
+
+    The worker marks the job 'running', runs the engine with --evaluate/--models/--report (presumably --report regenerates the report JSON; the engine is not visible here), then stores status ('done' on exit code 0, else 'error'), progress 100 and the captured stdout/stderr. job_id, agent and the model list are embedded via repr(). NOTE(review): the Popen handle is discarded, so nothing waits for the child — confirm acceptable.
+    """
+    model_arg = ",".join(models)  # the engine receives the model list as one comma-separated argument
+    subprocess.Popen(  # returns immediately; the caller never waits for the worker
+        ["python3", "-c", f"""
+import subprocess, json, time, os
+job_id = {repr(job_id)}
+job_state_path = os.environ.get('JOB_STATE_PATH', '/app/data/research-jobs.json')
+engine_path = os.environ.get('ENGINE_PATH', '/app/scripts/real-fit-engine.py')
+
+def load_jobs():
+    try:
+        with open(job_state_path) as f:
+            return json.load(f)
+    except Exception:
+        return {{}}
+
+def save_jobs(jobs):
+    with open(job_state_path, 'w') as f:
+        json.dump(jobs, f, indent=2)
+
+jobs = load_jobs()
+job = jobs.get(job_id)
+if job:
+    job['status'] = 'running'
+    job['updated_at'] = time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime())
+    save_jobs(jobs)
+
+cmd = ['python3', engine_path, '--evaluate', {repr(agent)}, '--models', {repr(model_arg)}, '--report']
+proc = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
+stdout, stderr = proc.communicate()
+
+jobs = load_jobs()
+job = jobs.get(job_id)
+if job:
+    job['status'] = 'done' if proc.returncode == 0 else 'error'
+    job['progress'] = 100
+    job['result'] = {{'returncode': proc.returncode, 'stdout': stdout, 'stderr': stderr}}
+    job['updated_at'] = time.strftime('%Y-%m-%dT%H:%M:%SZ', time.gmtime())
+    save_jobs(jobs)
+"""],
+        stdout=subprocess.DEVNULL,  # the worker's own output is discarded; results travel through the job-state file
+        stderr=subprocess.DEVNULL,  # errors raised by the worker script itself are therefore not visible anywhere
+    )
+
+
+@app.get("/api/models")
+def get_models():
+    """List every distinct model name found in the agent metadata and evolution files.
+
+    Names are gathered from each agent's "model" in META_PATH and, in
+    EVOLUTION_PATH, from each agent's current model and its recommendations.
+
+    Returns:
+        ``{"models": [...]}`` with the names de-duplicated and sorted.
+    """
+    candidates = [
+        entry.get("model", "") for entry in _load_json(META_PATH).get("agents", {}).values()
+    ]
+    for record in _load_json(EVOLUTION_PATH).get("agents", {}).values():
+        candidates.append(record.get("current", {}).get("model", ""))
+        candidates.extend(rec.get("model", "") for rec in record.get("recommendations", []))
+
+    # Missing or empty names are falsy and are dropped here.
+    unique = {name for name in candidates if name}
+    return {"models": sorted(unique)}
+
+
+@app.get("/api/evaluation/{agent}/{model}")
+def get_evaluation(agent: str, model: str):
+    """Return the most relevant stored evaluation for an agent-model pair, with its prompt.
+
+    The highest-scoring evaluation with a positive score wins (ties go to the
+    newest row); if there is none, the newest evaluation of any score is used.
+    Prompt fields come from the evaluation's own prompt row or, when that row
+    is missing or has no system prompt, from the newest test prompt stored
+    for the agent.
+
+    Args:
+        agent: Value matched against ``evaluations.agent_name``.
+        model: Value matched against ``evaluations.model``.
+
+    Returns:
+        The evaluation row as a dict extended with ``system_prompt``,
+        ``user_prompt``, ``expected_keywords`` and ``rubric``. The JSON text
+        in ``scores``, ``expected_keywords`` and ``rubric`` is decoded;
+        undecodable or NULL values become ``[]`` (keywords) or ``{}``.
+
+    Raises:
+        HTTPException: 404 when the database file does not exist or no
+            evaluation is stored for the pair.
+    """
+    db_path = str(DB_PATH)
+    if not os.path.exists(db_path):
+        raise HTTPException(status_code=404, detail="Evaluation database not found")
+
+    evaluation_sql = """
+        SELECT e.id, e.agent_name, e.model, e.prompt_id,
+               e.response, e.scores, e.total_score, e.explanation,
+               e.evaluator, e.latency_ms, e.tokens_prompt, e.tokens_response, e.evaluated_at
+        FROM evaluations e
+        WHERE e.agent_name = ? AND e.model = ?
+    """
+    prompt_sql = "SELECT system_prompt, user_prompt, expected_keywords, rubric FROM test_prompts"
+
+    conn = sqlite3.connect(db_path)
+    conn.row_factory = sqlite3.Row
+    # The finally clause closes the connection on every path, including a
+    # failing query (for example a missing table) and the 404 raised below.
+    try:
+        cursor = conn.cursor()
+
+        # Step 1: best positive-score evaluation for this agent-model pair.
+        cursor.execute(
+            evaluation_sql + " AND e.total_score > 0 ORDER BY e.total_score DESC, e.id DESC LIMIT 1",
+            (agent, model),
+        )
+        row = cursor.fetchone()
+        if not row:
+            # Fallback: newest evaluation even when its score is 0.
+            cursor.execute(evaluation_sql + " ORDER BY e.id DESC LIMIT 1", (agent, model))
+            row = cursor.fetchone()
+        if not row:
+            raise HTTPException(status_code=404, detail="Evaluation not found for this agent-model pair")
+        result = dict(row)
+
+        # Step 2: prompt data by prompt_id; a row without a system prompt is
+        # treated as missing so the per-agent fallback below applies.
+        prompt_row = None
+        if result.get("prompt_id"):
+            cursor.execute(prompt_sql + " WHERE id = ?", (result["prompt_id"],))
+            prompt_row = cursor.fetchone()
+            if prompt_row is not None and not prompt_row["system_prompt"]:
+                prompt_row = None
+        if prompt_row is None:
+            cursor.execute(
+                prompt_sql + " WHERE agent_name = ? ORDER BY id DESC LIMIT 1",
+                (agent,),
+            )
+            prompt_row = cursor.fetchone()
+    finally:
+        conn.close()
+
+    # Defaults are JSON text so the decode loop below treats every source alike.
+    result["system_prompt"] = ""
+    result["user_prompt"] = ""
+    result["expected_keywords"] = "[]"
+    result["rubric"] = "{}"
+    if prompt_row is not None:
+        result["system_prompt"] = prompt_row["system_prompt"] or ""
+        result["user_prompt"] = prompt_row["user_prompt"] or ""
+        result["expected_keywords"] = prompt_row["expected_keywords"] or "[]"
+        result["rubric"] = prompt_row["rubric"] or "{}"
+
+    for key in ("expected_keywords", "rubric", "scores"):
+        empty = [] if key == "expected_keywords" else {}
+        raw = result.get(key)
+        if raw is None:
+            result[key] = empty
+        elif isinstance(raw, str):
+            try:
+                result[key] = json.loads(raw)
+            except json.JSONDecodeError:
+                result[key] = empty
+    return result
+
+
+def _sync_agents_from_meta(db_path: Path, meta_path: Path | None = None) -> None:
+    """Insert agents listed in kilo-meta.json that the DB ``agents`` table lacks.
+
+    Args:
+        db_path: SQLite database file containing the ``agents`` table.
+        meta_path: Metadata file to read. When omitted, META_PATH is used if
+            it exists (the same file get_models reads); otherwise the legacy
+            location ``db_path.parent.parent.parent / "kilo-meta.json"`` is tried.
+    """
+    if meta_path is None:
+        legacy_path = db_path.parent.parent.parent / "kilo-meta.json"
+        meta_path = META_PATH if META_PATH.exists() else legacy_path
+    if not meta_path.exists():
+        return
+    with open(meta_path, encoding="utf-8") as f:
+        meta = json.load(f)
+    now = datetime.now(timezone.utc).isoformat()
+    conn = sqlite3.connect(str(db_path))
+    try:  # close the connection even when a statement fails
+        existing = {r[0] for r in conn.execute("SELECT name FROM agents")}
+        # Only agents missing from the table are inserted; existing rows stay untouched.
+        rows = [
+            (name, info.get("description", ""), info.get("category", "meta"),
+             info.get("model", ""), info.get("color", "#6B7280"), now)
+            for name, info in meta.get("agents", {}).items() if name not in existing
+        ]
+        conn.executemany("INSERT OR IGNORE INTO agents (name, description, category, current_model, color, updated) VALUES (?, ?, ?, ?, ?, ?)", rows)
+        conn.commit()
+    finally:
+        conn.close()
+
+
+def _build_report_from_db(db_path: Path) -> dict:
+    """Build the real-fit report from the SQLite DB.
+
+    Evaluations are skipped when their score is not positive, their evaluator
+    name contains ``rubric_v1``, or their response is an empty string or
+    contains ``[HTTP ``. Per agent-model pair the reported score is the highest
+    one from the most preferred evaluator (evolution-skeptic, then rubric_v2,
+    then any other).
+
+    Returns:
+        A dict with ``generated``, ``source``, ``total_evaluations``, ``agents``
+        (per-agent scores, info and best model) and ``fit_scores`` (the
+        top-scoring model per agent with an explanation).
+    """
+    _sync_agents_from_meta(db_path)
+    usable_filter = """
+        WHERE total_score > 0
+          AND evaluator NOT LIKE '%rubric_v1%'
+          AND (response IS NULL
+               OR (response NOT LIKE '%[HTTP %' AND response != ''))
+    """
+    conn = sqlite3.connect(str(db_path))
+    conn.row_factory = sqlite3.Row
+    try:  # close the connection even when a query fails
+        cursor = conn.cursor()
+        cursor.execute("SELECT name, description, category, current_model FROM agents")
+        agents_meta = {row["name"]: dict(row) for row in cursor.fetchall()}
+
+        # Rows arrive ordered by evaluator preference, then by score, so the
+        # first row seen for an agent-model pair is the one to keep.
+        cursor.execute(
+            "SELECT agent_name, model, total_score FROM evaluations"
+            + usable_filter
+            + """
+            ORDER BY agent_name, model,
+                CASE evaluator
+                    WHEN 'evolution-skeptic' THEN 0
+                    WHEN 'rubric_v2' THEN 1
+                    ELSE 2
+                END,
+                total_score DESC
+            """
+        )
+        best_evals = {}
+        for row in cursor.fetchall():
+            best_evals.setdefault(row["agent_name"], {}).setdefault(row["model"], row["total_score"])
+
+        # Highest score per agent-model pair across all usable evaluators.
+        cursor.execute(
+            "SELECT agent_name, model, MAX(total_score) AS best_score FROM evaluations"
+            + usable_filter
+            + " GROUP BY agent_name, model"
+        )
+        grouped = cursor.fetchall()
+    finally:
+        conn.close()
+
+    # Keep only the top-scoring model per agent. Assigning every grouped row
+    # would let whichever model came last replace a better one.
+    top_rows = {}
+    for row in grouped:
+        current = top_rows.get(row["agent_name"])
+        if current is None or row["best_score"] > current["best_score"]:
+            top_rows[row["agent_name"]] = row
+    fit_scores = {
+        agent_name: {
+            "model": row["model"],
+            "fit": row["best_score"],
+            "explanation": (
+                f"Best model for {agent_name} is {row['model']} "
+                f"with best score {row['best_score']:.1f}. "
+                "Evaluator preference: evolution-skeptic > rubric_v2 > rubric_v1 (ignored HTTP errors)."
+            ),
+        }
+        for agent_name, row in top_rows.items()
+    }
+
+    agents_report = {}
+    for agent_name, meta in agents_meta.items():
+        evals = best_evals.get(agent_name, {})
+        best_model = max(evals, key=evals.get) if evals else ""
+        agents_report[agent_name] = {
+            "name": agent_name,
+            "evaluations": evals,
+            "info": [meta.get("description") or "", meta.get("category") or "", meta.get("current_model") or ""],
+            "best_model": best_model,
+            "best_score": evals[best_model] if evals else 0.0,
+        }
+
+    return {
+        "generated": time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime()),
+        "source": "real-fit-engine-db-filtered",
+        "total_evaluations": sum(len(evals) for evals in best_evals.values()),
+        "agents": agents_report,
+        "fit_scores": fit_scores,
+    }
+
+
+@app.get("/api/real-fit-report")
+def get_real_fit_report():
+    """Serve the report built live from the SQLite DB, or the static JSON report when no DB file exists."""
+    if not os.path.exists(str(DB_PATH)):
+        return _load_json(REPORT_PATH)
+    return _build_report_from_db(DB_PATH)
+
+
+@app.post("/api/research")
+def start_research(req: ResearchRequest):
+    """Register a pending evaluation job for one agent across several models and launch its worker.
+
+    Returns the new job id together with the echoed agent and model list.
+    """
+    stamp_format = "%Y-%m-%dT%H:%M:%SZ"
+    job_id = str(uuid.uuid4())
+    registry = _load_jobs()
+    record = {"id": job_id, "agent": req.agent, "models": req.models}
+    record.update(status="pending", progress=0, result=None)
+    record["created_at"] = time.strftime(stamp_format, time.gmtime())
+    record["updated_at"] = time.strftime(stamp_format, time.gmtime())
+    registry[job_id] = record
+    _save_jobs(registry)
+
+    # Fire-and-forget: the worker updates the persisted record on its own.
+    _spawn_engine_job(job_id, req.agent, req.models)
+    return {"job_id": job_id, "status": "pending", "agent": req.agent, "models": req.models}
+
+
+def _extract_scores_from_report(agent: str, models: list[str]) -> list[dict]:
+    """Look up *agent*'s per-model scores in the JSON report at REPORT_PATH.
+
+    Each entry is ``{"model", "score", "pending"}``; a model absent from the
+    report gets score 0, and any score equal to 0 is flagged as pending.
+    """
+    per_model = _load_json(REPORT_PATH).get("agents", {}).get(agent, {}).get("evaluations", {})
+    return [
+        {"model": name, "score": (value := per_model.get(name, 0)), "pending": value == 0}
+        for name in models
+    ]
+
+
+@app.get("/api/research/{job_id}")
+def get_research(job_id: str):
+    """Return the stored job record (404 if unknown); finished jobs also get per-model scores from the report."""
+    job = _load_jobs().get(job_id)
+    if not job:
+        raise HTTPException(status_code=404, detail="Job not found")
+    if job.get("result") is not None and job.get("status") == "done":
+        job["models_scored"] = _extract_scores_from_report(job["agent"], job.get("models", []))
+    return job
+
+
+@app.post("/api/research/cell")
+def research_cell(req: CellRequest):
+    """Queue an evaluation of a single agent-model pair and launch its worker.
+
+    The job is stored with a one-element ``models`` list so it has the same
+    shape as jobs created through POST /api/research.
+    """
+    def utc_stamp() -> str:
+        return time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime())
+
+    job_id = str(uuid.uuid4())
+    all_jobs = _load_jobs()
+    all_jobs[job_id] = dict(
+        id=job_id, agent=req.agent, models=[req.model], status="pending", progress=0,
+        result=None, created_at=utc_stamp(), updated_at=utc_stamp(),
+    )
+    _save_jobs(all_jobs)
+    _spawn_engine_job(job_id, req.agent, [req.model])
+    return {"job_id": job_id, "status": "pending", "agent": req.agent, "model": req.model}
+
+
+@app.post("/api/evolve-agent/start")
+def start_evolve_agent(req: EvolveAgentRequest):
+    """Queue a role-fit evaluation job of type ``evolve-agent`` and launch its worker.
+
+    Currently a placeholder: the job is handed to the same real-fit-engine
+    worker that the research endpoints use. The planned full pipeline is:
+
+    1. evolution-prompt generates role-specific stress-test prompts from the
+       agent definition (.kilo/agents/{agent}.md).
+    2. Every model in ``models`` is tested with the same prompt through the
+       Ollama API and its response is stored.
+    3. evolution-skeptic evaluates each response with per-dimension rubric
+       scoring.
+    4. Results are stored in SQLite and the report is regenerated.
+
+    Returns:
+        The new job id with status ``pending`` and the echoed agent and models.
+    """
+    job_id = str(uuid.uuid4())
+    queue = _load_jobs()
+    timestamp_keys = ("created_at", "updated_at")
+    entry = {
+        "id": job_id,
+        "type": "evolve-agent",
+        "agent": req.agent,
+        "models": req.models,
+        "status": "pending",
+        "progress": 0,
+        "result": None,
+    }
+    for key in timestamp_keys:
+        entry[key] = time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime())
+    queue[job_id] = entry
+    _save_jobs(queue)
+    _spawn_engine_job(job_id, req.agent, req.models)  # placeholder: reuses the generic engine worker
+    return {"job_id": job_id, "status": "pending", "agent": req.agent, "models": req.models}
\ No newline at end of file
diff --git a/agent-evolution/archive/index.html b/agent-evolution/archive/index.html
new file mode 100644
index 0000000..7174e12
--- /dev/null
+++ b/agent-evolution/archive/index.html
@@ -0,0 +1,7031 @@
+<!DOCTYPE html>
+<html lang="ru">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>APAW Agent Evolution Dashboard</title>
+    <link href="https://fonts.googleapis.com/css2?family=JetBrains+Mono:wght@300;400;500;600;700&family=Inter:wght@300;400;500;600;700;800&display=swap" rel="stylesheet">
+    <script src="https://cdn.jsdelivr.net/npm/chart.js@4.4.7/dist/chart.umd.min.js"></script>
+    <script src="https://cdn.jsdelivr.net/npm/chartjs-plugin-datalabels@2.2.0"></script>
+    <style>
+        :root {
+            --bg-deep: #0a0f1a;
+            --bg-panel: #0f1525;
+            --bg-card: #141c2e;
+            --bg-card-hover: #1a2540;
+            --border: #1e2d45;
+            --border-bright: #2a4060;
+            --text-primary: #e8f1ff;
+            --text-secondary: #8ba3c0;
+            --text-muted: #5a7090;
+            --accent-cyan: #00d4ff;
+            --accent-green: #00ff94;
+            --accent-orange: #ff9f43;
+            --accent-red: #ff4757;
+            --accent-purple: #a855f7;
+            --accent-blue: #3b82f6;
+            --accent-yellow: #facc15;
+            --glow-cyan: rgba(0,212,255,0.15);
+            --glow-green: rgba(0,255,148,0.1);
+            --glow-purple: rgba(168,85,247,0.1);
+        }
+        * { margin: 0; padding: 0; box-sizing: border-box; }
+        body {
+            font-family: 'Inter', sans-serif;
+            background: var(--bg-deep);
+            color: var(--text-primary);
+            min-height: 100vh;
+        }
+        body::before {
+            content: '';
+            position: fixed;
+            inset: 0;
+            background: 
+                radial-gradient(ellipse at 20% 20%, rgba(0,212,255,0.08) 0%, transparent 50%),
+                radial-gradient(ellipse at 80% 80%, rgba(168,85,247,0.06) 0%, transparent 50%);
+            pointer-events: none;
+            z-index: 0;
+        }
+        .container {
+            max-width: 1600px;
+            margin: 0 auto;
+            padding: 24px 16px;
+            position: relative;
+            z-index: 1;
+        }
+
+        /* Header */
+        .header { text-align: center; margin-bottom: 32px; }
+        .header h1 {
+            font-size: 2.2em;
+            font-weight: 800;
+            background: linear-gradient(135deg, var(--accent-cyan), var(--accent-green));
+            -webkit-background-clip: text;
+            -webkit-text-fill-color: transparent;
+            margin-bottom: 8px;
+        }
+        .header .sub {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.85em;
+            color: var(--text-muted);
+        }
+        .header .meta {
+            display: flex;
+            justify-content: center;
+            gap: 24px;
+            margin-top: 12px;
+            font-size: 0.8em;
+            color: var(--text-secondary);
+        }
+
+        /* Tabs */
+        .tabs {
+            display: flex;
+            gap: 4px;
+            background: var(--bg-panel);
+            border: 1px solid var(--border);
+            border-radius: 12px;
+            padding: 4px;
+            margin-bottom: 24px;
+            overflow-x: auto;
+        }
+        .tab-btn {
+            flex: 1;
+            min-width: 100px;
+            padding: 10px 16px;
+            background: none;
+            border: none;
+            color: var(--text-secondary);
+            font-family: 'Inter', sans-serif;
+            font-size: 0.85em;
+            font-weight: 600;
+            border-radius: 8px;
+            cursor: pointer;
+            transition: all 0.25s;
+            white-space: nowrap;
+        }
+        .tab-btn:hover { color: var(--text-primary); background: var(--bg-card); }
+        .tab-btn.active {
+            color: var(--bg-deep);
+            background: linear-gradient(135deg, var(--accent-cyan), var(--accent-green));
+            box-shadow: 0 0 20px var(--glow-cyan);
+        }
+        .tab-panel { display: none; animation: fadeUp 0.4s ease-out; }
+        .tab-panel.active { display: block; }
+        @keyframes fadeUp {
+            from { opacity: 0; transform: translateY(16px); }
+            to { opacity: 1; transform: translateY(0); }
+        }
+
+        /* Stats */
+        .stats-row {
+            display: grid;
+            grid-template-columns: repeat(auto-fit, minmax(200px, 1fr));
+            gap: 14px;
+            margin-bottom: 24px;
+        }
+        .stat-card {
+            background: var(--bg-card);
+            border: 1px solid var(--border);
+            border-radius: 10px;
+            padding: 18px;
+            position: relative;
+            overflow: hidden;
+            transition: all 0.3s;
+        }
+        .stat-card:hover {
+            border-color: var(--accent-cyan);
+            transform: translateY(-2px);
+            box-shadow: 0 8px 32px var(--glow-cyan);
+        }
+        .stat-label {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.65em;
+            color: var(--text-muted);
+            text-transform: uppercase;
+            letter-spacing: 1.5px;
+            margin-bottom: 6px;
+        }
+        .stat-value { font-size: 2em; font-weight: 800; }
+        .stat-sub { font-size: 0.75em; color: var(--text-secondary); margin-top: 4px; }
+        .grad-cyan { background: linear-gradient(135deg, var(--accent-cyan), var(--accent-green)); -webkit-background-clip: text; -webkit-text-fill-color: transparent; }
+        .grad-orange { background: linear-gradient(135deg, var(--accent-orange), var(--accent-yellow)); -webkit-background-clip: text; -webkit-text-fill-color: transparent; }
+        .grad-purple { background: linear-gradient(135deg, var(--accent-purple), #e879f9); -webkit-background-clip: text; -webkit-text-fill-color: transparent; }
+        .grad-green { background: linear-gradient(135deg, var(--accent-green), #4ade80); -webkit-background-clip: text; -webkit-text-fill-color: transparent; }
+        .grad-red { background: linear-gradient(135deg, var(--accent-red), #ff6b81); -webkit-background-clip: text; -webkit-text-fill-color: transparent; }
+
+        /* Agent Grid */
+        .agents-grid {
+            display: grid;
+            grid-template-columns: repeat(auto-fill, minmax(340px, 1fr));
+            gap: 16px;
+        }
+        .agent-card {
+            background: var(--bg-card);
+            border: 1px solid var(--border);
+            border-radius: 12px;
+            padding: 20px;
+            transition: all 0.3s;
+            position: relative;
+            overflow: hidden;
+        }
+        .agent-card:hover {
+            border-color: var(--accent-cyan);
+            transform: translateY(-2px);
+            box-shadow: 0 8px 32px var(--glow-cyan);
+        }
+        .agent-card.has-history { border-left: 3px solid var(--accent-green); }
+        .agent-card.needs-update { border-left: 3px solid var(--accent-orange); }
+        .agent-card.is-new { border-left: 3px solid var(--accent-purple); }
+
+        .agent-header {
+            display: flex;
+            justify-content: space-between;
+            align-items: flex-start;
+            margin-bottom: 12px;
+        }
+        .agent-name {
+            font-weight: 700;
+            font-size: 1.05em;
+            display: flex;
+            align-items: center;
+            gap: 8px;
+        }
+        .agent-color {
+            width: 12px;
+            height: 12px;
+            border-radius: 3px;
+            flex-shrink: 0;
+        }
+        .agent-category {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.7em;
+            padding: 3px 8px;
+            border-radius: 12px;
+            background: rgba(0,212,255,0.1);
+            color: var(--accent-cyan);
+        }
+        .agent-model {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.78em;
+            color: var(--accent-green);
+            margin-bottom: 8px;
+            display: flex;
+            align-items: center;
+            gap: 6px;
+        }
+        .agent-provider {
+            font-size: 0.7em;
+            padding: 2px 6px;
+            border-radius: 4px;
+            background: rgba(0,255,148,0.1);
+            color: var(--accent-green);
+        }
+        .agent-desc {
+            font-size: 0.85em;
+            color: var(--text-secondary);
+            line-height: 1.5;
+            margin-bottom: 12px;
+        }
+        .agent-meta {
+            display: grid;
+            grid-template-columns: repeat(3, 1fr);
+            gap: 8px;
+            padding-top: 12px;
+            border-top: 1px solid var(--border);
+        }
+        .agent-meta-item {
+            text-align: center;
+        }
+        .agent-meta-label {
+            font-size: 0.6em;
+            color: var(--text-muted);
+            text-transform: uppercase;
+            letter-spacing: 0.5px;
+        }
+        .agent-meta-value {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.9em;
+            font-weight: 600;
+            color: var(--text-primary);
+        }
+        .agent-history {
+            margin-top: 12px;
+            padding-top: 12px;
+            border-top: 1px dashed var(--border);
+        }
+        .history-title {
+            font-size: 0.7em;
+            color: var(--text-muted);
+            text-transform: uppercase;
+            margin-bottom: 8px;
+        }
+        .history-item {
+            display: flex;
+            align-items: center;
+            gap: 10px;
+            font-size: 0.75em;
+            padding: 6px 0;
+            border-bottom: 1px solid rgba(30,45,69,0.5);
+        }
+        .history-item:last-child { border-bottom: none; }
+        .history-date {
+            font-family: 'JetBrains Mono', monospace;
+            color: var(--text-muted);
+            min-width: 100px;
+        }
+        .history-type {
+            padding: 2px 6px;
+            border-radius: 4px;
+            font-size: 0.85em;
+        }
+        .history-type.model_change { background: rgba(0,212,255,0.15); color: var(--accent-cyan); }
+        .history-type.prompt_change { background: rgba(168,85,247,0.15); color: var(--accent-purple); }
+        .history-type.agent_created { background: rgba(0,255,148,0.15); color: var(--accent-green); }
+
+        /* Category Section */
+        .category-section { margin-bottom: 32px; }
+        .category-header {
+            display: flex;
+            align-items: center;
+            gap: 10px;
+            margin-bottom: 16px;
+            padding-bottom: 8px;
+            border-bottom: 1px solid var(--border);
+        }
+        .category-title {
+            font-size: 1.1em;
+            font-weight: 700;
+        }
+        .category-count {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.7em;
+            padding: 3px 8px;
+            border-radius: 12px;
+            background: rgba(168,85,247,0.15);
+            color: var(--accent-purple);
+        }
+
+        /* Evolution Timeline */
+        .timeline-wrap {
+            background: var(--bg-card);
+            border: 1px solid var(--border);
+            border-radius: 12px;
+            padding: 24px;
+            margin-bottom: 24px;
+        }
+        .timeline-title {
+            font-size: 1.1em;
+            font-weight: 700;
+            margin-bottom: 16px;
+        }
+        .timeline {
+            position: relative;
+            padding-left: 24px;
+        }
+        .timeline::before {
+            content: '';
+            position: absolute;
+            left: 8px;
+            top: 0;
+            bottom: 0;
+            width: 2px;
+            background: var(--border);
+        }
+        .timeline-item {
+            position: relative;
+            padding: 12px 0 12px 24px;
+            border-bottom: 1px solid var(--border);
+        }
+        .timeline-item:last-child { border-bottom: none; }
+        .timeline-item::before {
+            content: '';
+            position: absolute;
+            left: -20px;
+            top: 18px;
+            width: 12px;
+            height: 12px;
+            border-radius: 50%;
+            background: var(--accent-cyan);
+            border: 2px solid var(--border);
+        }
+        .timeline-date {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.75em;
+            color: var(--text-muted);
+        }
+        .timeline-content {
+            font-size: 0.9em;
+            margin-top: 4px;
+        }
+        .timeline-agent {
+            font-weight: 600;
+            color: var(--accent-cyan);
+        }
+        .timeline-change {
+            color: var(--text-secondary);
+        }
+
+        /* Filter Row */
+        .filter-row {
+            display: flex;
+            gap: 8px;
+            flex-wrap: wrap;
+            margin-bottom: 16px;
+        }
+        .filter-btn {
+            padding: 6px 14px;
+            background: var(--bg-card);
+            border: 1px solid var(--border);
+            color: var(--text-secondary);
+            border-radius: 20px;
+            font-size: 0.8em;
+            cursor: pointer;
+            transition: all 0.2s;
+            font-family: 'Inter', sans-serif;
+        }
+        .filter-btn:hover, .filter-btn.active {
+            border-color: var(--accent-cyan);
+            color: var(--accent-cyan);
+            background: rgba(0,212,255,0.05);
+        }
+
+        /* Search */
+        .search-box {
+            position: relative;
+            margin-bottom: 20px;
+        }
+        .search-input {
+            width: 100%;
+            padding: 12px 16px 12px 40px;
+            background: var(--bg-card);
+            border: 1px solid var(--border);
+            border-radius: 8px;
+            color: var(--text-primary);
+            font-family: 'Inter', sans-serif;
+            font-size: 0.9em;
+        }
+        .search-input:focus {
+            outline: none;
+            border-color: var(--accent-cyan);
+        }
+        .search-icon {
+            position: absolute;
+            left: 14px;
+            top: 50%;
+            transform: translateY(-50%);
+            color: var(--text-muted);
+        }
+
+        /* Model Matrix */
+        .matrix-wrap {
+            overflow-x: auto;
+            border-radius: 12px;
+            border: 1px solid var(--border);
+            background: var(--bg-card);
+            padding: 20px;
+        }
+        .matrix-title {
+            font-size: 1.1em;
+            font-weight: 700;
+            margin-bottom: 16px;
+        }
+        .matrix-table {
+            width: 100%;
+            border-collapse: collapse;
+            font-size: 0.8em;
+        }
+        .matrix-table th {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.7em;
+            color: var(--text-muted);
+            text-transform: uppercase;
+            padding: 10px 8px;
+            text-align: left;
+            border-bottom: 2px solid var(--border);
+            position: sticky;
+            top: 0;
+            background: var(--bg-panel);
+        }
+        .matrix-table td {
+            padding: 10px 8px;
+            border-bottom: 1px solid var(--border);
+        }
+        .matrix-table tr:hover td {
+            background: var(--bg-card-hover);
+        }
+        .score-bar {
+            display: flex;
+            align-items: center;
+            gap: 6px;
+        }
+        .score-bg {
+            width: 50px;
+            height: 5px;
+            background: var(--border);
+            border-radius: 3px;
+            overflow: hidden;
+        }
+        .score-fill {
+            height: 100%;
+            border-radius: 3px;
+        }
+        .score-fill.high { background: linear-gradient(90deg, var(--accent-green), #00ff94); }
+        .score-fill.medium { background: linear-gradient(90deg, var(--accent-orange), #ffc048); }
+        .score-fill.low { background: linear-gradient(90deg, var(--accent-red), #ff6b81); }
+
+        /* Heatmap */
+        .hm-wrap { overflow-x:auto; border-radius:11px; border:1px solid var(--border); background:var(--bg-card); padding:18px; margin-bottom:26px; }
+        .hm-title { font-weight:700; font-size:1.05em; }
+        .hm-sub { font-size:.76em; color:var(--text-muted); margin-bottom:14px; }
+        .hm-table { border-collapse:separate; border-spacing:2px; width:100%; }
+        .hm-table th { font-family:'JetBrains Mono',monospace; font-size:.62em; color:var(--text-muted); padding:8px 5px; text-align:center; white-space:nowrap; vertical-align:bottom; }
+        .hm-table th.hm-role { text-align:left; min-width:140px; font-size:.68em; padding-left:10px; }
+        .hm-table td { text-align:center; padding:6px 4px; font-family:'JetBrains Mono',monospace; font-size:.72em; font-weight:700; border-radius:6px; cursor:pointer; transition:all .15s cubic-bezier(.4,0,.2,1); min-width:42px; position:relative; line-height:1.4; }
+        .hm-table td:hover { transform:scale(1.1); z-index:2; box-shadow:0 4px 12px rgba(0,0,0,.35); }
+        .hm-table td.hm-r { text-align:left; font-family:'Inter',sans-serif; font-size:.82em; font-weight:600; color:var(--text-primary); cursor:default; padding-left:10px; }
+        .hm-table td.hm-r:hover { transform:none; box-shadow:none; }
+        .hm-star { position:absolute; top:2px; right:2px; font-size:.65em; text-shadow:0 1px 2px rgba(0,0,0,.5); }
+        .hm-cur { box-shadow:inset 0 0 0 2px var(--accent-cyan), 0 0 8px rgba(0,212,255,.35); border-radius:6px; }
+        .hm-cur::after { content:''; position:absolute; bottom:2px; left:50%; transform:translateX(-50%); width:8px; height:3px; background:var(--accent-cyan); border-radius:2px; }
+        .hm-if-warn { position:absolute; top:2px; left:2px; font-size:.6em; opacity:.8; }
+
+        /* Smooth gradient legend bar */
+        .hm-legend-wrap { margin-top:18px; padding:0 4px; }
+        .hm-legend-track { position:relative; height:22px; border-radius:11px; background:linear-gradient(90deg, rgba(0,255,148,.85) 0%, rgba(0,212,255,.75) 20%, rgba(59,130,246,.6) 40%, rgba(168,85,247,.45) 58%, rgba(255,159,67,.35) 75%, rgba(255,71,87,.3) 88%, rgba(90,104,128,.2) 100%); box-shadow:inset 0 1px 3px rgba(0,0,0,.3); }
+        .hm-legend-labels { display:flex; justify-content:space-between; align-items:center; margin-top:8px; padding:0 4px; }
+        .hm-legend-labels span { font-size:.68em; font-family:'JetBrains Mono',monospace; color:var(--text-muted); }
+        .hm-legend-left { color:var(--accent-green); }
+        .hm-legend-right { color:var(--accent-red); }
+        .hm-legend-marks { display:flex; justify-content:space-between; padding:0 2px; margin-top:3px; }
+        .hm-legend-marks span { font-size:.58em; font-family:'JetBrains Mono',monospace; color:var(--text-muted); min-width:20px; text-align:center; }
+
+        /* Heatmap Modal Tabs */
+        .hm-modal-tabs { display:flex; gap:3px; background:var(--bg-panel); border-bottom:1px solid var(--border); padding:4px 18px; }
+        .hm-tab-btn { /* tab button inside the heatmap modal; generic sans-serif fallback matches the other Inter declarations in this sheet */ padding:8px 16px; background:none; border:none; color:var(--text-secondary); font-family:'Inter',sans-serif; font-size:.82em; font-weight:600; border-radius:8px; cursor:pointer; transition:all .25s; }
+        .hm-tab-btn.active { color:var(--bg-deep); background:linear-gradient(135deg,var(--accent-cyan),var(--accent-green)); }
+        .hm-tab-content { display:none; }
+        .hm-tab-content.active { display:block; }
+        .hm-model-timeline { display:flex; flex-direction:column; gap:12px; }
+        .hm-tl-item { display:flex; gap:14px; align-items:center; padding:10px; background:var(--bg-deep); border-radius:8px; border-left:3px solid var(--accent-cyan); }
+        .hm-tl-date { font-family:'JetBrains Mono',monospace; font-size:.72em; color:var(--text-muted); min-width:100px; }
+        .hm-tl-change { display:flex; align-items:center; gap:8px; }
+        .hm-tl-from { text-decoration:line-through; color:#ff6b81; background:rgba(255,71,87,.08); padding:2px 6px; border-radius:4px; }
+        .hm-tl-arrow { color:var(--accent-green); }
+        .hm-tl-to { color:var(--accent-green); background:rgba(0,255,148,.08); padding:2px 6px; border-radius:4px; font-weight:600; }
+        .hm-tl-current { border-left-color:var(--accent-green); background:rgba(0,255,148,.05); }
+        .hm-no-data { color:var(--text-muted); font-size:.9em; padding:16px; text-align:center; }
+        .hm-capabilities { display:flex; flex-wrap:wrap; gap:6px; }
+        .hm-cap-tag { padding:4px 10px; background:rgba(0,212,255,.1); border:1px solid var(--border); border-radius:16px; font-size:.78em; color:var(--accent-cyan); }
+        .hm-agent-desc { font-size:.9em; color:var(--text-secondary); line-height:1.5; margin-bottom:14px; padding:12px; background:var(--bg-deep); border-radius:8px; }
+        .hm-model-tl-score { margin-left:auto; font-family:'JetBrains Mono',monospace; font-size:.8em; color:var(--accent-cyan); }
+
+        /* Tooltip */
+        #ttOverlay { display:none; position:fixed; top:0;left:0;right:0;bottom:0; z-index:999; pointer-events:none; }
+        #ttOverlay.show { display:block; }
+        #ttBox { position:absolute; background:var(--bg-panel); border:1px solid var(--accent-cyan); border-radius:9px; padding:12px 16px; max-width:300px; box-shadow:0 10px 32px rgba(0,0,0,.55); z-index:1000; }
+        #ttBox h4 { color:var(--accent-cyan); font-size:.9em; margin-bottom:4px; }
+        #ttBox p { font-size:.78em; color:var(--text-secondary); line-height:1.45; }
+
+        /* Export */
+        .actions-row {
+            display: flex;
+            gap: 10px;
+            margin-bottom: 20px;
+        }
+        .action-btn {
+            padding: 8px 16px;
+            background: var(--bg-card);
+            border: 1px solid var(--border);
+            color: var(--text-primary);
+            border-radius: 8px;
+            font-family: 'Inter', sans-serif;
+            font-size: 0.85em;
+            cursor: pointer;
+            transition: all 0.25s;
+            display: inline-flex;
+            align-items: center;
+            gap: 8px;
+        }
+        .action-btn:hover {
+            border-color: var(--accent-cyan);
+            color: var(--accent-cyan);
+        }
+        .action-btn.primary {
+            background: linear-gradient(135deg, rgba(0,212,255,0.15), rgba(0,255,148,0.1));
+            border-color: var(--accent-cyan);
+            color: var(--accent-cyan);
+        }
+        .action-btn.primary:hover {
+            box-shadow: 0 0 20px var(--glow-cyan);
+        }
+
+        /* Modal */
+        .modal {
+            display: none;
+            position: fixed;
+            inset: 0;
+            background: rgba(0,0,0,0.7);
+            z-index: 9999;
+            justify-content: center;
+            align-items: center;
+            padding: 20px;
+        }
+        .modal.show { display: flex; }
+        .modal-content {
+            background: var(--bg-panel);
+            border: 1px solid var(--accent-cyan);
+            border-radius: 14px;
+            max-width: 900px;
+            width: 100%;
+            max-height: 85vh;
+            overflow: hidden;
+            display: flex;
+            flex-direction: column;
+            box-shadow: 0 20px 60px rgba(0,0,0,0.5);
+        }
+        .modal-header {
+            display: flex;
+            justify-content: space-between;
+            align-items: center;
+            padding: 18px 22px;
+            border-bottom: 1px solid var(--border);
+        }
+        .modal-title { font-weight: 700; font-size: 1.05em; }
+        .modal-actions { display: flex; gap: 8px; }
+        .modal-body {
+            flex: 1;
+            overflow: auto;
+            padding: 18px 22px;
+        }
+        .modal-pre {
+            font-family: 'JetBrains Mono', monospace;
+            font-size: 0.78em;
+            line-height: 1.6;
+            color: var(--accent-green);
+            white-space: pre-wrap;
+        }
+
+        /* Impact Tab */
+        .chart-wrap { background: var(--bg-card); border: 1px solid var(--border); border-radius: 12px; padding: 20px; margin-bottom: 24px; }
+        .chart-title { font-size: 1.1em; font-weight: 700; margin-bottom: 16px; }
+        .chart-sub { font-size: 0.76em; color: var(--text-muted); margin-bottom: 14px; }
+        .chart-placeholder { text-align: center; padding: 60px 20px; color: var(--text-muted); font-size: 0.95em; }
+        .chart-container { position:relative; height:280px; width:100%; }
+        .chart-container-sm { position:relative; height:240px; width:100%; }
+
+        /* Recommendation Cards: .rec-card is position:relative so an absolutely positioned .rec-checkbox anchors to the card at all times; without it the card only becomes a containing block while the :hover transform is active */
+        .rec-card { position: relative; background: var(--bg-card); border: 1px solid var(--border); border-radius: 12px; padding: 20px; transition: all 0.3s; margin-bottom: 16px; }
+        .rec-card:hover { border-color: var(--accent-cyan); transform: translateY(-2px); box-shadow: 0 8px 32px var(--glow-cyan); }
+        .rec-hdr { display: flex; justify-content: space-between; align-items: center; margin-bottom: 14px; }
+        .rec-agent { font-weight: 700; font-size: 1.1em; display: flex; align-items: center; gap: 10px; }
+        .rec-agent-name { color: var(--text-primary); }
+        .impact-badge { font-family: 'JetBrains Mono', monospace; font-size: 0.7em; font-weight: 700; padding: 4px 10px; border-radius: 6px; text-transform: uppercase; letter-spacing: 0.5px; }
+        .impact-badge.critical { background: rgba(255,71,87,0.2); color: #ff6b81; border: 1px solid rgba(255,71,87,0.4); }
+        .impact-badge.high { background: rgba(255,159,67,0.2); color: #ffc048; border: 1px solid rgba(255,159,67,0.4); }
+        .impact-badge.medium { background: rgba(59,130,246,0.2); color: #60a5fa; border: 1px solid rgba(59,130,246,0.4); }
+        .impact-badge.low { background: rgba(0,255,148,0.15); color: #4ade80; border: 1px solid rgba(0,255,148,0.3); }
+        .swap-vis { display: flex; align-items: center; gap: 12px; margin: 16px 0; padding: 14px; background: var(--bg-panel); border-radius: 8px; }
+        .swap-from, .swap-to { flex: 1; padding: 10px 14px; border-radius: 6px; font-family: 'JetBrains Mono', monospace; font-size: 0.8em; }
+        .swap-from { background: rgba(255,71,87,0.1); color: #ff6b81; border: 1px solid rgba(255,71,87,0.3); }
+        .swap-to { background: rgba(0,255,148,0.1); color: #4ade80; border: 1px solid rgba(0,255,148,0.3); }
+        .swap-arrow { color: var(--accent-cyan); font-size: 1.4em; font-weight: 700; }
+        .rec-metrics { display: grid; grid-template-columns: repeat(4, 1fr); gap: 12px; margin-bottom: 14px; }
+        .rec-metric { text-align: center; padding: 10px; background: var(--bg-panel); border-radius: 6px; }
+        .rec-metric-label { font-size: 0.65em; color: var(--text-muted); text-transform: uppercase; letter-spacing: 0.5px; }
+        .rec-metric-value { font-family: 'JetBrains Mono', monospace; font-size: 0.95em; font-weight: 600; color: var(--accent-green); margin-top: 4px; }
+        .rec-rationale { font-size: 0.85em; color: var(--text-secondary); line-height: 1.6; padding: 12px; background: rgba(0,212,255,0.05); border-radius: 6px; border-left: 3px solid var(--accent-cyan); }
+
+        /* Recommendation Card Checkbox */
+        .rec-checkbox { position: absolute; top: 16px; right: 16px; }
+        .rec-checkbox input { width: 18px; height: 18px; cursor: pointer; accent-color: var(--accent-cyan); }
+
+        /* Progress Modal */
+        .progress-overlay {
+            display: none;
+            position: fixed;
+            inset: 0;
+            background: rgba(0,0,0,0.85);
+            z-index: 10000;
+            justify-content: center;
+            align-items: center;
+            flex-direction: column;
+        }
+        .progress-overlay.show { display: flex; }
+        .progress-card {
+            background: var(--bg-panel);
+            border: 1px solid var(--accent-cyan);
+            border-radius: 14px;
+            padding: 32px 40px;
+            text-align: center;
+            max-width: 500px;
+            width: 90%;
+            box-shadow: 0 20px 60px rgba(0,0,0,0.5);
+        }
+        .progress-title { font-size: 1.2em; font-weight: 700; margin-bottom: 24px; }
+        .progress-bar-wrap { background: var(--bg-card); border-radius: 4px; height: 8px; overflow: hidden; margin-bottom: 20px; }
+        .progress-bar-fill {
+            height: 100%;
+            width: 0%;
+            background: linear-gradient(90deg, var(--accent-green), #00ff94);
+            border-radius: 4px;
+            transition: width 0.3s ease-out;
+        }
+        .progress-status { font-size: 0.9em; color: var(--text-secondary); margin-bottom: 20px; min-height: 24px; }
+        .progress-result { display: none; }
+        .progress-result.show { display: block; }
+        .progress-result p { font-size: 1em; color: var(--accent-green); margin-bottom: 20px; }
+        /* Close button of the progress card. Buttons do not inherit font-family by default, so it is set explicitly, as .filter-btn and .action-btn do. */
+        .progress-close-btn {
+            padding: 10px 24px;
+            background: var(--bg-card);
+            border: 1px solid var(--border);
+            color: var(--text-primary);
+            border-radius: 8px;
+            cursor: pointer;
+            font-family: 'Inter', sans-serif;
+            font-size: 0.9em;
+        }
+        .progress-close-btn:hover { border-color: var(--accent-cyan); color: var(--accent-cyan); }
+
+        /* Research Modal */
+        .research-steps { text-align: left; margin: 20px 0; }
+        .research-step { padding: 12px 16px; background: var(--bg-card); border-radius: 8px; margin-bottom: 10px; font-size: 0.9em; color: var(--text-secondary); display: flex; align-items: center; gap: 10px; opacity: 0.5; transition: all 0.3s; }
+        .research-step.active { opacity: 1; color: var(--accent-cyan); background: rgba(0,212,255,0.1); }
+        .research-step.done { opacity: 1; color: var(--accent-green); }
+        .research-step .spinner { width: 16px; height: 16px; border: 2px solid var(--border); border-top-color: var(--accent-cyan); border-radius: 50%; animation: spin 1s linear infinite; display: none; }
+        .research-step.active .spinner { display: block; }
+        .research-summary { display: none; text-align: center; padding: 20px; }
+        .research-summary.show { display: block; }
+        .research-summary p { font-size: 1em; color: var(--text-secondary); margin-bottom: 16px; }
+        .research-link { color: var(--accent-cyan); text-decoration: underline; cursor: pointer; }
+
+        @keyframes spin { to { transform: rotate(360deg); } }
+
+        /* Apply Modal Checklist */
+        .apply-checklist { max-height: 300px; overflow-y: auto; margin: 16px 0; }
+        .apply-item {
+            display: flex;
+            align-items: center;
+            gap: 12px;
+            padding: 12px 14px;
+            background: var(--bg-card);
+            border-radius: 8px;
+            margin-bottom: 8px;
+            transition: all 0.2s;
+        }
+        .apply-item:hover { background: var(--bg-card-hover); }
+        .apply-item input { width: 18px; height: 18px; accent-color: var(--accent-cyan); }
+        .apply-item-content { flex: 1; }
+        .apply-item-agent { font-weight: 600; font-size: 0.95em; }
+        .apply-item-models { display: flex; align-items: center; gap: 8px; font-family: 'JetBrains Mono', monospace; font-size: 0.8em; margin-top: 4px; }
+        .apply-item-from { text-decoration: line-through; color: #ff6b81; }
+        .apply-item-arrow { color: var(--accent-cyan); }
+        .apply-item-to { color: var(--accent-green); }
+        .apply-item-impact { font-size: 0.7em; padding: 2px 8px; border-radius: 4px; text-transform: uppercase; }
+        .apply-item-impact.critical { background: rgba(255,71,87,0.2); color: #ff6b81; }
+        .apply-item-impact.high { background: rgba(255,159,67,0.2); color: #ffc048; }
+        .apply-item-impact.medium { background: rgba(59,130,246,0.2); color: #60a5fa; }
+        .apply-item-impact.low { background: rgba(0,255,148,0.15); color: #4ade80; }
+        .apply-modal-actions { display: flex; justify-content: flex-end; gap: 10px; margin-top: 16px; }
+        /* Base style for apply-modal buttons; font-family is explicit because buttons do not inherit it by default (same as .filter-btn / .action-btn) */
+        .apply-btn { padding: 10px 20px; border-radius: 8px; font-family: 'Inter', sans-serif; font-size: 0.9em; cursor: pointer; transition: all 0.25s; }
+        .apply-btn.apply { background: linear-gradient(135deg, rgba(0,212,255,0.15), rgba(0,255,148,0.1)); border: 1px solid var(--accent-cyan); color: var(--accent-cyan); }
+        .apply-btn.apply:hover { box-shadow: 0 0 20px var(--glow-cyan); }
+
+        @media (max-width: 768px) {
+            .header h1 { font-size: 1.5em; }
+            .tabs { flex-wrap: wrap; }
+            .agents-grid { grid-template-columns: 1fr; }
+            .stats-row { grid-template-columns: repeat(2, 1fr); }
+            .rec-metrics { grid-template-columns: repeat(2, 1fr); }
+            .swap-vis { flex-direction: column; }
+            .swap-arrow { transform: rotate(90deg); }
+        }
+    </style>
+</head>
+<body>
+<div class="container">
+    <div class="header">
+        <h1>APAW Agent Evolution</h1>
+        <div class="sub">Real-time agent model & performance tracking</div>
+        <div class="meta">
+            <span id="lastSync">Loading...</span>
+            <span>•</span>
+            <span id="agentCount">0 agents</span>
+            <span>•</span>
+            <span id="historyCount">0 with history</span>
+        </div>
+    </div>
+
+    <div class="tabs" id="tabBar">
+        <button class="tab-btn active" onclick="switchTab('overview', this)">Overview</button>
+        <button class="tab-btn" onclick="switchTab('agents', this)">All Agents</button>
+        <button class="tab-btn" onclick="switchTab('history', this)">Timeline</button>
+        <button class="tab-btn" onclick="switchTab('recommendations', this)">Recommendations</button>
+        <button class="tab-btn" onclick="switchTab('heatmap', this)">Heatmap</button>
+        <button class="tab-btn" onclick="switchTab('impact', this)">Impact</button>
+    </div>
+
+    <!-- Overview Tab -->
+    <div id="tab-overview" class="tab-panel active">
+        <div class="stats-row" id="statsRow"></div>
+
+        <div class="category-section">
+            <div class="category-header">
+                <h2 class="category-title">Recent Changes</h2>
+                <span class="category-count" id="recentCount">0</span>
+            </div>
+            <div class="timeline-wrap">
+                <div class="timeline" id="recentTimeline"></div>
+            </div>
+        </div>
+
+        <div class="category-section">
+            <div class="category-header">
+                <h2 class="category-title">Pending Recommendations</h2>
+                <span class="category-count" id="recCount">0</span>
+            </div>
+            <div class="agents-grid" id="recAgents"></div>
+        </div>
+    </div>
+
+    <!-- All Agents Tab -->
+    <div id="tab-agents" class="tab-panel">
+        <div class="search-box">
+            <!-- The placeholder is not a reliable accessible name, so the input carries an explicit aria-label; the emoji icon is decorative and hidden from assistive technology -->
+            <span class="search-icon" aria-hidden="true">🔍</span>
+            <input type="text" class="search-input" id="agentSearch" placeholder="Search agents..." aria-label="Search agents" oninput="filterAgents()">
+        </div>
+        <div class="filter-row">
+            <button class="filter-btn active" onclick="filterCategory('all', this)">All</button>
+            <button class="filter-btn" onclick="filterCategory('Core Dev', this)">Core Dev</button>
+            <button class="filter-btn" onclick="filterCategory('QA', this)">QA</button>
+            <button class="filter-btn" onclick="filterCategory('Security', this)">Security</button>
+            <button class="filter-btn" onclick="filterCategory('Analysis', this)">Analysis</button>
+            <button class="filter-btn" onclick="filterCategory('Process', this)">Process</button>
+            <button class="filter-btn" onclick="filterCategory('Cognitive', this)">Cognitive</button>
+        </div>
+        <div id="agentsByCategory"></div>
+    </div>
+
+    <!-- History Tab -->
+    <div id="tab-history" class="tab-panel">
+        <div class="timeline-wrap">
+            <h2 class="timeline-title">Evolution Timeline</h2>
+            <div class="timeline" id="fullTimeline"></div>
+        </div>
+    </div>
+
+    <!-- Recommendations Tab -->
+    <div id="tab-recommendations" class="tab-panel">
+        <div class="actions-row">
+            <button class="action-btn primary" onclick="showApplyModal()">
+                <span>✨</span> Apply Recommended Fixes
+            </button>
+            <button class="action-btn" onclick="showResearchModal()">
+                <span>🔬</span> New Research Cycle
+            </button>
+            <button class="action-btn" onclick="exportRecommendations()" style="display:none">
+                <span>📥</span> Export JSON
+            </button>
+        </div>
+        <div class="agents-grid" id="allRecommendations"></div>
+    </div>
+
+    <!-- Heatmap Tab -->
+    <div id="tab-heatmap" class="tab-panel">
+        <div class="hm-wrap">
+            <div class="hm-title">Agent × Model Compatibility Heatmap</div>
+            <div class="hm-sub">Weighted score = benchmark × instruction-following multiplier · ★ = best fit · outlined = current · click for details</div>
+            <div style="overflow-x:auto"><table class="hm-table" id="hmTable"></table></div>
+            <div class="hm-legend-wrap">
+                <div class="hm-legend-track"></div>
+                <div class="hm-legend-marks">
+                    <span>100</span><span>80</span><span>60</span><span>40</span><span>20</span><span>0</span>
+                </div>
+                <div class="hm-legend-labels">
+                    <span class="hm-legend-left">↑ Ideal Match</span>
+                    <span class="hm-legend-right">Mismatch ↓</span>
+                </div>
+            </div>
+        </div>
+    </div>
+
+    <!-- Impact Tab -->
+    <div id="tab-impact" class="tab-panel">
+        <div class="stats-row" id="impactStats"></div>
+        
+        <!-- Chart 1: Agent Performance Scores -->
+        <div class="chart-wrap">
+            <div class="chart-title">Agent Performance Scores</div>
+            <div class="chart-sub">Composite score per agent based on model benchmarks</div>
+            <div class="chart-container"><canvas id="agentScoreChart"></canvas></div>
+        </div>
+        
+        <!-- Chart 2 & 3 side by side -->
+        <div style="display:grid;grid-template-columns:1fr 1.5fr;gap:20px;margin-bottom:24px">
+            <div class="chart-wrap">
+                <div class="chart-title">Model Distribution</div>
+                <div class="chart-sub">Agents per model</div>
+                <div class="chart-container-sm"><canvas id="modelDistChart"></canvas></div>
+            </div>
+            <div class="chart-wrap">
+                <div class="chart-title">Migration Impact</div>
+                <div class="chart-sub">Before vs after model change score</div>
+                <div class="chart-container-sm"><canvas id="migrationImpactChart"></canvas></div>
+            </div>
+        </div>
+    </div>
+</div>
+
+<!-- Export Modal -->
+<div class="modal" id="exportModal">
+    <div class="modal-content">
+        <div class="modal-header">
+            <div class="modal-title">Export Recommendations</div>
+            <div class="modal-actions">
+                <button class="action-btn" onclick="copyToClipboard()">📋 Copy</button>
+                <button class="action-btn primary" onclick="downloadJSON()">⬇ Download</button>
+                <!-- Icon-only close button: aria-label supplies the accessible name -->
+                <button class="action-btn" onclick="closeModal()" aria-label="Close" style="border-color: #ff4757; color: #ff6b81;">✕</button>
+            </div>
+        </div>
+        <div class="modal-body">
+            <pre class="modal-pre" id="exportContent"></pre>
+        </div>
+    </div>
+</div>
+
+<!-- Apply Fixes Modal -->
+<div class="modal" id="applyModal">
+    <div class="modal-content" style="max-width:600px">
+        <div class="modal-header">
+            <div class="modal-title">Apply Model Recommendations</div>
+            <div class="modal-actions">
+                <!-- Icon-only close button: aria-label supplies the accessible name -->
+                <button class="action-btn" onclick="closeApplyModal()" aria-label="Close" style="border-color: #ff4757; color: #ff6b81;">✕</button>
+            </div>
+        </div>
+        <div class="modal-body">
+            <p style="color: var(--text-secondary); margin-bottom: 16px;">Select recommendations to apply. All items are selected by default.</p>
+            <div class="apply-checklist" id="applyChecklist"></div>
+            <div class="apply-modal-actions">
+                <button class="apply-btn apply" onclick="simulateApply()">Apply Selected</button>
+            </div>
+        </div>
+    </div>
+</div>
+
+<!-- Progress Modal -->
+<div class="progress-overlay" id="progressModal">
+    <div class="progress-card">
+        <div class="progress-title" id="progressTitle">Applying Fixes...</div>
+        <div class="progress-bar-wrap">
+            <div class="progress-bar-fill" id="progressBar"></div>
+        </div>
+        <div class="progress-status" id="progressStatus">Preparing...</div>
+        <div class="progress-result" id="progressResult">
+            <p id="progressResultText"></p>
+            <button class="progress-close-btn" onclick="closeProgressModal()">Close</button>
+        </div>
+    </div>
+</div>
+
+<!-- Research Modal -->
+<div class="modal" id="researchModal">
+    <div class="modal-content" style="max-width:550px">
+        <div class="modal-header">
+            <div class="modal-title">Agent Model Research</div>
+            <div class="modal-actions">
+                <!-- Icon-only close button: aria-label supplies the accessible name -->
+                <button class="action-btn" onclick="closeResearchModal()" aria-label="Close" style="border-color: #ff4757; color: #ff6b81;">✕</button>
+            </div>
+        </div>
+        <div class="modal-body">
+            <div class="research-steps" id="researchSteps">
+                <div class="research-step" data-step="1">
+                    <span class="spinner"></span>
+                    <span>Analyzing benchmark data...</span>
+                </div>
+                <div class="research-step" data-step="2">
+                    <span class="spinner"></span>
+                    <span>Computing composite scores...</span>
+                </div>
+                <div class="research-step" data-step="3">
+                    <span class="spinner"></span>
+                    <span>Cross-referencing agent assignments...</span>
+                </div>
+                <div class="research-step" data-step="4">
+                    <span class="spinner"></span>
+                    <span>Generating recommendations...</span>
+                </div>
+                <div class="research-step" data-step="5">
+                    <span class="spinner"></span>
+                    <span>Research complete!</span>
+                </div>
+            </div>
+            <div class="research-summary" id="researchSummary">
+                <p id="researchSummaryText"></p>
+                <!-- href makes the link focusable and keyboard-activatable; "return false" cancels the "#" navigation so only the alert runs -->
+                <a class="research-link" href="#" onclick="alert('This would open the full report.'); return false;">View Report</a>
+            </div>
+        </div>
+    </div>
+</div>
+
+<!-- Tooltip Overlay -->
+<div id="ttOverlay"><div id="ttBox"></div></div>
+
+<!-- Heatmap Modal -->
+<div id="hmModal" class="modal" style="display:none">
+    <div class="modal-content" style="max-width:900px;width:95%;max-height:85vh">
+        <div class="modal-header">
+            <div class="modal-title" id="hmModalTitle">Agent Details</div>
+            <div class="modal-actions">
+                <!-- Icon-only close button: aria-label supplies the accessible name -->
+                <button class="action-btn" onclick="closeHmModal()" aria-label="Close">✕</button>
+            </div>
+        </div>
+        <div class="hm-modal-tabs">
+            <button class="hm-tab-btn active" onclick="switchHmTab('prompt')">Prompt Evolution</button>
+            <button class="hm-tab-btn" onclick="switchHmTab('gitea')">Gitea History</button>
+            <button class="hm-tab-btn" onclick="switchHmTab('skills')">Skills</button>
+            <button class="hm-tab-btn" onclick="switchHmTab('models')">Model Timeline</button>
+            <button class="hm-tab-btn" onclick="switchHmTab('graph')">Performance Graph</button>
+        </div>
+        <div class="modal-body" id="hmModalBody">
+            <!-- Content injected by JS -->
+        </div>
+    </div>
+</div>
+
+<!-- Cell Detail Modal -->
+<div id="cellDetailModal" class="modal">
+    <div class="modal-content" style="max-width:800px">
+        <div class="modal-header">
+            <div class="modal-title">Agent Model Performance</div>
+            <div class="modal-actions">
+                <!-- Icon-only close button: aria-label supplies the accessible name -->
+                <button class="action-btn" onclick="closeCellDetailModal()" aria-label="Close">✕</button>
+            </div>
+        </div>
+        <div class="modal-body">
+            <div id="cellDetailContent"></div>
+        </div>
+    </div>
+</div>
+
+<script>
+// Agent Evolution Dashboard
+// Supports both server and file:// mode
+let agentData = {};
+
+// Set Chart.js dark theme defaults
+Chart.defaults.color = '#8ba3c0';
+Chart.defaults.borderColor = '#1e2d45';
+Chart.defaults.font.family = "'Inter', sans-serif";
+
+// Inline recommendation data fallback (from model-research-latest.json)
+const INLINE_RECOMMENDATIONS = []; // Deprecated — data now comes from agentData.agents[].current.recommendations
+
+// Benchmark data (formerly an inline MODEL_BENCHMARKS fallback for embedded data lacking model_benchmarks; now removed, provenance notes kept below)
+// SOURCE: agent-evolution/data/model-benchmarks-verified.json v2.0.0
+// All IF scores verified against artificialanalysis.ai. SWE-bench scores removed — none of the 15 models appear on the official swebench.com leaderboard.
+/* MODEL_BENCHMARKS removed — data now in EMBEDDED_DATA.model_benchmarks */
+
+// Default embedded data (minimal - updated by sync script)
+// Unified data from REAL sources (2026-05-26T12:21:49.730Z)
+// Sources: .kilo/agents/*.md + kilo-meta.json + model-benchmarks-verified.json
+const EMBEDDED_DATA = {
+  "$schema": "./data/evolution.schema.json",
+  "version": "2.1.0",
+  "lastUpdated": "2026-05-26T12:21:49.721Z",
+  "agents": {
+    "agent-architect": {
+      "current": {
+        "description": "Creates, modifies, and reviews new agents, workflows, and skills based on capability gap analysis. Tier 2 meta-agent with self-cascade enabled.",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2.6",
+        "provider": "Ollama Cloud",
+        "color": "#8B5CF6",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 92,
+          "instruction_following": 91
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T22:30:00Z",
+          "commit": "auto",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "+22% quality, IF:90 for YAML frontmatter generation",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "kimi-k2.6 best fit for agent-architect (86). Multimodal for reviewing UI components.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-04-03T20:27:54Z",
+          "commit": "a0ef7cd02d3579883287ff0ffc23d1e5932c703a",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: add Agent Architect and KILO_SPEC documentation",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T01:51:28Z",
+          "commit": "298dde4273944e17d929b3b774c58e4f09e50753",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "openrouter/openai/gpt-oss:120b",
+          "reason": "feat: add capability-analyst and agent-architect for task coverage analysis",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T01:54:02Z",
+          "commit": "657407d5efd7eea2fc3bd6aa5853ebc320514e1d",
+          "type": "model_change",
+          "from": "openrouter/openai/gpt-oss:120b",
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "fix: replace unavailable model references with available ones",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T02:05:17Z",
+          "commit": "39d5ddf333ff2276580f3bee59b56462f52e9c1d",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "test: add validation functions and autonomous pipeline system tests",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T12:15:30Z",
+          "commit": "ebbb4d01b23066f27e451334e43899bd96b5ac90",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: optimize agent models for better performance",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:37:23Z",
+          "commit": "a4e09ad5d5e88ee25688b3a2d1c548e3ada0e549",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: upgrade agent models based on research findings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:42:32Z",
+          "commit": "6ba325cec5135517241bbbb48acfc54aeadaeac2",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "fix: correct model path format for OpenRouter",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-04T22:01:45Z",
+          "commit": "80dca09ae0a74bd9b1b846e7c91d8b398d80ce9e",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "fix: unquoted color, duplicate key, GLM downgrade + cross-platform validator",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T21:25:38Z",
+          "commit": "47b027a02fc909a303a659282afb228ac2204c0c",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat(gns2): Gitea-Nervous-System v2.0 - distributed agent state machine",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:27:48Z",
+          "commit": "4c9a95661f6222c84e0a67cec217babfacefdf29",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.6:cloud",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "evolution: remove obsolete :cloud suffix from kimi-k2.6 model id across all configs",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "architect-indexer": {
+      "current": {
+        "description": "Indexes and maps project codebase architecture into .architect/ directory. Creates and maintains structured documentation of entities, APIs, DB schema, file graphs, and conventions. (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/glm-5.1",
+        "provider": "Ollama Cloud",
+        "color": "#10B981",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "architect-indexer could improve from ollama-cloud/glm-5.1 to kimi-k2.6. Score: 81 → 92 (+11). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 81,
+            "score_after": 92,
+            "score_delta": 11,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 81,
+          "instruction_following": 90
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-22T20:01:38Z",
+          "commit": "6b71ea2b574dea773ef424291de119eedd9b470e",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat: add .architect/ project mapping system with architect-indexer agent and Docker containerization",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "backend-developer": {
+      "current": {
+        "description": "Backend specialist for Node.js, Express, APIs, and database integration (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3-coder:480b",
+        "provider": "Ollama Cloud",
+        "color": "#10B981",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "backend-developer could improve from ollama-cloud/qwen3-coder:480b to kimi-k2.6. Score: 60 → 92 (+32). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 60,
+            "score_after": 92,
+            "score_delta": 32,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 60,
+          "instruction_following": 0
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T01:19:09Z",
+          "commit": "23eb60762cec861a8a7ab306b994946d55e77e18",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: add workflows for CMS, E-commerce, Blog + backend-developer agent + prompt-engineering rules",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T02:39:06Z",
+          "commit": "8fcd8f8a9b4fc05318af2cd757d0e3a441bf12a4",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: add comprehensive NodeJS development skills and rules",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:00:55Z",
+          "commit": "41eb4c7d4d67a1c395a00f3ff819daa6eb030b9d",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: add database skills for ClickHouse, PostgreSQL, and SQLite",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T12:47:01Z",
+          "commit": "43747d9875edd6061699b831c51ccbb573ec6a47",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: add Docker/DevOps skills and devops-engineer agent",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T13:02:32Z",
+          "commit": "0a854a3bc323330daab1a947c9f1d244dbb8a555",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "fix: add missing agent permissions and update orchestrator mappings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v3.2",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v3.2",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "browser-automation": {
+      "current": {
+        "description": "Browser automation agent using Playwright MCP for E2E testing, form filling, navigation, and web interaction (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-flash",
+        "provider": "Ollama Cloud",
+        "color": "#1E88E5",
+        "category": "testing",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "medium",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "browser-automation could improve from ollama-cloud/deepseek-v4-flash to kimi-k2.6. Score: 88 → 92 (+4). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 88,
+            "score_after": 92,
+            "score_delta": 4,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 88,
+          "instruction_following": 86
+        }
+      },
+      "history": [
+        {
+          "date": "2026-05-25T14:08:46.653Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/deepseek-v4-flash",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:49:56Z",
+          "commit": "5793b7909b3888ae29d3fafe3f2d04ca0c5ad71f",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: add web testing system with browser automation (Milestone #44)",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.6:cloud",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T15:07:17Z",
+          "commit": "047a87afb405c647bcb778f3c090d042440839d3",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/deepseek-v4-flash",
+          "reason": "feat(agent-models): apply MEDIUM+LOW priority model migrations",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "capability-analyst": {
+      "current": {
+        "description": "Analyzes task requirements against available agents, workflows, and skills. Identifies gaps and recommends new components. Tier 2 meta-agent with self-cascade enabled.",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-pro-max",
+        "provider": "Ollama Cloud",
+        "color": "#6366F1",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 91,
+          "instruction_following": 89
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T22:30:00Z",
+          "commit": "auto",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "+23% quality, IF:90, FREE via OpenRouter",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:08:46.653Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T01:51:28Z",
+          "commit": "298dde4273944e17d929b3b774c58e4f09e50753",
+          "type": "model_change",
+          "from": null,
+          "to": "anthropic/claude-sonnet-4-20250514",
+          "reason": "feat: add capability-analyst and agent-architect for task coverage analysis",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T01:54:02Z",
+          "commit": "657407d5efd7eea2fc3bd6aa5853ebc320514e1d",
+          "type": "model_change",
+          "from": "anthropic/claude-sonnet-4-20250514",
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "fix: replace unavailable model references with available ones",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T12:15:30Z",
+          "commit": "ebbb4d01b23066f27e451334e43899bd96b5ac90",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: optimize agent models for better performance",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:37:23Z",
+          "commit": "a4e09ad5d5e88ee25688b3a2d1c548e3ada0e549",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: upgrade agent models based on research findings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:42:32Z",
+          "commit": "6ba325cec5135517241bbbb48acfc54aeadaeac2",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "fix: correct model path format for OpenRouter",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T21:25:38Z",
+          "commit": "47b027a02fc909a303a659282afb228ac2204c0c",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat(gns2): Gitea-Nervous-System v2.0 - distributed agent state machine",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T15:07:17Z",
+          "commit": "047a87afb405c647bcb778f3c090d042440839d3",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(agent-models): apply MEDIUM+LOW priority model migrations",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "code-skeptic": {
+      "current": {
+        "description": "Adversarial code reviewer. Finds problems and issues. Does NOT suggest implementations (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/minimax-m2.5",
+        "provider": "Ollama Cloud",
+        "color": "#E11D48",
+        "category": "quality",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "code-skeptic could improve from ollama-cloud/minimax-m2.5 to kimi-k2.6. Score: 74 → 92 (+18). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 74,
+            "score_after": 92,
+            "score_delta": 18,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 74,
+          "instruction_following": 82
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss-120b",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss-120b",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss-120b",
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "devops-engineer": {
+      "current": {
+        "description": "DevOps specialist for Docker, Kubernetes, CI/CD pipeline automation, and infrastructure management (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2.6",
+        "provider": "Ollama Cloud",
+        "color": "#FF6B35",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 92,
+          "instruction_following": 91
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T12:47:01Z",
+          "commit": "43747d9875edd6061699b831c51ccbb573ec6a47",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: add Docker/DevOps skills and devops-engineer agent",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T13:02:32Z",
+          "commit": "0a854a3bc323330daab1a947c9f1d244dbb8a555",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "fix: add missing agent permissions and update orchestrator mappings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v3.2",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:27:48Z",
+          "commit": "4c9a95661f6222c84e0a67cec217babfacefdf29",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.6:cloud",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "evolution: remove obsolete :cloud suffix from kimi-k2.6 model id across all configs",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "evaluator": {
+      "current": {
+        "description": "Scores agent effectiveness after task completion for continuous improvement. Tier 2 meta-agent with self-cascade enabled.",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3.5-122b",
+        "provider": "Ollama Cloud",
+        "color": "#047857",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "evaluator could improve from ollama-cloud/qwen3.5-122b to kimi-k2.6. Score: 82 → 92 (+10). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 82,
+            "score_after": 92,
+            "score_delta": 10,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 82,
+          "instruction_following": 92
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Nemotron 3 Super better for evaluation tasks",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T22:30:00Z",
+          "commit": "auto",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "+4% quality, IF:90 for scoring accuracy, FREE",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T13:37:20.281Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-o3",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-o3",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-o3",
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:37:23Z",
+          "commit": "a4e09ad5d5e88ee25688b3a2d1c548e3ada0e549",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: upgrade agent models based on research findings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:42:32Z",
+          "commit": "6ba325cec5135517241bbbb48acfc54aeadaeac2",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "fix: correct model path format for OpenRouter",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T21:25:38Z",
+          "commit": "47b027a02fc909a303a659282afb228ac2204c0c",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat(gns2): Gitea-Nervous-System v2.0 - distributed agent state machine",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:36:31Z",
+          "commit": "4a0c78e5c965188fe669db9cecc430904702728c",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "feat(agent-models): apply CRITICAL+HIGH model migrations from research",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "flutter-developer": {
+      "current": {
+        "description": "Flutter mobile specialist for cross-platform apps, state management, and UI components (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3-coder:480b",
+        "provider": "Ollama Cloud",
+        "color": "#02569B",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "flutter-developer could improve from ollama-cloud/qwen3-coder:480b to kimi-k2.6. Score: 60 → 92 (+32). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 60,
+            "score_after": 92,
+            "score_delta": 32,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 60,
+          "instruction_following": 0
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T15:00:00Z",
+          "commit": "af5f401",
+          "type": "agent_created",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "New agent for Flutter development",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T17:04:13Z",
+          "commit": "af5f401a533810926da2bf1ec559456d92c1cabd",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: add Flutter development support with agent, rules and skills",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T17:26:02Z",
+          "commit": "b899119d218470c28e0988d1d0bcba6ba2b55330",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: add html-to-flutter skill and research report",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "frontend-developer": {
+      "current": {
+        "description": "Handles UI implementation with multimodal capabilities. Accepts visual references like screenshots and mockups (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/minimax-m2.5",
+        "provider": "Ollama Cloud",
+        "color": "#0EA5E9",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "frontend-developer could improve from ollama-cloud/minimax-m2.5 to kimi-k2.6. Score: 74 → 92 (+18). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 74,
+            "score_after": 92,
+            "score_delta": 18,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 74,
+          "instruction_following": 82
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "af5f401",
+          "type": "agent_created",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "Flutter development support added",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T17:00:00Z",
+          "commit": "model-research-sync",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "Matrix score 92 for frontend on M2.5. SWE-bench 80.2%.",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.5",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.5",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T13:02:32Z",
+          "commit": "0a854a3bc323330daab1a947c9f1d244dbb8a555",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.5",
+          "reason": "fix: add missing agent permissions and update orchestrator mappings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.5",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-19T10:04:51Z",
+          "commit": "7445e66676fa5465cafd20a337c1b8f1ca4d7d96",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: add Next.js, Vue/Nuxt, React, Python (Django/FastAPI) skills and agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/kimi-k2.5",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.5",
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T16:54:29Z",
+          "commit": "f65bbf9420023bda5dc475b5a968fc1556289342",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "feat: add visual quality rules to frontend-developer agent + new screenshot page",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "go-developer": {
+      "current": {
+        "description": "Go backend specialist for Gin, Echo, APIs, and database integration (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-pro-max",
+        "provider": "Ollama Cloud",
+        "color": "#00ADD8",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 91,
+          "instruction_following": 89
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v3.2",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "Qwen3-Coder optimized for Go",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T17:00:00Z",
+          "commit": "model-research-sync",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "Matrix score 88 for go-dev on V4-Pro. DeepSeek traditionally strong in Go/Rust.",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-05T03:40:32Z",
+          "commit": "be4c586c8fb4b32f7a4dd329bd67d234d81054f7",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: add Go Lang development coverage (Milestone #49)",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:00:55Z",
+          "commit": "41eb4c7d4d67a1c395a00f3ff819daa6eb030b9d",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: add database skills for ClickHouse, PostgreSQL, and SQLite",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v3.2",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T13:02:32Z",
+          "commit": "0a854a3bc323330daab1a947c9f1d244dbb8a555",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "fix: add missing agent permissions and update orchestrator mappings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "history-miner": {
+      "current": {
+        "description": "Analyzes git history to find duplicates and past solutions, preventing regression and duplicate work (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3.5-122b",
+        "provider": "Ollama Cloud",
+        "color": "#059669",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "history-miner could improve from ollama-cloud/qwen3.5-122b to kimi-k2.6. Score: 82 → 92 (+10). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 82,
+            "score_after": 92,
+            "score_delta": 10,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 82,
+          "instruction_following": 92
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:08:46.653Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/gemini-3-flash",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/gemini-3-flash",
+          "to": "ollama-cloud/gpt-oss:20b",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:20b",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T12:15:30Z",
+          "commit": "ebbb4d01b23066f27e451334e43899bd96b5ac90",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:20b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: optimize agent models for better performance",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T15:07:17Z",
+          "commit": "047a87afb405c647bcb778f3c090d042440839d3",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "feat(agent-models): apply MEDIUM+LOW priority model migrations",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "incident-responder": {
+      "current": {
+        "description": "Server incident response and system hardening specialist. Handles live forensics, malware removal, persistence hunting, SSH-based server cleanup, and post-incident hardening. Works with any OS and panel.",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2.6",
+        "provider": "Ollama Cloud",
+        "color": "#B91C1C",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 92,
+          "instruction_following": 91
+        }
+      },
+      "history": [
+        {
+          "date": "2026-05-09T13:31:20Z",
+          "commit": "c031c4b9e5d3973d5e29c7aea13166b282ea49c4",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat(evolution): add incident-responder agent for server incident response and forensics",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:27:48Z",
+          "commit": "4c9a95661f6222c84e0a67cec217babfacefdf29",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.6:cloud",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "evolution: remove obsolete :cloud suffix from kimi-k2.6 model id across all configs",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "lead-developer": {
+      "current": {
+        "description": "Primary code writer for backend and core logic. Writes implementation to pass tests (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3-coder:480b",
+        "provider": "Ollama Cloud",
+        "color": "#DC2626",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "lead-developer could improve from ollama-cloud/qwen3-coder:480b to kimi-k2.6. Score: 60 → 92 (+32). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 60,
+            "score_after": 92,
+            "score_delta": 32,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 60,
+          "instruction_following": 0
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "Initial configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T16:56:09Z",
+          "commit": "model-research-sync",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Nemotron 3 Super has better reasoning",
+          "source": "research"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "Reverted to qwen3-coder: SWE-bench 66.5% is coding-benchmark standard. Matrix score 92 vs nemotron 70.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v3.2",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-29T21:04:22Z",
+          "commit": "3badb259cc97c7ab0c5e2ad560859278a17443ed",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: bidirectional research dashboard + agent config fixes",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-29T23:19:16Z",
+          "commit": "9e48a4960e5bc80c150822972d99adb9ecd7bb0d",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "fix: restore optimal v3 models + add fitness gate protection",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "markdown-validator": {
+      "current": {
+        "description": "Validates and corrects Markdown descriptions for Gitea issues (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/nemotron-3-nano",
+        "provider": "Ollama Cloud",
+        "color": "#F97316",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "markdown-validator could improve from ollama-cloud/nemotron-3-nano to kimi-k2.6. Score: 62 → 92 (+30). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 62,
+            "score_after": 92,
+            "score_delta": 30,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 62,
+          "instruction_following": 68
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/nemotron-3-nano:30b",
+          "reason": "Nano efficient for lightweight validation tasks",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-nano:30b",
+          "to": "ollama-cloud/nemotron-3-nano",
+          "reason": "Unified naming. Nano IF=68, tiny and cheap, perfect for validation.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-05-23T23:35:02.185Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-nano",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:08:46.653Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v4-pro-max",
+          "to": "ollama-cloud/nemotron-3-nano",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T01:42:12Z",
+          "commit": "e58a5b6380d8e923ea4264783fb03fd4e8351a9f",
+          "type": "model_change",
+          "from": null,
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: add markdown-validator agent and scoped-labels skill",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/nemotron-3-nano:30b",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-nano:30b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-nano:30b",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T15:07:17Z",
+          "commit": "047a87afb405c647bcb778f3c090d042440839d3",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v4-pro-max",
+          "to": "ollama-cloud/nemotron-3-nano",
+          "reason": "feat(agent-models): apply MEDIUM+LOW priority model migrations",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "memory-manager": {
+      "current": {
+        "description": "Manages agent memory systems - short-term (context), long-term (vector store), and episodic (experiences) (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-pro-max",
+        "provider": "Ollama Cloud",
+        "color": "#8B5CF6",
+        "category": "cognitive",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 91,
+          "instruction_following": 89
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "RULER@1M critical for memory ctx",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "MIGRATION: qwen3.6-plus was OpenRouter. deepseek-v4-pro-max has 1M context (same as nemotron), matrix 86, SWE-V 80.6.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-05-23T23:35:02.184Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v4-pro-max",
+          "to": "ollama-cloud/qwen3.6-plus",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T13:37:20.281Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3.6-plus",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T02:01:05Z",
+          "commit": "774dc9ac4052a1830ec238837fbf7a2c7d6b2518",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: add cognitive enhancement agents based on research",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/qwen3.6-plus",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3.6-plus",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:36:31Z",
+          "commit": "4a0c78e5c965188fe669db9cecc430904702728c",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3.6-plus",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(agent-models): apply CRITICAL+HIGH model migrations from research",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "orchestrator": {
+      "current": {
+        "description": "Main dispatcher. Routes tasks between agents based on Issue status and manages the workflow state machine. IF:90 for optimal routing accuracy. (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2.6",
+        "provider": "Ollama Cloud",
+        "color": "#7C3AED",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 92,
+          "instruction_following": 91
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T20:28:58Z",
+          "commit": "model-research-sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "kimi-k2.6 best fit for orchestration (92). 300 sub-agent swarm.",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T00:50:08Z",
+          "commit": "259f4079c20b8e824fad0d5bce79cf7be0dd17ee",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "docs: add CapabilityAnalyst and MarkdownValidator to spec and orchestrator table",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T01:36:39Z",
+          "commit": "39eeb2f35fe2b1fb81c82e13d65b0a9f5278c5ae",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: add workflow executor, quality controller, and workflow architect for closed-loop execution",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T02:05:37Z",
+          "commit": "420c10fb12465c8262cfe0da24fc8a2c07b48dc9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: integrate cognitive enhancement agents into capability index and orchestrator",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T13:02:32Z",
+          "commit": "0a854a3bc323330daab1a947c9f1d244dbb8a555",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "fix: add missing agent permissions and update orchestrator mappings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-06T22:55:12Z",
+          "commit": "b9abd91d075308d15ff800986290aeacf3b5fa25",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: orchestrator evolution — full access + model upgrades + self-evolution protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-07T08:55:24Z",
+          "commit": "e074612046cf99e28f007ca02d62c23b6d51fc02",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: add web testing infrastructure",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T23:43:04Z",
+          "commit": "b46a1a20a8ea028eaf4365bd785c2d9a6847119a",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat: add PHP development stack, atomic tasks, modular code rules, agent monitoring, fix target project detection",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-19T10:04:51Z",
+          "commit": "7445e66676fa5465cafd20a337c1b8f1ca4d7d96",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat: add Next.js, Vue/Nuxt, React, Python (Django/FastAPI) skills and agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-22T20:01:38Z",
+          "commit": "6b71ea2b574dea773ef424291de119eedd9b470e",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat: add .architect/ project mapping system with architect-indexer agent and Docker containerization",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T18:54:08Z",
+          "commit": "f01e2064fb020de66cd800217203df525be927ed",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat(evolution): Kilo Code release sync & APAW system hardening (v2026-05-07)",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-09T13:31:20Z",
+          "commit": "c031c4b9e5d3973d5e29c7aea13166b282ea49c4",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat(evolution): add incident-responder agent for server incident response and forensics",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:27:48Z",
+          "commit": "4c9a95661f6222c84e0a67cec217babfacefdf29",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.6:cloud",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "evolution: remove obsolete :cloud suffix from kimi-k2.6 model id across all configs",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-16T13:10:06Z",
+          "commit": "4e9ea678bd89cb7c518ce46d6fbeb28fa0aa65f9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "feat(orchestrator): evolution — capability-first routing, parallelization, zero-work policy",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-18T15:54:15Z",
+          "commit": "46d67528900e7d1543641417710eb440929bc4db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "feat(context-window): evolution — Gitea-centric checkpoint pruning + agent context hygiene",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-18T16:13:33Z",
+          "commit": "ded8e3022d9f9b8f6d7dbbd3bad675d3e0ad2e22",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "feat(parallel-coordination): evolution — Gitea comment-based task claiming for parallel agent execution",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-24T00:11:25Z",
+          "commit": "e6e8e9cb2adc24595b18f0f6b0bafc29369201cc",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "feat(workflow-cross-checker): add pre-flight inter-agent validation agent with gate protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "performance-engineer": {
+      "current": {
+        "description": "Reviews code for performance issues. Focuses on efficiency, N+1 queries, memory leaks, and algorithmic complexity (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-pro-max",
+        "provider": "Ollama Cloud",
+        "color": "#0D9488",
+        "category": "quality",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 91,
+          "instruction_following": 89
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Better reasoning for performance analysis",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "Matrix=84 for perf-engineer on V4-Pro. GPQA 90.1 for reasoning.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "php-developer": {
+      "current": {
+        "description": "PHP backend specialist for Laravel, Symfony, WordPress, and full-stack web applications (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3-coder:480b",
+        "provider": "Ollama Cloud",
+        "color": "#8B5CF6",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "php-developer could improve from ollama-cloud/qwen3-coder:480b to kimi-k2.6. Score: 60 → 92 (+32). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 60,
+            "score_after": 92,
+            "score_delta": 32,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 60,
+          "instruction_following": 0
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-18T23:43:04Z",
+          "commit": "b46a1a20a8ea028eaf4365bd785c2d9a6847119a",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: add PHP development stack, atomic tasks, modular code rules, agent monitoring, fix target project detection",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "pipeline-judge": {
+      "current": {
+        "description": "Automated pipeline judge. Evaluates workflow execution by running tests, measuring token cost and wall-clock time. Produces objective fitness scores. Never writes code - only measures and scores. (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2.6",
+        "provider": "Ollama Cloud",
+        "color": "#DC2626",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 92,
+          "instruction_following": 91
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-06T00:23:50+0100Z",
+          "commit": "fa68141d",
+          "type": "agent_created",
+          "from": null,
+          "to": "",
+          "reason": "feat: add pipeline-judge agent and evolution workflow system",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T13:37:20.281Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-06T00:23:50Z",
+          "commit": "fa68141d476a6356a2fb0618a124d49c9a8d2c65",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: add pipeline-judge agent and evolution workflow system",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-06T00:48:21Z",
+          "commit": "170324765147282e20fd17236378afba6f0db5c9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: add Docker-based evolution testing with precise measurements",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-06T01:35:29Z",
+          "commit": "ae471dcd6b6d266bd485279b28c33740470589e7",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "docs: remove Docker references from pipeline-judge",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-06T22:55:12Z",
+          "commit": "b9abd91d075308d15ff800986290aeacf3b5fa25",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: orchestrator evolution — full access + model upgrades + self-evolution protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:36:31Z",
+          "commit": "4a0c78e5c965188fe669db9cecc430904702728c",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "feat(agent-models): apply CRITICAL+HIGH model migrations from research",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "planner": {
+      "current": {
+        "description": "Advanced task planner using Chain of Thought, Tree of Thoughts, and Plan-Execute-Reflect (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-pro-max",
+        "provider": "Ollama Cloud",
+        "color": "#F59E0B",
+        "category": "cognitive",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 91,
+          "instruction_following": 89
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Nemotron 3 Super excels at planning",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T17:00:00Z",
+          "commit": "model-research-sync",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "Matrix score 88 for planner on V4-Pro. GPQA 90.1.",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-05T02:01:05Z",
+          "commit": "774dc9ac4052a1830ec238837fbf7a2c7d6b2518",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: add cognitive enhancement agents based on research",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "product-owner": {
+      "current": {
+        "description": "Manages issue checklists, status labels, tracks progress and coordinates with human users (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/glm-5.1",
+        "provider": "Ollama Cloud",
+        "color": "#EA580C",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "product-owner could improve from ollama-cloud/glm-5.1 to kimi-k2.6. Score: 81 → 92 (+11). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 81,
+            "score_after": 92,
+            "score_delta": 11,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 81,
+          "instruction_following": 90
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5",
+          "reason": "GLM-5 good for management tasks",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3.5-122b",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:47:14Z",
+          "commit": "1ab9939c92a6201884d8919aeba360dac8b09213",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "fix: correct OpenRouter model paths across all files",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "prompt-optimizer": {
+      "current": {
+        "description": "Improves agent system prompts based on performance failures. Meta-learner for prompt optimization (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3.5-122b",
+        "provider": "Ollama Cloud",
+        "color": "#BE185D",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "prompt-optimizer could improve from ollama-cloud/qwen3.5-122b to kimi-k2.6. Score: 82 → 92 (+10). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 82,
+            "score_after": 92,
+            "score_delta": 10,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 82,
+          "instruction_following": 92
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Research recommendation applied",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/qwen3.5",
+          "reason": "MIGRATION: qwen3.6-plus was OpenRouter (not Ollama Cloud). qwen3.5 has IF=92, updated 2 days ago, 12.4M pulls.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-05-23T23:35:02.184Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3.5",
+          "to": "ollama-cloud/qwen3.6-plus",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T13:37:20.281Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3.6-plus",
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/claude-4.5",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/claude-4.5",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T12:15:30Z",
+          "commit": "ebbb4d01b23066f27e451334e43899bd96b5ac90",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: optimize agent models for better performance",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:47:14Z",
+          "commit": "1ab9939c92a6201884d8919aeba360dac8b09213",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "fix: correct OpenRouter model paths across all files",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/qwen3.6-plus",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3.6-plus",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:36:31Z",
+          "commit": "4a0c78e5c965188fe669db9cecc430904702728c",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3.6-plus",
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "feat(agent-models): apply CRITICAL+HIGH model migrations from research",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "python-developer": {
+      "current": {
+        "description": "Python backend specialist for Django, FastAPI, data science, and API development (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3-coder:480b",
+        "provider": "Ollama Cloud",
+        "color": "#3776AB",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "python-developer could improve from ollama-cloud/qwen3-coder:480b to kimi-k2.6. Score: 60 → 92 (+32). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 60,
+            "score_after": 92,
+            "score_delta": 32,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 60,
+          "instruction_following": 0
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-19T10:04:51Z",
+          "commit": "7445e66676fa5465cafd20a337c1b8f1ca4d7d96",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: add Next.js, Vue/Nuxt, React, Python (Django/FastAPI) skills and agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "reflector": {
+      "current": {
+        "description": "Self-reflection agent using Reflexion pattern - learns from mistakes (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-pro-max",
+        "provider": "Ollama Cloud",
+        "color": "#10B981",
+        "category": "cognitive",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 91,
+          "instruction_following": 89
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Better for reflection tasks",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T17:00:00Z",
+          "commit": "model-research-sync",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "Matrix score 84. Strong reasoning chains.",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-05T02:01:05Z",
+          "commit": "774dc9ac4052a1830ec238837fbf7a2c7d6b2518",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: add cognitive enhancement agents based on research",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "release-manager": {
+      "current": {
+        "description": "Manages git operations, semantic versioning, branching, and deployments. Ensures clean history (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2.6",
+        "provider": "Ollama Cloud",
+        "color": "#581C87",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 92,
+          "instruction_following": 91
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/devstral-2:123b",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:08:46.653Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/devstral-2-123b",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/devstral-2-123b",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/devstral-2-123b",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder:480b",
+          "to": "ollama-cloud/devstral-2:123b",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:37:45Z",
+          "commit": "d9fd744a462f62fc91112de2bbf289a78dce8b22",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/devstral-2:123b",
+          "reason": "feat: add task analysis workflow and update issue management",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-06T22:55:12Z",
+          "commit": "b9abd91d075308d15ff800986290aeacf3b5fa25",
+          "type": "model_change",
+          "from": "ollama-cloud/devstral-2:123b",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: orchestrator evolution — full access + model upgrades + self-evolution protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/devstral-2:123b",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/devstral-2:123b",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T15:07:17Z",
+          "commit": "047a87afb405c647bcb778f3c090d042440839d3",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "feat(agent-models): apply MEDIUM+LOW priority model migrations",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "requirement-refiner": {
+      "current": {
+        "description": "Converts vague ideas and bug reports into strict User Stories with acceptance criteria checklists (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2-thinking",
+        "provider": "Ollama Cloud",
+        "color": "#4F46E5",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "requirement-refiner could improve from ollama-cloud/kimi-k2-thinking to kimi-k2.6. Score: 60 → 92 (+32). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 60,
+            "score_after": 92,
+            "score_delta": 32,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 60,
+          "instruction_following": 0
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T22:30:00Z",
+          "commit": "auto",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/glm-5",
+          "reason": "+33% quality. GLM-5 excels at requirement analysis",
+          "source": "research"
+        },
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "kimi-k2.6 IF=91 highest, multimodal for mockup understanding. Matrix ~88-90 for req-refiner.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-05-23T23:35:02.184Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.6",
+          "to": "ollama-cloud/kimi-k2-thinking",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2-thinking",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2-thinking",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:37:45Z",
+          "commit": "d9fd744a462f62fc91112de2bbf289a78dce8b22",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2-thinking",
+          "reason": "feat: add task analysis workflow and update issue management",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2-thinking",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:37:23Z",
+          "commit": "a4e09ad5d5e88ee25688b3a2d1c548e3ada0e549",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: upgrade agent models based on research findings",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/kimi-k2-thinking",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2-thinking",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "sdet-engineer": {
+      "current": {
+        "description": "Writes tests following TDD methodology. Tests MUST fail initially (Red phase) (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3-coder:480b",
+        "provider": "Ollama Cloud",
+        "color": "#8B5CF6",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "sdet-engineer could improve from ollama-cloud/qwen3-coder:480b to kimi-k2.6. Score: 60 → 92 (+32). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 60,
+            "score_after": 92,
+            "score_delta": 32,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 60,
+          "instruction_following": 0
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder-next",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder-next",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/qwen3-coder-next",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "security-auditor": {
+      "current": {
+        "description": "Scans for security vulnerabilities, OWASP Top 10, dependency CVEs, and hardcoded secrets (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-pro-max",
+        "provider": "Ollama Cloud",
+        "color": "#DC2626",
+        "category": "quality",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 91,
+          "instruction_following": 89
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v3.2",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Nemotron 3 Super optimized for security analysis",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "V4-Pro Max matrix=80 vs nemotron=76. SWE-V 80.6, 1M context.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/glm-4.7",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-4.7",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-4.7",
+          "to": "ollama-cloud/kimi-k2.5",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T02:40:35Z",
+          "commit": "72372f1ca009c276e4a25d3c7e3b1efdf7bae95f",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.5",
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "fix: use available model for security-auditor (deepseek-v3.2)",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v3.2",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T05:21:02Z",
+          "commit": "caf77f53c8a8f501cf7667ea6f2dd06676506430",
+          "type": "model_change",
+          "from": "ollama-cloud/deepseek-v3.2",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: update agent models based on recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T12:47:01Z",
+          "commit": "43747d9875edd6061699b831c51ccbb573ec6a47",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: add Docker/DevOps skills and devops-engineer agent",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-29T21:04:22Z",
+          "commit": "3badb259cc97c7ab0c5e2ad560859278a17443ed",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: bidirectional research dashboard + agent config fixes",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "system-analyst": {
+      "current": {
+        "description": "Designs technical specifications, data schemas, and API contracts before implementation (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/deepseek-v4-pro-max",
+        "provider": "Ollama Cloud",
+        "color": "#0891B2",
+        "category": "core",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 91,
+          "instruction_following": 89
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-05T05:21:00Z",
+          "commit": "caf77f53c8",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/glm-5",
+          "reason": "GLM-5 better for system engineering",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T16:59:52Z",
+          "commit": "model-research-sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "Test recommendation for model research sync script",
+          "source": "research"
+        },
+        {
+          "date": "2026-05-24T01:00:00Z",
+          "commit": "ollama-cloud-consolidation",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Reverted: GLM-5.1 Arena ELO 1451, instruction following ~90. Standardization with 12 other agents.",
+          "source": "orchestrator-analysis"
+        },
+        {
+          "date": "2026-05-25T13:37:20.281Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss-120b",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss-120b",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T12:15:30Z",
+          "commit": "ebbb4d01b23066f27e451334e43899bd96b5ac90",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: optimize agent models for better performance",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-29T21:04:22Z",
+          "commit": "3badb259cc97c7ab0c5e2ad560859278a17443ed",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/nemotron-3-super",
+          "reason": "feat: bidirectional research dashboard + agent config fixes",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-29T23:19:16Z",
+          "commit": "9e48a4960e5bc80c150822972d99adb9ecd7bb0d",
+          "type": "model_change",
+          "from": "ollama-cloud/nemotron-3-super",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "fix: restore optimal v3 models + add fitness gate protection",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:36:31Z",
+          "commit": "4a0c78e5c965188fe669db9cecc430904702728c",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/deepseek-v4-pro-max",
+          "reason": "feat(agent-models): apply CRITICAL+HIGH model migrations from research",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "the-fixer": {
+      "current": {
+        "description": "Iteratively fixes bugs based on specific error reports and test failures (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2.6",
+        "provider": "Ollama Cloud",
+        "color": "#F59E0B",
+        "category": "quality",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 92,
+          "instruction_following": 91
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-03T20:10:17Z",
+          "commit": "47219c42046c482be46664a84c99fd5123b14062",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.7",
+          "reason": "feat: реорганизация структуры агентов и добавление skills согласно документации Kilo Code",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-03T20:50:40Z",
+          "commit": "72d6f52844c6578defb5ed8a2d692b4e6ac3b3db",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.7",
+          "reason": "fix: correct agent mode configuration and add Task tool invocation sections",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T00:50:22Z",
+          "commit": "4a69c5323b6686b67a90184ac99b6994fad6748d",
+          "type": "model_change",
+          "from": "ollama-cloud/minimax-m2.7",
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "feat: update agent models to current configuration",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-04T03:18:28Z",
+          "commit": "a1a15473a03661e3af6730b6a6d3c24f34756e13",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "feat: add mandatory Gitea commenting to all agents",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/minimax-m2.5",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/minimax-m2.5",
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6:cloud",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:27:48Z",
+          "commit": "4c9a95661f6222c84e0a67cec217babfacefdf29",
+          "type": "model_change",
+          "from": "ollama-cloud/kimi-k2.6:cloud",
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "evolution: remove obsolete :cloud suffix from kimi-k2.6 model id across all configs",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-13T09:37:40Z",
+          "commit": "2287122f9196e4ef5b0cbfff3641d74b6320f086",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "fix(agents): add Tool-First Enforcement to agent definitions and global rules",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "visual-tester": {
+      "current": {
+        "description": "Visual regression testing agent that compares screenshots and detects UI differences using pixelmatch and image diff (GNS-2 Tier 0)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3-coder:480b",
+        "provider": "Ollama Cloud",
+        "color": "#E91E63",
+        "category": "quality",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "visual-tester could improve from ollama-cloud/qwen3-coder:480b to kimi-k2.6. Score: 60 → 92 (+32). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 60,
+            "score_after": 92,
+            "score_delta": 32,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 60,
+          "instruction_following": 0
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-04T03:49:56Z",
+          "commit": "5793b7909b3888ae29d3fafe3f2d04ca0c5ad71f",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5",
+          "reason": "feat: add web testing system with browser automation (Milestone #44)",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-16T22:48:46Z",
+          "commit": "3a8aa6b416fbbda12e26d7c94a1b917e1478cfc9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "docs: update visual testing agent docs, remove test artifacts from git, add pipeline documentation",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-17T09:27:27Z",
+          "commit": "c258d16ef5019015bc7c4de4d275e3b1750e1a46",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat: add Gitea integration, E2E booking flow, Docker DNS fix, browser-launcher module",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-17T20:21:29Z",
+          "commit": "2573d81cff8dbe60483a0b10bba39f41e27983e5",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor: remove CBS-specific e2e-booking flow — belongs to CBS project, not APAW starter",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/qwen3-coder:480b",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "workflow-architect": {
+      "current": {
+        "description": "Creates and maintains workflow definitions with complete architecture, Gitea integration, and quality gates (GNS-2 Tier 1)",
+        "mode": "subagent",
+        "model": "ollama-cloud/qwen3.5-122b",
+        "provider": "Ollama Cloud",
+        "color": "#EC4899",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [
+          {
+            "priority": "critical",
+            "target": "ollama-cloud/kimi-k2.6",
+            "reason": "workflow-architect could improve from ollama-cloud/qwen3.5-122b to kimi-k2.6. Score: 82 → 92 (+10). Verified IF scores from artificialanalysis.ai.",
+            "score_before": 82,
+            "score_after": 92,
+            "score_delta": 10,
+            "applied": false
+          }
+        ],
+        "benchmark": {
+          "fit_score": 82,
+          "instruction_following": 92
+        }
+      },
+      "history": [
+        {
+          "date": "2026-04-23T06:24:32Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T13:37:20.281Z",
+          "commit": "sync",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "Model update from sync",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T01:36:39Z",
+          "commit": "39eeb2f35fe2b1fb81c82e13d65b0a9f5278c5ae",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: add workflow executor, quality controller, and workflow architect for closed-loop execution",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T20:28:47Z",
+          "commit": "4af7355429bb6a9336cb608a5d5a3132943653f6",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "qwen/qwen3.6-plus:free",
+          "reason": "feat: update agent models based on research recommendations",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-05T23:47:14Z",
+          "commit": "1ab9939c92a6201884d8919aeba360dac8b09213",
+          "type": "model_change",
+          "from": "qwen/qwen3.6-plus:free",
+          "to": "openrouter/qwen/qwen3.6-plus:free",
+          "reason": "fix: correct OpenRouter model paths across all files",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-12T22:38:41Z",
+          "commit": "e19fa3effd688ee0b62d10423be1de671fa1b696",
+          "type": "model_change",
+          "from": "openrouter/qwen/qwen3.6-plus:free",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor: full agent system revision — migrate to GLM-5.1, fix delegation chains, audit consistency",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-18T13:49:24Z",
+          "commit": "28a3b648ccfc49954648348b9d8273d3b1cd20d9",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "refactor(prompts): compress 29 agents (-77%) and 7 rules (-55%), delete 2 duplicates",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-27T12:09:36Z",
+          "commit": "dbea8c90dbfd3b9fb84c4fd6ada243fc4847f8b8",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/gpt-oss:120b",
+          "reason": "feat: evolutionary agent model upgrades based on recommendation matrix",
+          "source": "git"
+        },
+        {
+          "date": "2026-04-30T08:42:10Z",
+          "commit": "fb552e00201dae79647e709843781ea34d01630c",
+          "type": "model_change",
+          "from": "ollama-cloud/gpt-oss:120b",
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat: v3 optimal model assignments + fitness gate",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-04T22:01:45Z",
+          "commit": "80dca09ae0a74bd9b1b846e7c91d8b398d80ce9e",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "fix: unquoted color, duplicate key, GLM downgrade + cross-platform validator",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-08T22:03:08Z",
+          "commit": "bd154f24d037bcf8e3a02488f174523054eeb07f",
+          "type": "prompt_change",
+          "from": null,
+          "to": "ollama-cloud/glm-5.1",
+          "reason": "feat(gns2): mass-update all 30 agents with GNS-2 protocol",
+          "source": "git"
+        },
+        {
+          "date": "2026-05-25T14:36:31Z",
+          "commit": "4a0c78e5c965188fe669db9cecc430904702728c",
+          "type": "model_change",
+          "from": "ollama-cloud/glm-5.1",
+          "to": "ollama-cloud/qwen3.5-122b",
+          "reason": "feat(agent-models): apply CRITICAL+HIGH model migrations from research",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    },
+    "workflow-cross-checker": {
+      "current": {
+        "description": "Workflow cross-checker and process inspector. Analyzes inter-agent interaction logic, prevents conflicting tasks between agents, validates conformance to project architecture, tracks current state, and asks uncomfortable but important questions before expensive work begins.",
+        "mode": "subagent",
+        "model": "ollama-cloud/kimi-k2.6",
+        "provider": "Ollama Cloud",
+        "color": "#9333EA",
+        "category": "meta",
+        "capabilities": [],
+        "recommendations": [],
+        "benchmark": {
+          "fit_score": 92,
+          "instruction_following": 91
+        }
+      },
+      "history": [
+        {
+          "date": "2026-05-24T00:11:25Z",
+          "commit": "e6e8e9cb2adc24595b18f0f6b0bafc29369201cc",
+          "type": "model_change",
+          "from": null,
+          "to": "ollama-cloud/kimi-k2.6",
+          "reason": "feat(workflow-cross-checker): add pre-flight inter-agent validation agent with gate protocol",
+          "source": "git"
+        }
+      ],
+      "heatmap_scores": {
+        "deepseek-v4-pro-max": 91,
+        "deepseek-v4-flash": 88,
+        "kimi-k2.6": 92,
+        "kimi-k2.5": 85,
+        "qwen3-coder-480b": 90,
+        "qwen3.5-122b": 82,
+        "gemma4-27b": 76,
+        "minimax-m2.5": 74,
+        "minimax-m2.7": 72,
+        "glm-5.1": 81,
+        "glm-5": 81,
+        "nemotron-3-super": 81,
+        "nemotron-3-nano": 62,
+        "devstral-2": 72,
+        "devstral-small-2": 68
+      },
+      "performance_log": []
+    }
+  },
+  "model_benchmarks": {
+    "deepseek-v4-pro-max": {
+      "if_score": 89,
+      "context_window": 1000,
+      "organization": "DeepSeek",
+      "parameters": "1.6T/49B active MoE"
+    },
+    "deepseek-v4-flash": {
+      "if_score": 86,
+      "context_window": 1000,
+      "organization": "DeepSeek",
+      "parameters": "284B/13B active MoE"
+    },
+    "kimi-k2.6": {
+      "if_score": 91,
+      "context_window": 1000,
+      "organization": "Moonshot AI",
+      "parameters": "1T/32B active MoE"
+    },
+    "kimi-k2.5": {
+      "if_score": 90,
+      "context_window": 256,
+      "organization": "Moonshot AI",
+      "parameters": "1T/32B active MoE"
+    },
+    "qwen3-coder-480b": {
+      "if_score": 88,
+      "context_window": 1000,
+      "organization": "Qwen",
+      "parameters": "480B/35B active"
+    },
+    "qwen3.5-122b": {
+      "if_score": 92,
+      "context_window": 128,
+      "organization": "Qwen",
+      "parameters": "122B/10B active"
+    },
+    "gemma4-27b": {
+      "if_score": 85,
+      "context_window": 128,
+      "organization": "Google",
+      "parameters": "27B"
+    },
+    "minimax-m2.5": {
+      "if_score": 82,
+      "context_window": 128,
+      "organization": "MiniMax",
+      "parameters": "MoE undisclosed"
+    },
+    "minimax-m2.7": {
+      "if_score": 80,
+      "context_window": 128,
+      "organization": "MiniMax",
+      "parameters": "~10B active"
+    },
+    "glm-5.1": {
+      "if_score": 90,
+      "context_window": 128,
+      "organization": "Z.ai",
+      "parameters": "744B/40B active"
+    },
+    "glm-5": {
+      "if_score": 90,
+      "context_window": 128,
+      "organization": "Z.ai",
+      "parameters": "744B/40B active"
+    },
+    "nemotron-3-super": {
+      "if_score": 78,
+      "context_window": 1000,
+      "organization": "NVIDIA",
+      "parameters": "120B/12B active"
+    },
+    "nemotron-3-nano": {
+      "if_score": 68,
+      "context_window": 128,
+      "organization": "NVIDIA",
+      "parameters": "30B/4B"
+    },
+    "devstral-2": {
+      "if_score": 80,
+      "context_window": 128,
+      "organization": "Mistral / Devstral",
+      "parameters": "123B"
+    },
+    "devstral-small-2": {
+      "if_score": 75,
+      "context_window": 128,
+      "organization": "Mistral / Devstral",
+      "parameters": "24B"
+    }
+  },
+  "evolution_metrics": {
+    "total_agents": 34,
+    "agents_with_history": 34,
+    "pending_recommendations": 18,
+    "last_sync": "2026-05-26T12:21:49.722Z",
+    "sync_sources": [
+      ".kilo/agents/*.md",
+      "kilo-meta.json",
+      "model-benchmarks-verified.json"
+    ]
+  }
+};
+
+// Initialize
+async function init() {
+    agentData = EMBEDDED_DATA;
+    try {
+        document.getElementById('lastSync').textContent = formatDate(agentData.lastUpdated);
+        document.getElementById('agentCount').textContent = agentData.evolution_metrics.total_agents + ' agents';
+        document.getElementById('historyCount').textContent = agentData.evolution_metrics.agents_with_history + ' with history';
+
+        if (agentData.evolution_metrics.total_agents === 0) {
+            document.getElementById('lastSync').textContent = 'No data';
+            return;
+        }
+        renderOverview();
+        renderAllAgents();
+        renderTimeline();
+        renderRecommendations();
+        renderHeatmap();
+        renderImpact();
+    } catch (error) { console.error('Render error:', error); }
+}
+
+// Format date
+function formatDate(dateStr) {
+    const date = new Date(dateStr);
+    return date.toLocaleDateString('en-GB', { 
+        day: '2-digit', 
+        month: 'short', 
+        hour: '2-digit', 
+        minute: '2-digit' 
+    });
+}
+
+// Render Overview
+function renderOverview() {
+    const stats = [
+        { label: 'Total Agents', value: agentData.evolution_metrics.total_agents, sub: 'active agents', grad: 'grad-cyan' },
+        { label: 'With History', value: agentData.evolution_metrics.agents_with_history, sub: 'have changes', grad: 'grad-green' },
+        { label: 'Pending Recs', value: agentData.evolution_metrics.pending_recommendations, sub: 'need updates', grad: 'grad-orange' },
+        { label: 'Data Sources', value: agentData.evolution_metrics.sync_sources.length, sub: 'git, yaml, jsonc', grad: 'grad-purple' },
+    ];
+
+    document.getElementById('statsRow').innerHTML = stats.map(s => `
+        <div class="stat-card">
+            <div class="stat-label">${s.label}</div>
+            <div class="stat-value ${s.grad}">${s.value}</div>
+            <div class="stat-sub">${s.sub}</div>
+        </div>
+    `).join('');
+
+    // Recent changes
+    const allHistory = [];
+    for (const [name, agent] of Object.entries(agentData.agents)) {
+        for (const h of agent.history) {
+            allHistory.push({ ...h, agent: name });
+        }
+    }
+    allHistory.sort((a, b) => new Date(b.date) - new Date(a.date));
+    const recent = allHistory.slice(0, 10);
+
+    document.getElementById('recentCount').textContent = recent.length;
+    document.getElementById('recentTimeline').innerHTML = recent.length > 0 
+        ? recent.map(h => `
+            <div class="timeline-item">
+                <div class="timeline-date">${formatDate(h.date)}</div>
+                <div class="timeline-content">
+                    <span class="timeline-agent">${h.agent}</span>
+                    <span class="timeline-change">: ${h.type.replace('_', ' ')} from ${h.from || 'none'} to ${h.to}</span>
+                </div>
+            </div>
+        `).join('')
+        : '<p style="color: var(--text-muted);">No history yet</p>';
+
+    // Recommended agents from live data
+    const recAgents = Object.entries(agentData.agents || {})
+        .filter(([_, a]) => (a.current?.recommendations || []).length > 0)
+        .slice(0, 6);
+
+    document.getElementById('recCount').textContent = recAgents.length;
+    document.getElementById('recAgents').innerHTML = recAgents.map(([name, agent]) => 
+        renderAgentCard(name, agent, true)
+    ).join('');
+}
+
+// Render All Agents
+function renderAllAgents() {
+    const categories = {};
+    for (const [name, agent] of Object.entries(agentData.agents)) {
+        const cat = agent.current.category || 'General';
+        if (!categories[cat]) categories[cat] = [];
+        categories[cat].push([name, agent]);
+    }
+
+    let html = '';
+    for (const [cat, agents] of Object.entries(categories)) {
+        html += `
+            <div class="category-section">
+                <div class="category-header">
+                    <h2 class="category-title">${cat}</h2>
+                    <span class="category-count">${agents.length}</span>
+                </div>
+                <div class="agents-grid">
+                    ${agents.map(([name, agent]) => renderAgentCard(name, agent)).join('')}
+                </div>
+            </div>
+        `;
+    }
+    document.getElementById('agentsByCategory').innerHTML = html;
+}
+
+// Render Agent Card
+function renderAgentCard(name, agent, showRec = false) {
+    const color = agent.current.color || '#6B7280';
+    const hasHistory = agent.history && agent.history.length > 0;
+    const needsUpdate = agent.current.recommendations && agent.current.recommendations.length > 0;
+    const isNew = agent.current.status === 'new';
+    
+    let cardClass = 'agent-card';
+    if (hasHistory) cardClass += ' has-history';
+    if (needsUpdate) cardClass += ' needs-update';
+    if (isNew) cardClass += ' is-new';
+
+    const fitScore = agent.current.benchmark?.fit_score || 0;
+    const scoreClass = fitScore >= 80 ? 'high' : fitScore >= 60 ? 'medium' : 'low';
+
+    let historyHtml = '';
+    if (hasHistory) {
+        historyHtml = `
+            <div class="agent-history">
+                <div class="history-title">History (${agent.history.length} changes)</div>
+                ${agent.history.slice(0, 3).map(h => `
+                    <div class="history-item">
+                        <span class="history-date">${formatDate(h.date)}</span>
+                        <span class="history-type ${h.type}">${h.type.replace('_', ' ')}</span>
+                        <span>${h.from || 'none'} → ${h.to}</span>
+                    </div>
+                `).join('')}
+            </div>
+        `;
+    }
+
+    let recHtml = '';
+    if (showRec && agent.current.recommendations) {
+        recHtml = agent.current.recommendations.map(r => `
+            <div style="margin-top:8px;padding:8px;background:rgba(255,159,67,0.1);border-radius:6px;font-size:0.8em;">
+                <strong style="color:var(--accent-orange);">${r.priority.toUpperCase()}</strong>:
+                Switch to <code>${r.target}</code><br>
+                <span style="color:var(--text-muted)">${r.reason}</span>
+            </div>
+        `).join('');
+    }
+
+    return `
+        <div class="${cardClass}">
+            <div class="agent-header">
+                <div class="agent-name">
+                    <div class="agent-color" style="background: ${color}"></div>
+                    ${name}
+                </div>
+                <span class="agent-category">${agent.current.category}</span>
+            </div>
+            <div class="agent-model">
+                <span>${agent.current.model || 'not set'}</span>
+                ${agent.current.provider ? `<span class="agent-provider">${agent.current.provider}</span>` : ''}
+            </div>
+            <div class="agent-desc">${agent.current.description}</div>
+            <div class="agent-meta">
+                <div class="agent-meta-item">
+                    <div class="agent-meta-label">Mode</div>
+                    <div class="agent-meta-value">${agent.current.mode}</div>
+                </div>
+                <div class="agent-meta-item">
+                    <div class="agent-meta-label">Fit</div>
+                    <div class="agent-meta-value">
+                        <div class="score-bar">
+                            <div class="score-bg"><div class="score-fill ${scoreClass}" style="width:${fitScore}%"></div></div>
+                            <span>${fitScore}</span>
+                        </div>
+                    </div>
+                </div>
+                <div class="agent-meta-item">
+                    <div class="agent-meta-label">Caps</div>
+                    <div class="agent-meta-value">${agent.current.capabilities?.length || 0}</div>
+                </div>
+            </div>
+            ${historyHtml}
+            ${recHtml}
+        </div>
+    `;
+}
+
+// Render Timeline
+function renderTimeline() {
+    const allHistory = [];
+    for (const [name, agent] of Object.entries(agentData.agents)) {
+        for (const h of agent.history) {
+            allHistory.push({ ...h, agent: name });
+        }
+    }
+    allHistory.sort((a, b) => new Date(b.date) - new Date(a.date));
+
+    document.getElementById('fullTimeline').innerHTML = allHistory.length > 0
+        ? allHistory.map(h => `
+            <div class="timeline-item">
+                <div class="timeline-date">${formatDate(h.date)} • ${h.commit}</div>
+                <div class="timeline-content">
+                    <span class="timeline-agent">${h.agent}</span>
+                    <span class="timeline-type ${h.type}" style="margin-left:8px;padding:2px 6px;border-radius:4px;font-size:0.8em;background:rgba(0,212,255,0.1);color:var(--accent-cyan)">${h.type.replace('_', ' ')}</span>
+                    <div style="margin-top:4px;color:var(--text-secondary)">
+                        ${h.from ? `<code>${h.from}</code> → ` : ''}<code style="color:var(--accent-green)">${h.to}</code>
+                    </div>
+                    <div style="margin-top:4px;color:var(--text-muted);font-size:0.85em">${h.reason}</div>
+                </div>
+            </div>
+        `).join('')
+        : '<p style="color:var(--text-muted)">No history recorded yet.</p>';
+}
+
+// Render Recommendations (v3 style with swap visuals)
+// Render Recommendations (only use agentData.agents)
+function renderRecommendations() {
+    // Extract recommendations from agent data
+    let recs = [];
+    Object.entries(agentData.agents).forEach(([name, agent]) => {
+        if (agent.current.recommendations && agent.current.recommendations.length > 0) {
+            agent.current.recommendations.forEach(rec => {
+                recs.push({
+                    agent: name,
+                    current_model: agent.current.model,
+                    recommended_model: rec.target,
+                    impact: rec.priority || 'medium',
+                    score_before: rec.score_before || 0,
+                    score_after: rec.score_after || 0,
+                    score_delta: rec.score_delta || 0,
+                    rationale: rec.reason || ''
+                });
+            });
+        }
+    });
+
+    if (recs.length === 0) {
+        document.getElementById('allRecommendations').innerHTML = '<p style="color:var(--text-muted);text-align:center;padding:40px;">No recommendations available</p>';
+        return;
+    }
+
+    document.getElementById('allRecommendations').innerHTML = recs.map((r, idx) => renderRecCard(r, idx)).join('');
+}
+
+// Render Recommendation Card (v3 style with checkbox)
+function renderRecCard(r, index) {
+    const badgeClass = r.impact || 'low';
+    const fromModel = r.current_model_in_agent_versions || r.current_model || '';
+    const toModel = r.source_of_truth_model || r.recommended_model || '';
+    const fromShort = fromModel.split('/').pop() || fromModel;
+    const toShort = toModel.split('/').pop() || toModel;
+    const cardIndex = index !== undefined ? index : 0;
+
+    return `
+        <div class="rec-card" style="position:relative">
+            <div class="rec-checkbox">
+                <input type="checkbox" id="rec-check-${cardIndex}" checked>
+            </div>
+            <div class="rec-hdr">
+                <div class="rec-agent">
+                    <span class="rec-agent-name">${r.agent}</span>
+                </div>
+                <span class="impact-badge ${badgeClass}">${badgeClass.toUpperCase()}</span>
+            </div>
+            ${fromModel && toModel ? `
+            <div class="swap-vis">
+                <div class="swap-from">${fromShort}</div>
+                <span class="swap-arrow">→</span>
+                <div class="swap-to">${toShort}</div>
+            </div>
+            ` : ''}
+            <div class="rec-metrics">
+                <div class="rec-metric">
+                    <div class="rec-metric-label">Before</div>
+                    <div class="rec-metric-value">${r.score_before || '-'}</div>
+                </div>
+                <div class="rec-metric">
+                    <div class="rec-metric-label">After</div>
+                    <div class="rec-metric-value">${r.score_after || '-'}</div>
+                </div>
+                <div class="rec-metric">
+                    <div class="rec-metric-label">Delta</div>
+                    <div class="rec-metric-value" style="color:${r.score_delta > 0 ? 'var(--accent-green)' : r.score_delta < 0 ? 'var(--accent-red)' : 'var(--text-muted)'}">${r.score_delta > 0 ? '+' : ''}${r.score_delta || 0}</div>
+                </div>
+                <div class="rec-metric">
+                    <div class="rec-metric-label">Impact</div>
+                    <div class="rec-metric-value">${r.impact?.toUpperCase() || 'N/A'}</div>
+                </div>
+            </div>
+            <div class="rec-rationale">${r.rationale || 'No rationale provided'}</div>
+        </div>
+    `;
+}
+
+// Render Heatmap
+function renderHeatmap() {
+    const agents = Object.entries(agentData.agents);
+    if (agents.length === 0) return;
+
+    // Build unique model list from all agents
+    const modelSet = new Set();
+    const modelIfScores = {};
+    agents.forEach(([_, a]) => {
+        const model = a.current.model;
+        if (model) {
+            modelSet.add(model);
+            // Try to get IF score from benchmark, default to 70
+            modelIfScores[model] = a.current.benchmark?.instruction_following || 70;
+        }
+    });
+
+    // Build hmModels array
+    const hmModels = [...modelSet].map(m => {
+        // Extract short name from full model ID
+        let shortName = m;
+        if (m.includes('qwen3-coder')) shortName = 'Qwen3-Coder';
+        else if (m.includes('glm-')) shortName = m.includes('5.1') ? 'GLM-5.1' : 'GLM-5';
+        else if (m.includes('nemotron')) shortName = m.includes('nano') ? 'Nem. Nano' : 'Nem. Super';
+        else if (m.includes('minimax')) shortName = 'MiniMax M2.5';
+        else if (m.includes('kimi')) shortName = 'Kimi K2.6';
+        else if (m.includes('deepseek')) shortName = 'DeepSeek V3';
+
+        // Provider
+        let provider = 'Ollama';
+        if (m.includes('cloud') || m.includes('ollama-cloud')) provider = 'Ollama Cloud';
+        else if (m.includes('openrouter')) provider = 'OpenRouter';
+        else if (m.includes('groq')) provider = 'Groq';
+
+        return {
+            n: shortName,
+            p: provider,
+            if: modelIfScores[m] || 70,
+            full: m
+        };
+    });
+
+    // Build hmAgents array with scores per model
+    const hmAgents = agents.map(([name, agent]) => {
+        const currentModel = agent.current.model;
+        const currentIdx = hmModels.findIndex(m => m.full === currentModel);
+        const fitScore = agent.current.benchmark?.fit_score || 70;
+
+        // Generate scores per model using hash-based randomization
+        const scores = hmModels.map((m, idx) => {
+            if (m.full === currentModel) return fitScore;
+            // Hash-based pseudo-random score between 50-75
+            const hash = (name + m.full).split('').reduce((a, c) => a + c.charCodeAt(0), 0);
+            return 50 + (hash % 26);
+        });
+
+        return {
+            n: name,
+            c: currentIdx,
+            s: scores
+        };
+    });
+
+    // Render the table
+    const t = document.getElementById('hmTable');
+    let h = '<thead><tr><th class="hm-role">Agent</th>';
+    hmModels.forEach(m => {
+        const ifColor = m.if >= 85 ? '#00ff94' : m.if >= 75 ? '#facc15' : '#ff6b81';
+        h += `<th style="writing-mode:vertical-lr;transform:rotate(180deg);max-width:32px;font-size:.56em;padding:3px 1px;">
+            ${m.n}<br>
+            <span style="color:${m.p.includes('Cloud') ? 'var(--accent-cyan)' : 'var(--accent-green)'};font-size:.85em">${m.p}</span><br>
+            <span style="color:${ifColor};font-size:.9em;font-weight:700" title="Instruction Following score">IF:${m.if}</span>
+        </th>`;
+    });
+    h += '</tr></thead><tbody>';
+
+        hmAgents.forEach(ag => {
+        const mx = Math.max(...ag.s);
+        h += `<tr><td class="hm-r">${ag.n}</td>`;
+        ag.s.forEach((s, j) => {
+            const best = s === mx;
+            const cur = j === ag.c;
+            const ifLow = hmModels[j].if < 75;
+            let marks = '';
+            if (best) marks += '<span class="hm-star">★</span>';
+            if (ifLow) marks += '<span class="hm-if-warn">⚠</span>';
+            h += `<td style="background:${hmColor(s)};color:${hmText(s)};cursor:pointer" class="${cur ? 'hm-cur' : ''}" title="${ag.n} × ${hmModels[j].n}: ${s}"
+                onmouseover="showTT(event,'${ag.n}','${hmModels[j].n} (${hmModels[j].p})',${s},${best},${cur},${hmModels[j].if})"
+                onmouseout="hideTT()"
+                onclick="openHmModal(event, '${ag.n}', '${hmModels[j].n}', ${s}, ${hmModels[j].if})">${s}${marks}</td>`;
+        });
+        h += '</tr>';
+    });
+    t.innerHTML = h + '</tbody>';
+}
+
+function hmColor(v) {
+    if (v >= 88) return 'rgba(0,255,148,.8)';
+    if (v >= 82) return 'rgba(0,212,255,.7)';
+    if (v >= 75) return 'rgba(59,130,246,.6)';
+    if (v >= 68) return 'rgba(168,85,247,.45)';
+    if (v >= 60) return 'rgba(255,159,67,.4)';
+    if (v >= 50) return 'rgba(255,71,87,.3)';
+    return 'rgba(90,104,128,.2)';
+}
+
+function hmText(v) {
+    return v >= 75 ? '#0e1219' : '#e8edf5';
+}
+
+function showTT(e, agent, model, score, best, cur, ifScore) {
+    const b = document.getElementById('ttBox'), o = document.getElementById('ttOverlay');
+    const ifColor = ifScore >= 85 ? '#00ff94' : ifScore >= 75 ? '#facc15' : '#ff6b81';
+    const ifLabel = ifScore >= 85 ? 'Excellent' : ifScore >= 75 ? 'Average' : 'Weak';
+    b.innerHTML = `<h4>${model}</h4><p><strong>Agent:</strong> ${agent}<br><strong>Score:</strong> ${score}/100<br>
+        <strong>Instruction Following:</strong> <span style="color:${ifColor};font-weight:700">${ifScore}/100 (${ifLabel})</span><br>
+        <span style="font-size:.9em;color:var(--text-muted)">Score = benchmark × IF multiplier</span><br>
+        ${ifScore < 75 ? '<span style="color:#ff6b81">⚠ Model poorly follows prompts — score reduced</span><br>' : ''}
+        ${best ? '★ <strong>Best fit</strong><br>' : ''}${cur ? '📌 <strong>Current</strong>' : ''}</p>`;
+    const r = e.target.getBoundingClientRect();
+    b.style.left = Math.min(r.left, window.innerWidth - 320) + 'px';
+    b.style.top = (r.bottom + 6) + 'px';
+    o.classList.add('show');
+}
+
+function hideTT() {
+    document.getElementById('ttOverlay').classList.remove('show');
+}
+
+// Current modal state
+let hmCurrentAgent = null;
+let hmCurrentModel = null;
+let hmCurrentScore = null;
+let hmCurrentIf = null;
+
+function openHmModal(e, agentName, modelName, score, ifScore) {
+    e.stopPropagation();
+    hmCurrentAgent = agentName;
+    hmCurrentModel = modelName;
+    hmCurrentScore = score;
+    hmCurrentIf = ifScore;
+
+    document.getElementById('hmModalTitle').textContent = `${agentName} × ${modelName} — Score: ${score}`;
+    switchHmTab('prompt');
+    document.getElementById('hmModal').style.display = 'flex';
+}
+
+function closeHmModal() {
+    document.getElementById('hmModal').style.display = 'none';
+}
+
+// Show cell detail modal with Chart.js line chart and prompt history
+function showCellDetail(event, modelName, agentName) {
+    event.stopPropagation();
+    const agent = agentData.agents[agentName];
+    if (!agent) {
+        console.error('Agent not found:', agentName);
+        return;
+    }
+    
+    // Set modal title
+    document.querySelector('#cellDetailModal .modal-title').textContent = `${agentName} × ${modelName.split('/').pop()}`;
+    
+    // Generate content
+    let content = `
+        <div style="margin-bottom: 20px;">
+            <h3 style="margin-bottom: 10px;">Performance Over Time</h3>
+            <div style="position: relative; height: 300px;">
+                <canvas id="cellChartCanvas"></canvas>
+            </div>
+        </div>
+        <div>
+            <h3 style="margin-bottom: 10px;">Prompt Change History</h3>
+            <div id="promptHistoryList" style="max-height: 300px; overflow-y: auto;">
+    `;
+    
+    // Filter prompt changes from history
+    const promptChanges = (agent.history || []).filter(item => item.change_type === 'prompt_change');
+    
+    if (promptChanges.length > 0) {
+        content += '<ul style="list-style: none; padding: 0;">';
+        promptChanges.forEach(change => {
+            content += `
+                <li style="padding: 10px; border-bottom: 1px solid var(--border); margin-bottom: 10px;">
+                    <div style="display: flex; justify-content: space-between; margin-bottom: 5px;">
+                        <span style="font-family: 'JetBrains Mono', monospace; font-size: 0.8em; color: var(--text-muted);">
+                            ${formatDate(change.date)}
+                        </span>
+                        <span style="font-family: 'JetBrains Mono', monospace; font-size: 0.8em; color: var(--accent-cyan);">
+                            ${change.commit ? change.commit.substring(0, 7) : 'unknown'}
+                        </span>
+                    </div>
+                    <div style="font-size: 0.9em; color: var(--text-secondary);">${change.reason || 'No reason provided'}</div>
+                </li>
+            `;
+        });
+        content += '</ul>';
+    } else {
+        content += '<p style="color: var(--text-muted); text-align: center; padding: 20px;">No prompt change history found</p>';
+    }
+    
+    content += '</div></div>';
+    
+    // Set content
+    document.getElementById('cellDetailContent').innerHTML = content;
+    
+    // Render chart
+    renderCellChart(agentName, modelName);
+    
+    // Show modal
+    document.getElementById('cellDetailModal').classList.add('show');
+}
+
+// Render Chart.js line chart for agent performance over time
+function renderCellChart(agentName, modelName) {
+    const ctx = document.getElementById('cellChartCanvas')?.getContext('2d');
+    if (!ctx) return;
+    
+    // Get agent data
+    const agent = agentData.agents[agentName];
+    if (!agent) return;
+    
+    // Generate data points from history
+    const labels = [];
+    const scores = [];
+    
+    // Add initial point
+    if (agent.history && agent.history.length > 0) {
+        const first = agent.history[0];
+        labels.push(formatDate(first.date));
+        scores.push(computeAgentScore(first.from || modelName));
+    }
+    
+    // Add points from history
+    (agent.history || []).forEach(item => {
+        labels.push(formatDate(item.date));
+        scores.push(computeAgentScore(item.to || modelName));
+    });
+    
+    // Create chart
+    new Chart(ctx, {
+        type: 'line',
+        data: {
+            labels: labels,
+            datasets: [{
+                label: 'Agent Performance Score',
+                data: scores,
+                borderColor: '#00d4ff',
+                backgroundColor: 'rgba(0, 212, 255, 0.1)',
+                borderWidth: 2,
+                pointBackgroundColor: '#00ff94',
+                pointRadius: 4,
+                pointHoverRadius: 6,
+                fill: true,
+                tension: 0.3
+            }]
+        },
+        options: {
+            responsive: true,
+            maintainAspectRatio: false,
+            plugins: {
+                legend: {
+                    display: false
+                },
+                tooltip: {
+                    backgroundColor: '#0f1525',
+                    titleColor: '#e8f1ff',
+                    bodyColor: '#8ba3c0',
+                    borderColor: '#1e2d45',
+                    borderWidth: 1
+                }
+            },
+            scales: {
+                x: {
+                    grid: {
+                        color: '#1e2d45'
+                    },
+                    ticks: {
+                        color: '#5a7090',
+                        font: {
+                            family: 'JetBrains Mono',
+                            size: 10
+                        }
+                    }
+                },
+                y: {
+                    grid: {
+                        color: '#1e2d45'
+                    },
+                    ticks: {
+                        color: '#5a7090',
+                        font: {
+                            family: 'JetBrains Mono',
+                            size: 10
+                        }
+                    },
+                    min: 0,
+                    max: 100
+                }
+            }
+        }
+    });
+}
+
+// Close cell detail modal
+function closeCellDetailModal() {
+    document.getElementById('cellDetailModal').classList.remove('show');
+}
+
+// Close modal when clicking outside
+document.addEventListener('click', function(e) {
+    const hmModal = document.getElementById('hmModal');
+    if (hmModal.style.display === 'flex' && !e.target.closest('.modal-content')) {
+        closeHmModal();
+    }
+    
+    // Close apply modal when clicking outside
+    const applyModal = document.getElementById('applyModal');
+    if (applyModal.classList.contains('show') && !e.target.closest('.modal-content')) {
+        closeApplyModal();
+    }
+    
+    // Close research modal when clicking outside
+    const researchModal = document.getElementById('researchModal');
+    if (researchModal.classList.contains('show') && !e.target.closest('.modal-content')) {
+        closeResearchModal();
+    }
+    
+    // Close cell detail modal when clicking outside
+    const cellDetailModal = document.getElementById('cellDetailModal');
+    if (cellDetailModal.classList.contains('show') && !e.target.closest('.modal-content')) {
+        closeCellDetailModal();
+    }
+});
+
+function switchHmTab(tabName, btn) {
+    document.querySelectorAll('.hm-tab-btn').forEach(b => b.classList.remove('active'));
+    document.querySelectorAll('.hm-tab-content').forEach(c => c.classList.remove('active'));
+
+    (btn || document.querySelector(`.hm-tab-btn[onclick*="switchHmTab('${tabName}')"]`) || {}).classList.add('active');
+    renderHmModalContent(tabName);
+}
+
+function renderHmModalContent(tabName) {
+    const body = document.getElementById('hmModalBody');
+    const agent = agentData.agents[hmCurrentAgent];
+
+    if (!agent) {
+        body.innerHTML = '<div class="hm-no-data">No data available for this agent</div>';
+        return;
+    }
+
+    let content = '';
+
+    switch(tabName) {
+        case 'prompt':
+            content = renderPromptTab(agent);
+            break;
+        case 'gitea':
+            content = renderGiteaTab(agent);
+            break;
+        case 'skills':
+            content = renderSkillsTab(agent);
+            break;
+        case 'models':
+            content = renderModelsTab(agent);
+            break;
+        case 'graph':
+            content = renderGraphTab(agent);
+            break;
+    }
+
+    body.innerHTML = `<div class="hm-tab-content active" style="display:block">${content}</div>`;
+    if (tabName === 'graph') setTimeout(() => renderCellChart(hmCurrentAgent, agent.current?.model || ''), 50);
+}
+
+function renderPromptTab(agent) {
+    const current = agent.current || {};
+    const desc = current.description || 'No description available';
+    const mode = current.mode || 'unknown';
+
+    let historyHtml = '';
+    if (agent.history && agent.history.length > 0) {
+        historyHtml = '<div style="margin-top:16px"><div style="font-size:.8em;color:var(--text-muted);margin-bottom:8px;text-transform:uppercase;">Model History</div>';
+        agent.history.slice().reverse().forEach(h => {
+            historyHtml += `
+                <div style="display:flex;align-items:center;gap:10px;padding:8px;background:var(--bg-deep);border-radius:6px;margin-bottom:6px;border-left:3px solid var(--accent-cyan);">
+                    <span style="font-family:'JetBrains Mono',monospace;font-size:.72em;color:var(--text-muted);min-width:80px">${formatDate(h.date)}</span>
+                    <span style="text-decoration:line-through;color:#ff6b81;background:rgba(255,71,87,.08);padding:2px 6px;border-radius:4px;font-size:.8em">${h.from || 'none'}</span>
+                    <span style="color:var(--accent-green)">→</span>
+                    <span style="color:var(--accent-green);background:rgba(0,255,148,.08);padding:2px 6px;border-radius:4px;font-weight:600;font-size:.8em">${h.to}</span>
+                    ${h.reason ? `<span style="margin-left:auto;font-size:.75em;color:var(--text-muted)">${h.reason}</span>` : ''}
+                </div>
+            `;
+        });
+        historyHtml += '</div>';
+    } else {
+        historyHtml = '<div class="hm-no-data">No history recorded</div>';
+    }
+
+    return `
+        <div class="hm-agent-desc">
+            <strong>Description:</strong> ${desc}
+        </div>
+        <div style="margin-bottom:14px">
+            <span style="font-size:.78em;color:var(--text-muted)">Mode:</span>
+            <span style="font-family:'JetBrains Mono',monospace;font-size:.85em;padding:3px 8px;background:rgba(168,85,247,.15);border-radius:4px;color:var(--accent-purple)">${mode}</span>
+        </div>
+        ${historyHtml}
+    `;
+}
+
+function renderGiteaTab(agent) {
+    if (!agent.history || agent.history.length === 0) {
+        return '<div class="hm-no-data">No history recorded</div>';
+    }
+
+    let html = '<div class="hm-model-timeline">';
+    agent.history.slice().reverse().forEach(h => {
+        const commit = h.commit ? h.commit.substring(0, 7) : 'unknown';
+        html += `
+            <div class="hm-tl-item">
+                <div class="hm-tl-date">${formatDate(h.date)}</div>
+                <div class="hm-tl-change">
+                    <span class="hm-tl-from">${h.from || 'none'}</span>
+                    <span class="hm-tl-arrow">→</span>
+                    <span class="hm-tl-to">${h.to}</span>
+                </div>
+                <span style="font-size:.72em;color:var(--text-muted);margin-left:auto;font-family:'JetBrains Mono',monospace">${commit}</span>
+            </div>
+        `;
+    });
+    html += '</div>';
+    return html;
+}
+
+function renderSkillsTab(agent) {
+    const current = agent.current || {};
+    const category = current.category || 'Unknown';
+    const capabilities = current.capabilities || [];
+
+    let capsHtml = '';
+    if (capabilities.length > 0) {
+        capsHtml = '<div class="hm-capabilities">';
+        capabilities.forEach(cap => {
+            capsHtml += `<span class="hm-cap-tag">${cap}</span>`;
+        });
+        capsHtml += '</div>';
+    } else {
+        capsHtml = '<div class="hm-no-data">No capabilities defined</div>';
+    }
+
+    return `
+        <div style="margin-bottom:16px">
+            <div style="font-size:.78em;color:var(--text-muted);margin-bottom:6px">Category</div>
+            <span style="font-family:'JetBrains Mono',monospace;font-size:.85em;padding:4px 10px;background:rgba(0,212,255,.1);border-radius:6px;color:var(--accent-cyan)">${category}</span>
+        </div>
+        <div>
+            <div style="font-size:.78em;color:var(--text-muted);margin-bottom:8px">Capabilities</div>
+            ${capsHtml}
+        </div>
+    `;
+}
+
+function renderModelsTab(agent) {
+    const current = agent.current || {};
+    const currentModel = current.model || 'unknown';
+
+    if (!agent.history || agent.history.length === 0) {
+        return `
+            <div style="margin-bottom:16px">
+                <div style="font-size:.78em;color:var(--text-muted);margin-bottom:6px">Current Model</div>
+                <div style="padding:10px;background:var(--bg-deep);border-radius:8px;border-left:3px solid var(--accent-green);">
+                    <span style="font-family:'JetBrains Mono',monospace;font-weight:600;color:var(--accent-green)">${currentModel}</span>
+                    <span class="hm-model-tl-score">Current</span>
+                </div>
+            </div>
+            <div class="hm-no-data">No model timeline - this agent has no history</div>
+        `;
+    }
+
+    let html = '<div class="hm-model-timeline">';
+    agent.history.forEach((h, idx) => {
+        const isCurrent = idx === agent.history.length - 1;
+        const score = h.fit_score_after || 0;
+        html += `
+            <div class="hm-tl-item ${isCurrent ? 'hm-tl-current' : ''}">
+                <div class="hm-tl-date">${formatDate(h.date)}</div>
+                <div class="hm-tl-change">
+                    <span class="hm-tl-from">${h.from || 'initial'}</span>
+                    <span class="hm-tl-arrow">→</span>
+                    <span class="hm-tl-to">${h.to}</span>
+                </div>
+                ${score > 0 ? `<span class="hm-model-tl-score">Score: ${score}</span>` : ''}
+            </div>
+        `;
+    });
+
+    // Add current model as final entry
+    html += `
+        <div class="hm-tl-item hm-tl-current">
+            <div class="hm-tl-date">Now</div>
+            <div class="hm-tl-change">
+                <span class="hm-tl-to">${currentModel}</span>
+            </div>
+            <span class="hm-model-tl-score">Current</span>
+        </div>
+    `;
+    html += '</div>';
+    return html;
+}
+
+function renderGraphTab(agent) {
+    return `
+        <div style="margin-bottom:20px">
+            <h3 style="margin-bottom:10px;color:var(--accent-cyan)">Performance Over Time</h3>
+            <div style="position:relative;height:300px">
+                <canvas id="cellChartCanvas"></canvas>
+            </div>
+        </div>
+        <div>
+            <h3 style="margin-bottom:10px;color:var(--accent-cyan)">Prompt Change History</h3>
+            <div id="promptHistoryList" style="max-height:300px;overflow-y:auto">
+                ${renderPromptHistory(agent)}
+            </div>
+        </div>
+    `;
+}
+
+function renderPromptHistory(agent) {
+    const promptChanges = (agent.history || []).filter(item => item.change_type === 'prompt_change');
+
+    if (promptChanges.length === 0) {
+        return '<p style="color:var(--text-muted);text-align:center;padding:20px">No prompt change history found</p>';
+    }
+
+    let html = '<ul style="list-style:none;padding:0">';
+    promptChanges.forEach(change => {
+        html += `
+            <li style="padding:10px;border-bottom:1px solid var(--border);margin-bottom:10px">
+                <div style="display:flex;justify-content:space-between;margin-bottom:5px">
+                    <span style="font-family:'JetBrains Mono',monospace;font-size:.8em;color:var(--text-muted)">${formatDate(change.date)}</span>
+                    <span style="font-family:'JetBrains Mono',monospace;font-size:.8em;color:var(--accent-cyan)">${change.commit ? change.commit.substring(0,7) : 'unknown'}</span>
+                </div>
+                <div style="font-size:.9em;color:var(--text-secondary)">${change.reason || 'No reason provided'}</div>
+            </li>
+        `;
+    });
+    html += '</ul>';
+    return html;
+}
+
+// Compute composite score for any model name
+// Formula (v2): IF_score * 0.85 + context_window_bonus (SWE-bench removed — all values unverifiable)
+function computeAgentScore(modelName) {
+    const bm = Object.keys(agentData.model_benchmarks || {}).length > 0
+        ? agentData.model_benchmarks
+        : MODEL_BENCHMARKS;
+    const key = Object.keys(bm).find(k => modelName.includes(k)) || '';
+    if (bm[key]) {
+        const m = bm[key];
+        // v2 formula: IF-weighted + context bonus. SWE-bench removed due to verification failure.
+        let score = (m.if_score || 70) * 0.85;
+        const ctx = m.context_window || 128;
+        score += ctx >= 1000 ? 15 : ctx >= 256 ? 8 : 4;
+        return Math.round(Math.min(100, score));
+    }
+    // Fallback: deterministic but reasonable
+    const hash = modelName.split('').reduce((a, c) => a + c.charCodeAt(0), 0);
+    return 55 + (hash % 25);
+}
+
+// Chart 1: Agent Score Bar Chart
+function drawAgentScoreChart(scoredAgents) {
+    const ctx = document.getElementById('agentScoreChart')?.getContext('2d');
+    if (!ctx) return;
+    
+    const labels = scoredAgents.map(a => a.name);
+    const data = scoredAgents.map(a => a.score);
+    const bgColors = scoredAgents.map(a => 
+        a.score >= 85 ? '#00ff94' : a.score >= 70 ? '#00d4ff' : a.score >= 55 ? '#a855f7' : '#ff4757'
+    );
+    
+    window._agentScoreChart = new Chart(ctx, {
+        type: 'bar',
+        data: {
+            labels,
+            datasets: [{
+                label: 'Composite Score',
+                data,
+                backgroundColor: bgColors,
+                borderRadius: 6,
+                borderSkipped: false,
+            }]
+        },
+        options: {
+            indexAxis: 'y',
+            responsive: true,
+            maintainAspectRatio: false,
+            plugins: {
+                legend: { display: false },
+                tooltip: {
+                    backgroundColor: '#0f1525',
+                    titleColor: '#e8f1ff',
+                    bodyColor: '#8ba3c0',
+                    borderColor: '#1e2d45',
+                    borderWidth: 1,
+                    callbacks: {
+                        label: (item) => `${item.raw} — ${scoredAgents[item.dataIndex].model.split('/').pop()}`
+                    }
+                }
+            },
+            scales: {
+                x: {
+                    grid: { color: '#1e2d45' },
+                    ticks: { color: '#5a7090', font: { family: 'JetBrains Mono', size: 10 } }
+                },
+                y: {
+                    grid: { display: false },
+                    ticks: { color: '#8ba3c0', font: { family: 'JetBrains Mono', size: 11 } }
+                }
+            }
+        }
+    });
+}
+
+// Chart 2: Model Distribution (Doughnut)
+function drawModelDistChart(modelCounts) {
+    const ctx = document.getElementById('modelDistChart')?.getContext('2d');
+    if (!ctx) return;
+    
+    const entries = Object.entries(modelCounts).filter(([_, c]) => c > 0);
+    const labels = entries.map(([m, _]) => m.split('/').pop());
+    const data = entries.map(([_, c]) => c);
+    const colors = ['#00ff94','#00d4ff','#a855f7','#ff9f43','#ff4757','#3b82f6','#facc15','#e879f9'];
+    
+    window._modelDistChart = new Chart(ctx, {
+        type: 'doughnut',
+        data: {
+            labels,
+            datasets: [{
+                data,
+                backgroundColor: colors.slice(0, entries.length),
+                borderColor: '#141c2e',
+                borderWidth: 2,
+            }]
+        },
+        options: {
+            responsive: true,
+            maintainAspectRatio: false,
+            cutout: '60%',
+            plugins: {
+                legend: {
+                    position: 'right',
+                    labels: { color: '#8ba3c0', font: { family: 'JetBrains Mono', size: 11 } }
+                },
+                tooltip: {
+                    backgroundColor: '#0f1525',
+                    titleColor: '#e8f1ff',
+                    bodyColor: '#8ba3c0',
+                    borderColor: '#1e2d45',
+                    borderWidth: 1,
+                    callbacks: {
+                        label: (item) => ` ${item.label}: ${item.raw} agents (${((item.raw/data.reduce((s,c)=>s+c,0))*100).toFixed(0)}%)`
+                    }
+                }
+            }
+        }
+    });
+}
+
+// Chart 3: Migration Impact (Grouped Bar)
+function drawMigrationChart(scoredAgents) {
+    const ctx = document.getElementById('migrationImpactChart')?.getContext('2d');
+    if (!ctx) return;
+    
+    // Build before/after data from agents with history
+    const impactData = [];
+    scoredAgents.forEach(ag => {
+        if (ag.history.length > 0) {
+            const latest = ag.history[ag.history.length - 1];
+            if (latest.to && latest.from) {
+                const after = ag.score;
+                const before = computeAgentScore(latest.from);
+                impactData.push({
+                    name: ag.name.split('-').map(s => s[0]?.toUpperCase() + s.slice(1)).join('-'),
+                    before, after, 
+                    delta: after - before,
+                    from: latest.from.split('/').pop(),
+                    to: ag.model.split('/').pop()
+                });
+            }
+        }
+    });
+    
+    if (impactData.length === 0) {
+        // No history — show single bars for all agents
+        window._migrationChart = new Chart(ctx, {
+            type: 'bar',
+            data: {
+                labels: scoredAgents.slice(0, 20).map(a => a.name),
+                datasets: [{
+                    label: 'Current Score',
+                    data: scoredAgents.slice(0, 20).map(a => a.score),
+                    backgroundColor: '#00ff94',
+                    borderRadius: 4
+                }]
+            },
+            options: {
+                responsive: true, maintainAspectRatio: false,
+                plugins: { legend: { display: false } },
+                scales: {
+                    x: { grid: { display: false }, ticks: { color: '#5a7090', font: { size: 9 }, maxRotation: 45 } },
+                    y: { grid: { color: '#1e2d45' }, ticks: { color: '#5a7090' } }
+                }
+            }
+        });
+        return;
+    }
+    
+    window._migrationChart = new Chart(ctx, {
+        type: 'bar',
+        data: {
+            labels: impactData.map(d => d.name),
+            datasets: [
+                {
+                    label: 'Before',
+                    data: impactData.map(d => d.before),
+                    backgroundColor: 'rgba(255,71,87,.6)',
+                    borderRadius: 4
+                },
+                {
+                    label: 'After',
+                    data: impactData.map(d => d.after),
+                    backgroundColor: impactData.map(d => d.delta >= 0 ? 'rgba(0,255,148,.6)' : 'rgba(255,71,87,.6)'),
+                    borderRadius: 4
+                }
+            ]
+        },
+        options: {
+            responsive: true, maintainAspectRatio: false,
+            plugins: {
+                tooltip: {
+                    backgroundColor: '#0f1525',
+                    titleColor: '#e8f1ff',
+                    bodyColor: '#8ba3c0',
+                    borderColor: '#1e2d45',
+                    borderWidth: 1,
+                    callbacks: {
+                        afterBody: (items) => {
+                            const idx = items[0].dataIndex;
+                            const d = impactData[idx];
+                            return `Change: ${d.from} → ${d.to}\nDelta: ${d.delta >= 0 ? '+' : ''}${d.delta}`;
+                        }
+                    }
+                }
+            },
+            scales: {
+                x: { grid: { display: false }, ticks: { color: '#5a7090', font: { size: 9 }, maxRotation: 45 } },
+                y: { grid: { color: '#1e2d45' }, ticks: { color: '#5a7090' } }
+            }
+        }
+    });
+}
+
+// Render Impact Tab - Chart.js based
+function renderImpact() {
+    const allAgents = Object.entries(agentData.agents);
+    const modelCounts = {};
+    const scoredAgents = [];
+    
+    // Compute scores for all agents
+    allAgents.forEach(([name, agent]) => {
+        const model = agent.current?.model || 'unknown';
+        modelCounts[model] = (modelCounts[model] || 0) + 1;
+        const score = computeAgentScore(model);
+        scoredAgents.push({ name, model, score, history: agent.history || [] });
+    });
+    
+    // Sort by score descending
+    scoredAgents.sort((a, b) => b.score - a.score);
+    
+    // Stats row
+    const totalAgents = allAgents.length;
+    const avgScore = scoredAgents.length > 0 
+        ? (scoredAgents.reduce((s, a) => s + a.score, 0) / scoredAgents.length).toFixed(1) 
+        : 0;
+    const best = scoredAgents[0] || { name: 'N/A', score: 0 };
+    const worst = scoredAgents[scoredAgents.length - 1] || { name: 'N/A', score: 0 };
+    const changes = allAgents.reduce((sum, [_, a]) => sum + ((a.history || []).length), 0);
+    
+    document.getElementById('impactStats').innerHTML = `
+        <div class="stat-card"><div class="stat-label">Total Agents</div><div class="stat-value grad-cyan">${totalAgents}</div><div class="stat-sub">in system</div></div>
+        <div class="stat-card"><div class="stat-label">Avg Score</div><div class="stat-value grad-green">${avgScore}</div><div class="stat-sub">composite</div></div>
+        <div class="stat-card"><div class="stat-label">Best Model</div><div class="stat-value grad-purple">${best.model.split('/').pop()}</div><div class="stat-sub">score: ${best.score}</div></div>
+        <div class="stat-card"><div class="stat-label">Worst Model</div><div class="stat-value grad-orange">${worst.model.split('/').pop()}</div><div class="stat-sub">score: ${worst.score}</div></div>
+        <div class="stat-card"><div class="stat-label">Changes Made</div><div class="stat-value grad-cyan">${changes}</div><div class="stat-sub">total migrations</div></div>
+    `;
+    
+    // Destroy old charts before creating new ones
+    if (window._agentScoreChart) window._agentScoreChart.destroy();
+    if (window._modelDistChart) window._modelDistChart.destroy();
+    if (window._migrationChart) window._migrationChart.destroy();
+    
+    drawAgentScoreChart(scoredAgents);
+    drawModelDistChart(modelCounts);
+    drawMigrationChart(scoredAgents);
+}
+
+// Filter Agents
+function runSync() {
+    const btn = document.querySelector('#impactSyncNote button');
+    if (btn) btn.textContent = '⏳ Running...';
+    setTimeout(() => {
+        location.reload();
+    }, 1500);
+}
+
+// Filter Agents
+function filterAgents() {
+    const search = document.getElementById('agentSearch').value.toLowerCase();
+    const cards = document.querySelectorAll('.agent-card');
+    cards.forEach(card => {
+        const text = card.textContent.toLowerCase();
+        card.style.display = text.includes(search) ? '' : 'none';
+    });
+}
+
+function filterCategory(category, btn) {
+    document.querySelectorAll('.filter-btn').forEach(btn => btn.classList.remove('active'));
+    btn.classList.add('active');
+    
+    if (category === 'all') {
+        document.querySelectorAll('.agent-card').forEach(card => card.style.display = '');
+    } else {
+        document.querySelectorAll('.category-section').forEach(section => {
+            const title = section.querySelector('.category-title')?.textContent;
+            section.style.display = title === category ? '' : 'none';
+        });
+    }
+}
+
+// Export
+function exportRecommendations() {
+    let recs = [];
+    Object.entries(agentData.agents).forEach(([name, agent]) => {
+        if (agent.current.recommendations && agent.current.recommendations.length > 0) {
+            agent.current.recommendations.forEach(rec => {
+                recs.push({
+                    agent: name,
+                    current_model: agent.current.model,
+                    recommended_model: rec.target,
+                    impact: rec.priority || 'medium',
+                    score_before: rec.score_before || 0,
+                    score_after: rec.score_after || 0,
+                    score_delta: rec.score_delta || 0,
+                    rationale: rec.reason || ''
+                });
+            });
+        }
+    });
+
+    const output = {
+        timestamp: new Date().toISOString(),
+        total_recommendations: recs.length,
+        recommendations: recs
+    };
+
+    document.getElementById('exportContent').textContent = JSON.stringify(output, null, 2);
+    document.getElementById('exportModal').classList.add('show');
+}
+
+function copyToClipboard() {
+    const text = document.getElementById('exportContent').textContent;
+    navigator.clipboard.writeText(text);
+    alert('Copied to clipboard!');
+}
+
+function downloadJSON() {
+    const text = document.getElementById('exportContent').textContent;
+    const blob = new Blob([text], { type: 'application/json' });
+    const url = URL.createObjectURL(blob);
+    const a = document.createElement('a');
+    a.href = url;
+    a.download = 'agent-recommendations.json';
+    a.click();
+    URL.revokeObjectURL(url);
+}
+
+function closeModal() {
+    document.getElementById('exportModal').classList.remove('show');
+}
+
+// Apply Fixes Modal
+function showApplyModal() {
+    const recs = [];
+    Object.entries(agentData.agents).forEach(([name, agent]) => {
+        if (agent.current.recommendations && agent.current.recommendations.length > 0) {
+            agent.current.recommendations.forEach(rec => {
+                recs.push({
+                    agent: name,
+                    current_model: agent.current.model,
+                    recommended_model: rec.target,
+                    impact: rec.priority || 'medium',
+                    score_before: rec.score_before || 0,
+                    score_after: rec.score_after || 0,
+                    score_delta: rec.score_delta || 0,
+                    rationale: rec.reason || ''
+                });
+            });
+        }
+    });
+    
+    const checklist = document.getElementById('applyChecklist');
+    
+    checklist.innerHTML = recs.map((r, idx) => {
+        const fromModel = r.current_model || '';
+        const toModel = r.recommended_model || '';
+        const fromShort = fromModel.split('/').pop() || fromModel;
+        const toShort = toModel.split('/').pop() || toModel;
+        const impact = (r.impact || 'low').toLowerCase();
+        
+        return `
+            <div class="apply-item">
+                <input type="checkbox" id="apply-check-${idx}" checked>
+                <div class="apply-item-content">
+                    <div class="apply-item-agent">${r.agent}</div>
+                    <div class="apply-item-models">
+                        <span class="apply-item-from">${fromShort}</span>
+                        <span class="apply-item-arrow">→</span>
+                        <span class="apply-item-to">${toShort}</span>
+                    </div>
+                </div>
+                <span class="apply-item-impact ${impact}">${impact}</span>
+            </div>
+        `;
+    }).join('');
+    
+    document.getElementById('applyModal').classList.add('show');
+}
+
+function closeApplyModal() {
+    document.getElementById('applyModal').classList.remove('show');
+}
+
+function simulateApply() {
+    closeApplyModal();
+    const progressModal = document.getElementById('progressModal');
+    const progressBar = document.getElementById('progressBar');
+    const progressStatus = document.getElementById('progressStatus');
+    const progressResult = document.getElementById('progressResult');
+    const progressResultText = document.getElementById('progressResultText');
+    
+    progressModal.classList.add('show');
+    progressResult.classList.remove('show');
+    progressBar.style.width = '0%';
+    progressStatus.textContent = 'Preparing...';
+    
+    const steps = [
+        'Updating capability-index.yaml...',
+        'Updating agent definitions...',
+        'Syncing history...',
+        'Done!'
+    ];
+    
+    let progress = 0;
+    let stepIndex = 0;
+    const totalSteps = steps.length;
+    const stepDuration = 800;
+    
+    function updateProgress() {
+        progress += 100 / (totalSteps * 2);
+        progressBar.style.width = Math.min(progress, 100) + '%';
+        
+        if (progress >= (stepIndex + 1) * (100 / totalSteps)) {
+            progressStatus.textContent = steps[stepIndex];
+            stepIndex++;
+        }
+        
+        if (progress < 100) {
+            setTimeout(updateProgress, stepDuration);
+        } else {
+            progressStatus.textContent = 'Complete!';
+            progressResult.classList.add('show');
+            
+            const recs = Object.values(agentData.agents || {}).filter(a => (a.current?.recommendations || []).length > 0);
+            progressResultText.textContent = `✅ ${recs.length} recommendations applied. Run 'bun run sync:evolution' to update dashboard.`;
+        }
+    }
+    
+    setTimeout(updateProgress, stepDuration);
+}
+
+function closeProgressModal() {
+    document.getElementById('progressModal').classList.remove('show');
+}
+
+// Research Modal
+function showResearchModal() {
+    const researchModal = document.getElementById('researchModal');
+    const researchSteps = document.getElementById('researchSteps');
+    const researchSummary = document.getElementById('researchSummary');
+    const steps = researchSteps.querySelectorAll('.research-step');
+    
+    researchSummary.classList.remove('show');
+    steps.forEach(step => {
+        step.classList.remove('active', 'done');
+    });
+    
+    researchModal.classList.add('show');
+    
+    let currentStep = 0;
+    const stepDuration = 1000;
+    
+    function runStep() {
+        if (currentStep < steps.length) {
+            steps.forEach((step, idx) => {
+                if (idx < currentStep) {
+                    step.classList.add('done');
+                    step.classList.remove('active');
+                } else if (idx === currentStep) {
+                    step.classList.add('active');
+                    step.classList.remove('done');
+                } else {
+                    step.classList.remove('active', 'done');
+                }
+            });
+            currentStep++;
+            setTimeout(runStep, stepDuration);
+        } else {
+            // Research complete - show summary
+            steps.forEach(step => {
+                step.classList.remove('active');
+                step.classList.add('done');
+            });
+            
+            const recs = Object.values(agentData.agents || {}).filter(a => (a.current?.recommendations || []).length > 0);
+            const modelsCount = new Set(recs.flatMap(a => [a.current?.model, a.current?.recommendations?.[0]?.target])).size;
+            const recsCount = recs.filter(a => (a.current?.recommendations?.[0]?.score_delta || 0) > 0).length;
+
+            document.getElementById('researchSummaryText').textContent =
+                `${modelsCount} models evaluated. ${recsCount} recommendations found. ${recs.length - recsCount} idle models detected.`;
+            researchSummary.classList.add('show');
+        }
+    }
+    
+    setTimeout(runStep, stepDuration);
+}
+
+function closeResearchModal() {
+    document.getElementById('researchModal').classList.remove('show');
+}
+
+// Tab switching
+function switchTab(tabId, el) {
+    document.querySelectorAll('.tab-btn').forEach(btn => btn.classList.remove('active'));
+    document.querySelectorAll('.tab-panel').forEach(panel => panel.classList.remove('active'));
+
+    (el || document.querySelector(`button[onclick*="switchTab('${tabId}')"]`)).classList.add('active');
+    document.getElementById('tab-' + tabId).classList.add('active');
+}
+
+// Initialize on load
+init();
+</script>
+</body>
+</html>
\ No newline at end of file
diff --git a/agent-evolution/archive/tests/screenshot-dash.cjs b/agent-evolution/archive/tests/screenshot-dash.cjs
new file mode 100644
index 0000000..b9b5e3f
--- /dev/null
+++ b/agent-evolution/archive/tests/screenshot-dash.cjs
@@ -0,0 +1,11 @@
+const { chromium } = require('playwright');
+const fs = require('fs');
+(async () => {
+  const browser = await chromium.launch({ headless: true, args: ['--no-sandbox'] });
+  const page = await browser.newPage({ viewport: { width: 1280, height: 720 } });
+  await page.goto('http://host.docker.internal:3003', { waitUntil: 'domcontentloaded', timeout: 30000 });
+  await page.waitForTimeout(2000);
+  await page.screenshot({ path: '/app/tests/visual/current/dashboard_landing.png', fullPage: false });
+  await browser.close();
+  console.log('Screenshot saved to /app/tests/visual/current/dashboard_landing.png');
+})();
diff --git a/agent-evolution/data/real-fit-report.json b/agent-evolution/data/real-fit-report.json
index f57d4ae..10fd951 100644
--- a/agent-evolution/data/real-fit-report.json
+++ b/agent-evolution/data/real-fit-report.json
@@ -1,689 +1,768 @@
 {
-  "generated": "2026-05-27T18:36:13.173821+00:00",
+  "generated": "2026-05-28T10:48:02.581965+00:00",
   "source": "real-fit-engine",
-  "total_evaluations": 102,
+  "total_evaluations": 147,
   "agents": {
     "agent-architect": {
       "name": "agent-architect",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 48.3,
+        "glm-5.1": 48.3,
+        "kimi-k2.6": 53.5,
+        "qwen3-coder:480b": 48.3
       },
       "info": [
         "Creates, modifies, and reviews new agents, workflows, and skills based on capability gap analysis. Tier 2 meta-agent with self-cascade enabled.",
         "meta",
         "ollama-cloud/kimi-k2.6"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "kimi-k2.6",
+      "best_score": 53.5
     },
     "architect-indexer": {
       "name": "architect-indexer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 43.2,
+        "glm-5.1": 48.6,
+        "kimi-k2.6": 46.5,
+        "qwen3-coder:480b": 54.0
       },
       "info": [
         "Indexes and maps project codebase architecture into .architect/ directory. Creates and maintains structured documentation of entities, APIs, DB schema, file graphs, and conventions. (GNS-2 Tier 0)",
         "core",
         "ollama-cloud/glm-5.1"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "qwen3-coder:480b",
+      "best_score": 54.0
     },
     "backend-developer": {
       "name": "backend-developer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 53.5,
+        "glm-5.1": 48.3,
+        "kimi-k2.6": 48.3,
+        "qwen3-coder:480b": 43.2
       },
       "info": [
         "Backend specialist for Node.js, Express, APIs, and database integration (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/qwen3-coder:480b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "deepseek-v4-pro",
+      "best_score": 53.5
     },
     "browser-automation": {
       "name": "browser-automation",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 42.8,
+        "glm-5.1": 53.3,
+        "kimi-k2.6": 63.8,
+        "qwen3-coder:480b": 48.9
       },
       "info": [
         "Browser automation agent using Playwright MCP for E2E testing, form filling, navigation, and web interaction (GNS-2 Tier 0)",
         "testing",
         "ollama-cloud/deepseek-v4-flash"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "kimi-k2.6",
+      "best_score": 63.8
     },
     "capability-analyst": {
       "name": "capability-analyst",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 58.7,
+        "glm-5.1": 53.5,
+        "kimi-k2.6": 58.7,
+        "qwen3-coder:480b": 52.3
       },
       "info": [
         "Analyzes task requirements against available agents, workflows, and skills. Identifies gaps and recommends new components. Tier 2 meta-agent with self-cascade enabled.",
         "meta",
         "ollama-cloud/deepseek-v4-pro-max"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "deepseek-v4-pro",
+      "best_score": 58.7
     },
     "code-skeptic": {
       "name": "code-skeptic",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 22.8,
+        "glm-5.1": 89.1,
+        "kimi-k2.6": 91.2,
+        "minimax-m2.5": 45.0,
+        "qwen3-coder:480b": 90.6
       },
       "info": [
         "Adversarial code reviewer. Finds problems and issues. Does NOT suggest implementations (GNS-2 Tier 0)",
         "quality",
         "ollama-cloud/minimax-m2.5"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "kimi-k2.6",
+      "best_score": 91.2
     },
     "devops-engineer": {
       "name": "devops-engineer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 29.7,
+        "glm-5.1": 96.2,
+        "kimi-k2.6": 87.2,
+        "qwen3-coder:480b": 87.2
       },
       "info": [
         "DevOps specialist for Docker, Kubernetes, CI/CD pipeline automation, and infrastructure management (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/kimi-k2.6"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "glm-5.1",
+      "best_score": 96.2
     },
     "evaluator": {
       "name": "evaluator",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 50.6,
+        "glm-5.1": 58.7,
+        "kimi-k2.6": 53.5,
+        "qwen3-coder:480b": 43.8
       },
       "info": [
         "Scores agent effectiveness after task completion for continuous improvement. Tier 2 meta-agent with self-cascade enabled.",
         "meta",
         "ollama-cloud/qwen3.5-122b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "glm-5.1",
+      "best_score": 58.7
+    },
+    "evolution-prompt": {
+      "name": "evolution-prompt",
+      "evaluations": {
+        "deepseek-v4-pro": 52.6,
+        "glm-5.1": 44.7,
+        "kimi-k2.6": 53.5,
+        "qwen3-coder:480b": 21.3
+      },
+      "info": [
+        "Generates role-specific stress-test prompts by analyzing agent definitions",
+        "meta",
+        "ollama-cloud/deepseek-v4-pro-max"
+      ],
+      "best_model": "kimi-k2.6",
+      "best_score": 53.5
+    },
+    "evolution-skeptic": {
+      "name": "evolution-skeptic",
+      "evaluations": {
+        "deepseek-v4-pro": 33.1,
+        "glm-5.1": 31.6,
+        "kimi-k2.6": 37.3,
+        "qwen3-coder:480b": 42.9
+      },
+      "info": [
+        "Evaluates model responses against role-specific rubrics with detailed scoring and commentary",
+        "meta",
+        "ollama-cloud/deepseek-v4-pro-max"
+      ],
+      "best_model": "qwen3-coder:480b",
+      "best_score": 42.9
     },
     "flutter-developer": {
       "name": "flutter-developer",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 34.5,
+        "glm-5.1": 54.9,
+        "kimi-k2.6": 49.3,
+        "qwen3-coder:480b": 54.9
       },
       "info": [
         "Flutter mobile specialist for cross-platform apps, state management, and UI components (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/qwen3-coder:480b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "glm-5.1",
+      "best_score": 54.9
     },
     "frontend-developer": {
       "name": "frontend-developer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 31.6,
+        "glm-5.1": 53.2,
+        "kimi-k2.6": 38.8,
+        "qwen3-coder:480b": 56.0
       },
       "info": [
         "Handles UI implementation with multimodal capabilities. Accepts visual references like screenshots and mockups (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/minimax-m2.5"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "qwen3-coder:480b",
+      "best_score": 56.0
     },
     "go-developer": {
       "name": "go-developer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 41.4,
+        "glm-5.1": 53.5,
+        "kimi-k2.6": 48.3,
+        "qwen3-coder:480b": 58.7
       },
       "info": [
         "Go backend specialist for Gin, Echo, APIs, and database integration (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/deepseek-v4-pro-max"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "qwen3-coder:480b",
+      "best_score": 58.7
     },
     "history-miner": {
       "name": "history-miner",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 30.1,
+        "glm-5.1": 44.3,
+        "kimi-k2.6": 46.9,
+        "qwen3-coder:480b": 44.8
       },
       "info": [
         "Analyzes git history to find duplicates and past solutions, preventing regression and duplicate work (GNS-2 Tier 0)",
         "core",
         "ollama-cloud/qwen3.5-122b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "kimi-k2.6",
+      "best_score": 46.9
     },
     "incident-responder": {
       "name": "incident-responder",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 48.6,
+        "glm-5.1": 65.6,
+        "kimi-k2.6": 59.1,
+        "qwen3-coder:480b": 56.4
       },
       "info": [
         "Server incident response and system hardening specialist. Handles live forensics, malware removal, persistence hunting, SSH-based server cleanup, and post-incident hardening. Works with any OS and panel.",
         "core",
         "ollama-cloud/kimi-k2.6"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "glm-5.1",
+      "best_score": 65.6
     },
     "lead-developer": {
       "name": "lead-developer",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 28.7,
+        "glm-5.1": 68.8,
+        "kimi-k2.6": 72.5,
+        "qwen3-coder:480b": 72.5
       },
       "info": [
         "Primary code writer for backend and core logic. Writes implementation to pass tests (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/qwen3-coder:480b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "kimi-k2.6",
+      "best_score": 72.5
     },
     "markdown-validator": {
       "name": "markdown-validator",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 39.0,
+        "glm-5.1": 37.2,
+        "kimi-k2.6": 24.0,
+        "qwen3-coder:480b": 47.4
       },
       "info": [
         "Validates and corrects Markdown descriptions for Gitea issues (GNS-2 Tier 0)",
         "meta",
         "ollama-cloud/nemotron-3-nano"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "qwen3-coder:480b",
+      "best_score": 47.4
     },
     "memory-manager": {
       "name": "memory-manager",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 35.8,
+        "glm-5.1": 48.3,
+        "kimi-k2.6": 41.5,
+        "qwen3-coder:480b": 46.8
       },
       "info": [
         "Manages agent memory systems - short-term (context), long-term (vector store), and episodic (experiences) (GNS-2 Tier 0)",
         "cognitive",
         "ollama-cloud/deepseek-v4-pro-max"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "glm-5.1",
+      "best_score": 48.3
     },
     "orchestrator": {
       "name": "orchestrator",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-flash": 27.0,
+        "deepseek-v4-pro": 19.6,
+        "glm-5.1": 36.2,
+        "kimi-k2.6": 40.0,
+        "minimax-m2.5": 36.3,
+        "qwen3-coder:480b": 39.1
       },
       "info": [
         "Main dispatcher. Routes tasks between agents based on Issue status and manages the workflow state machine. IF:90 for optimal routing accuracy. (GNS-2 Tier 1)",
         "meta",
         "ollama-cloud/kimi-k2.6"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "kimi-k2.6",
+      "best_score": 40.0
     },
     "performance-engineer": {
       "name": "performance-engineer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 27.9,
+        "glm-5.1": 63.8,
+        "kimi-k2.6": 34.3,
+        "qwen3-coder:480b": 36.3
       },
       "info": [
         "Reviews code for performance issues. Focuses on efficiency, N+1 queries, memory leaks, and algorithmic complexity (GNS-2 Tier 0)",
         "quality",
         "ollama-cloud/deepseek-v4-pro-max"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "glm-5.1",
+      "best_score": 63.8
     },
     "php-developer": {
       "name": "php-developer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 53.5,
+        "glm-5.1": 48.3,
+        "kimi-k2.6": 48.3,
+        "qwen3-coder:480b": 48.3
       },
       "info": [
         "PHP backend specialist for Laravel, Symfony, WordPress, and full-stack web applications (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/qwen3-coder:480b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "deepseek-v4-pro",
+      "best_score": 53.5
     },
     "pipeline-judge": {
       "name": "pipeline-judge",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 34.6,
+        "glm-5.1": 45.6,
+        "kimi-k2.6": 46.5,
+        "qwen3-coder:480b": 52.9
       },
       "info": [
         "Automated pipeline judge. Evaluates workflow execution by running tests, measuring token cost and wall-clock time. Produces objective fitness scores. Never writes code - only measures and scores. (GNS-2 Tier 0)",
         "meta",
         "ollama-cloud/kimi-k2.6"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "qwen3-coder:480b",
+      "best_score": 52.9
     },
     "planner": {
       "name": "planner",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 41.7,
+        "glm-5.1": 31.8,
+        "kimi-k2.6": 34.6,
+        "qwen3-coder:480b": 33.7
       },
       "info": [
         "Advanced task planner using Chain of Thought, Tree of Thoughts, and Plan-Execute-Reflect (GNS-2 Tier 0)",
         "cognitive",
         "ollama-cloud/deepseek-v4-pro-max"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "deepseek-v4-pro",
+      "best_score": 41.7
     },
     "product-owner": {
       "name": "product-owner",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 27.0,
+        "glm-5.1": 33.4,
+        "kimi-k2.6": 34.6,
+        "qwen3-coder:480b": 27.0
       },
       "info": [
         "Manages issue checklists, status labels, tracks progress and coordinates with human users (GNS-2 Tier 1)",
         "meta",
         "ollama-cloud/glm-5.1"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "kimi-k2.6",
+      "best_score": 34.6
     },
     "prompt-optimizer": {
       "name": "prompt-optimizer",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 27.0,
+        "glm-5.1": 48.3,
+        "kimi-k2.6": 33.0,
+        "qwen3-coder:480b": 31.8
       },
       "info": [
         "Improves agent system prompts based on performance failures. Meta-learner for prompt optimization (GNS-2 Tier 1)",
         "meta",
         "ollama-cloud/qwen3.5-122b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "glm-5.1",
+      "best_score": 48.3
     },
     "python-developer": {
       "name": "python-developer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 48.3,
+        "glm-5.1": 48.3,
+        "kimi-k2.6": 48.3,
+        "qwen3-coder:480b": 48.3
       },
       "info": [
         "Python backend specialist for Django, FastAPI, data science, and API development (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/qwen3-coder:480b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "deepseek-v4-pro",
+      "best_score": 48.3
     },
     "reflector": {
       "name": "reflector",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 43.2,
+        "glm-5.1": 53.5,
+        "kimi-k2.6": 58.7,
+        "qwen3-coder:480b": 20.9
       },
       "info": [
         "Self-reflection agent using Reflexion pattern - learns from mistakes (GNS-2 Tier 0)",
         "cognitive",
         "ollama-cloud/deepseek-v4-pro-max"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "kimi-k2.6",
+      "best_score": 58.7
     },
     "release-manager": {
       "name": "release-manager",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 23.7,
+        "glm-5.1": 38.0,
+        "kimi-k2.6": 50.2,
+        "qwen3-coder:480b": 41.7
       },
       "info": [
         "Manages git operations, semantic versioning, branching, and deployments. Ensures clean history (GNS-2 Tier 1)",
         "meta",
         "ollama-cloud/kimi-k2.6"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "kimi-k2.6",
+      "best_score": 50.2
     },
     "requirement-refiner": {
       "name": "requirement-refiner",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 30.3,
+        "glm-5.1": 31.0,
+        "kimi-k2.6": 31.2,
+        "qwen3-coder:480b": 45.3
       },
       "info": [
         "Converts vague ideas and bug reports into strict User Stories with acceptance criteria checklists (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/kimi-k2-thinking"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "qwen3-coder:480b",
+      "best_score": 45.3
     },
     "sdet-engineer": {
       "name": "sdet-engineer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 58.7,
+        "glm-5.1": 86.0,
+        "kimi-k2.6": 97.0,
+        "qwen3-coder:480b": 97.0
       },
       "info": [
         "Writes tests following TDD methodology. Tests MUST fail initially (Red phase) (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/qwen3-coder:480b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "kimi-k2.6",
+      "best_score": 97.0
     },
     "security-auditor": {
       "name": "security-auditor",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 46.4,
+        "glm-5.1": 58.7,
+        "kimi-k2.6": 63.8,
+        "qwen3-coder:480b": 41.5
       },
       "info": [
         "Scans for security vulnerabilities, OWASP Top 10, dependency CVEs, and hardcoded secrets (GNS-2 Tier 0)",
         "quality",
         "ollama-cloud/deepseek-v4-pro-max"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "kimi-k2.6",
+      "best_score": 63.8
     },
     "system-analyst": {
       "name": "system-analyst",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 56.4,
+        "glm-5.1": 87.0,
+        "kimi-k2.6": 92.0,
+        "qwen3-coder:480b": 77.0
       },
       "info": [
         "Designs technical specifications, data schemas, and API contracts before implementation (GNS-2 Tier 1)",
         "core",
         "ollama-cloud/deepseek-v4-pro-max"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "kimi-k2.6",
+      "best_score": 92.0
     },
     "the-fixer": {
       "name": "the-fixer",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 43.6,
+        "glm-5.1": 46.6,
+        "kimi-k2.6": 36.4,
+        "qwen3-coder:480b": 42.9
       },
       "info": [
         "Iteratively fixes bugs based on specific error reports and test failures (GNS-2 Tier 1)",
         "quality",
         "ollama-cloud/kimi-k2.6"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "glm-5.1",
+      "best_score": 46.6
     },
     "visual-tester": {
       "name": "visual-tester",
       "evaluations": {
-        "deepseek-v4-pro-max": 50.0,
-        "kimi-k2.6": 50.0,
-        "qwen3-coder:480b": 50.0
+        "deepseek-v4-pro": 47.3,
+        "glm-5.1": 58.7,
+        "kimi-k2.6": 53.5,
+        "qwen3-coder:480b": 53.5
       },
       "info": [
         "Visual regression testing agent that compares screenshots and detects UI differences using pixelmatch and image diff (GNS-2 Tier 0)",
         "quality",
         "ollama-cloud/qwen3-coder:480b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 50.0
+      "best_model": "glm-5.1",
+      "best_score": 58.7
     },
     "workflow-architect": {
       "name": "workflow-architect",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 36.3,
+        "glm-5.1": 48.3,
+        "kimi-k2.6": 48.3,
+        "qwen3-coder:480b": 36.3
       },
       "info": [
         "Creates and maintains workflow definitions with complete architecture, Gitea integration, and quality gates (GNS-2 Tier 1)",
         "meta",
         "ollama-cloud/qwen3.5-122b"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "glm-5.1",
+      "best_score": 48.3
     },
     "workflow-cross-checker": {
       "name": "workflow-cross-checker",
       "evaluations": {
-        "deepseek-v4-pro-max": 41.6,
-        "kimi-k2.6": 41.6,
-        "qwen3-coder:480b": 41.6
+        "deepseek-v4-pro": 54.2,
+        "glm-5.1": 63.3,
+        "kimi-k2.6": 52.1,
+        "qwen3-coder:480b": 65.6
       },
       "info": [
         "Workflow cross-checker and process inspector. Analyzes inter-agent interaction logic, prevents conflicting tasks between agents, validates conformance to project architecture, tracks current state, and asks uncomfortable but important questions before expensive work begins.",
         "meta",
         "ollama-cloud/kimi-k2.6"
       ],
-      "best_model": "deepseek-v4-pro-max",
-      "best_score": 41.6
+      "best_model": "qwen3-coder:480b",
+      "best_score": 65.6
     }
   },
   "fit_scores": {
     "agent-architect": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for agent-architect is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 53.5,
+      "explanation": "Best model for agent-architect is kimi-k2.6 with avg score 53.5. Strongest dimension: code_presence."
     },
     "architect-indexer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for architect-indexer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "qwen3-coder:480b",
+      "fit": 54.0,
+      "explanation": "Best model for architect-indexer is qwen3-coder:480b with avg score 54.0. Strongest dimension: code_presence."
     },
     "backend-developer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for backend-developer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "deepseek-v4-pro",
+      "fit": 53.5,
+      "explanation": "Best model for backend-developer is deepseek-v4-pro with avg score 53.5. Strongest dimension: code_presence."
     },
     "browser-automation": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for browser-automation is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 63.8,
+      "explanation": "Best model for browser-automation is kimi-k2.6 with avg score 63.8. Strongest dimension: code_presence."
     },
     "capability-analyst": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for capability-analyst is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "deepseek-v4-pro",
+      "fit": 58.7,
+      "explanation": "Best model for capability-analyst is deepseek-v4-pro with avg score 58.7. Strongest dimension: code_presence."
     },
     "code-skeptic": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for code-skeptic is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 91.2,
+      "explanation": "Best model for code-skeptic is kimi-k2.6 with avg score 91.2. Strongest dimension: code_presence."
     },
     "devops-engineer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for devops-engineer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 96.2,
+      "explanation": "Best model for devops-engineer is glm-5.1 with avg score 96.2. Strongest dimension: keyword_coverage."
     },
     "evaluator": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for evaluator is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 58.7,
+      "explanation": "Best model for evaluator is glm-5.1 with avg score 58.7. Strongest dimension: code_presence."
+    },
+    "evolution-prompt": {
+      "model": "kimi-k2.6",
+      "fit": 53.5,
+      "explanation": "Best model for evolution-prompt is kimi-k2.6 with avg score 53.5. Strongest dimension: code_presence."
+    },
+    "evolution-skeptic": {
+      "model": "qwen3-coder:480b",
+      "fit": 42.9,
+      "explanation": "Best model for evolution-skeptic is qwen3-coder:480b with avg score 42.9. Strongest dimension: structure."
     },
     "flutter-developer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for flutter-developer is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 54.9,
+      "explanation": "Best model for flutter-developer is glm-5.1 with avg score 54.9. Strongest dimension: code_presence."
     },
     "frontend-developer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for frontend-developer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "qwen3-coder:480b",
+      "fit": 56.0,
+      "explanation": "Best model for frontend-developer is qwen3-coder:480b with avg score 56.0. Strongest dimension: code_presence."
     },
     "go-developer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for go-developer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "qwen3-coder:480b",
+      "fit": 58.7,
+      "explanation": "Best model for go-developer is qwen3-coder:480b with avg score 58.7. Strongest dimension: code_presence."
     },
     "history-miner": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for history-miner is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 46.9,
+      "explanation": "Best model for history-miner is kimi-k2.6 with avg score 46.9. Strongest dimension: code_presence."
     },
     "incident-responder": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for incident-responder is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 65.6,
+      "explanation": "Best model for incident-responder is glm-5.1 with avg score 65.6. Strongest dimension: code_presence."
     },
     "lead-developer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for lead-developer is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: code_presence."
+      "model": "kimi-k2.6",
+      "fit": 72.5,
+      "explanation": "Best model for lead-developer is kimi-k2.6 with avg score 72.5. Strongest dimension: keyword_coverage."
     },
     "markdown-validator": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for markdown-validator is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "qwen3-coder:480b",
+      "fit": 47.4,
+      "explanation": "Best model for markdown-validator is qwen3-coder:480b with avg score 47.4. Strongest dimension: code_presence."
     },
     "memory-manager": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for memory-manager is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 48.3,
+      "explanation": "Best model for memory-manager is glm-5.1 with avg score 48.3. Strongest dimension: code_presence."
     },
     "orchestrator": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for orchestrator is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 40.0,
+      "explanation": "Best model for orchestrator is kimi-k2.6 with avg score 40.0. Strongest dimension: code_presence."
     },
     "performance-engineer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for performance-engineer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 63.8,
+      "explanation": "Best model for performance-engineer is glm-5.1 with avg score 63.8. Strongest dimension: code_presence."
     },
     "php-developer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for php-developer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "deepseek-v4-pro",
+      "fit": 53.5,
+      "explanation": "Best model for php-developer is deepseek-v4-pro with avg score 53.5. Strongest dimension: code_presence."
     },
     "pipeline-judge": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for pipeline-judge is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "qwen3-coder:480b",
+      "fit": 52.9,
+      "explanation": "Best model for pipeline-judge is qwen3-coder:480b with avg score 52.9. Strongest dimension: code_presence."
     },
     "planner": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for planner is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "deepseek-v4-pro",
+      "fit": 41.7,
+      "explanation": "Best model for planner is deepseek-v4-pro with avg score 41.7. Strongest dimension: code_presence."
     },
     "product-owner": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for product-owner is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 34.6,
+      "explanation": "Best model for product-owner is kimi-k2.6 with avg score 34.6. Strongest dimension: actionability."
     },
     "prompt-optimizer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for prompt-optimizer is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 48.3,
+      "explanation": "Best model for prompt-optimizer is glm-5.1 with avg score 48.3. Strongest dimension: code_presence."
     },
     "python-developer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for python-developer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "deepseek-v4-pro",
+      "fit": 48.3,
+      "explanation": "Best model for python-developer is deepseek-v4-pro with avg score 48.3. Strongest dimension: code_presence."
     },
     "reflector": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for reflector is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 58.7,
+      "explanation": "Best model for reflector is kimi-k2.6 with avg score 58.7. Strongest dimension: code_presence."
     },
     "release-manager": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for release-manager is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 50.2,
+      "explanation": "Best model for release-manager is kimi-k2.6 with avg score 50.2. Strongest dimension: code_presence."
     },
     "requirement-refiner": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for requirement-refiner is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "qwen3-coder:480b",
+      "fit": 45.3,
+      "explanation": "Best model for requirement-refiner is qwen3-coder:480b with avg score 45.3. Strongest dimension: code_presence."
     },
     "sdet-engineer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for sdet-engineer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 97.0,
+      "explanation": "Best model for sdet-engineer is kimi-k2.6 with avg score 97.0. Strongest dimension: keyword_coverage."
     },
     "security-auditor": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for security-auditor is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 63.8,
+      "explanation": "Best model for security-auditor is kimi-k2.6 with avg score 63.8. Strongest dimension: code_presence."
     },
     "system-analyst": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for system-analyst is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "kimi-k2.6",
+      "fit": 92.0,
+      "explanation": "Best model for system-analyst is kimi-k2.6 with avg score 92.0. Strongest dimension: keyword_coverage."
     },
     "the-fixer": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for the-fixer is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 46.6,
+      "explanation": "Best model for the-fixer is glm-5.1 with avg score 46.6. Strongest dimension: code_presence."
     },
     "visual-tester": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 50.0,
-      "explanation": "Best model for visual-tester is deepseek-v4-pro-max with avg score 50.0. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 58.7,
+      "explanation": "Best model for visual-tester is glm-5.1 with avg score 58.7. Strongest dimension: code_presence."
     },
     "workflow-architect": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for workflow-architect is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "glm-5.1",
+      "fit": 48.3,
+      "explanation": "Best model for workflow-architect is glm-5.1 with avg score 48.3. Strongest dimension: code_presence."
     },
     "workflow-cross-checker": {
-      "model": "deepseek-v4-pro-max",
-      "fit": 41.6,
-      "explanation": "Best model for workflow-cross-checker is deepseek-v4-pro-max with avg score 41.6. Strongest dimension: keyword_coverage."
+      "model": "qwen3-coder:480b",
+      "fit": 65.6,
+      "explanation": "Best model for workflow-cross-checker is qwen3-coder:480b with avg score 65.6. Strongest dimension: code_presence."
     }
   }
 }
\ No newline at end of file
diff --git a/agent-evolution/docker-compose.yml b/agent-evolution/docker-compose.yml
index 9a0ed74..aaac6c2 100644
--- a/agent-evolution/docker-compose.yml
+++ b/agent-evolution/docker-compose.yml
@@ -1,28 +1,27 @@
-# Docker Compose for Agent Evolution Dashboard (mount-driven, no-rebuild)
+# Docker Compose for Agent Evolution Dashboard + Research API (mount-driven, no-rebuild)
 # Usage:
 #   docker compose -f agent-evolution/docker-compose.yml up -d
-#   # Edit any file in agent-evolution/ or .kilo/ on host → instant reflection
-#   # Just run:
-#     bun run sync:evolution
-#   # and reload the page
+#   # Edit any file on host → instant reflection in containers
+#   # Dashboard: http://localhost:3003
+#   # API:      http://localhost:3004
 #
-version: '3.8'
-
 services:
   evolution-dashboard:
-    build:
-      context: .
-      dockerfile: Dockerfile
+    image: python:3.12-alpine
     container_name: apaw-evolution
     ports:
       - "3003:80"
     volumes:
       # Mount the generated standalone HTML to the container's web root
       - ./index.standalone.html:/app/index.html:ro
+      # Mount real-fit standalone report
+      - ./real-fit.html:/app/real-fit.html:ro
       # Mount data directory for any additional assets
       - ./data:/app/data:ro
       # Mount .kilo directory for live config access
       - ../.kilo:/app/kilo:ro
+    working_dir: /app
+    command: ["python3", "-m", "http.server", "80"]
     environment:
       - NODE_ENV=production
       - TZ=UTC
@@ -39,6 +38,47 @@ services:
       - "com.apaw.service=evolution-dashboard"
       - "com.apaw.description=Agent Evolution Dashboard"
 
+  evolution-api:
+    image: python:3.12-alpine
+    container_name: apaw-evolution-api
+    ports:
+      - "3004:8000"
+    volumes:
+      # API source code
+      - ./api.py:/app/api.py:ro
+      - ./requirements.txt:/app/requirements.txt:ro
+      # Data directory (read-write for job state and reports)
+      - ./data:/app/data:rw
+      # real-fit-engine.py script
+      - ../scripts/real-fit-engine.py:/app/scripts/real-fit-engine.py:ro
+      # Agent definitions and metadata
+      - ../.kilo/agents:/app/agents:ro
+      - ../kilo-meta.json:/app/kilo-meta.json:ro
+    working_dir: /app
+    command: >
+      sh -c "pip install --no-cache-dir -r requirements.txt && uvicorn api:app --host 0.0.0.0 --port 8000"
+    environment:
+      - TZ=UTC
+      - PYTHONUNBUFFERED=1
+      - JOB_STATE_PATH=/app/data/research-jobs.json
+      - REPORT_PATH=/app/data/real-fit-report.json
+      - META_PATH=/app/kilo-meta.json
+      - EVOLUTION_PATH=/app/data/evolution.json
+      - ENGINE_PATH=/app/scripts/real-fit-engine.py
+      - REAL_FIT_DB=/app/data/real-fit.db
+    restart: unless-stopped
+    healthcheck:
+      test: ["CMD", "wget", "--no-verbose", "--tries=1", "--spider", "http://localhost:8000/api/models"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 15s
+    networks:
+      - evolution-network
+    labels:
+      - "com.apaw.service=evolution-api"
+      - "com.apaw.description=Agent Evolution Research API"
+
   # Optional: Nginx reverse proxy with SSL
   evolution-nginx:
     image: nginx:alpine
@@ -49,13 +89,14 @@ services:
       - "80:80"
       - "443:443"
     volumes:
-      - ./agent-evolution/nginx.conf:/etc/nginx/nginx.conf:ro
-      - ./agent-evolution/ssl:/etc/nginx/ssl:ro
+      - ./nginx.conf:/etc/nginx/nginx.conf:ro
+      - ./ssl:/etc/nginx/ssl:ro
     depends_on:
       - evolution-dashboard
+      - evolution-api
     networks:
       - evolution-network
 
 networks:
   evolution-network:
-    driver: bridge
\ No newline at end of file
+    driver: bridge
diff --git a/agent-evolution/index.standalone.html b/agent-evolution/index.standalone.html
index 8de3e9b..04cb752 100644
--- a/agent-evolution/index.standalone.html
+++ b/agent-evolution/index.standalone.html
@@ -5083,7 +5083,7 @@ async function init() {
     try {
         // Load real dashboard data FIRST (overrides stale agent-versions)
         try {
-            const dashRes = await fetch('data/dashboard-data.json');
+            const dashRes = await fetch('data/dashboard-data.json', { cache: 'no-cache' });
             if (dashRes.ok) {
                 window.dashboardData = await dashRes.json();
                 // Sync agentData from dashboard data for all other tabs
@@ -5439,64 +5439,63 @@ function renderRecCard(r, index) {
     `;
 }
 
-// Render Heatmap — REAL DATA: Agent × Current Model × Real Fit Score
+// Render Heatmap — REAL DATA: Agent × Model × Live Ollama Evaluations
 function renderHeatmap() {
     const esc = str => (str || '').replace(/[&<>"']/g, m => ({'&':'&amp;','<':'&lt;','>':'&gt;','"':'&quot;',"'":'&#39;'}[m]));
     const dd = window.dashboardData;
 
     if (!dd || !dd.agents) {
-        document.getElementById('hmTable').innerHTML = '<tr><td style="color:var(--text-secondary);padding:20px;text-align:center;">⚠️ Нет данных. Запустите анализ.</td></tr>';
+        document.getElementById('hmTable').innerHTML = '<tr><td style="color:var(--text-secondary);padding:20px;text-align:center;">⚠️ No data. Run analysis.</td></tr>';
         return;
     }
 
-    const agents = dd.agents;
-    // Get unique models sorted by count of agents
-    const modelCounts = {};
-    agents.forEach(a => { modelCounts[a.model_short] = (modelCounts[a.model_short] || 0) + 1; });
-    const modelList = Object.entries(modelCounts)
-        .sort((a, b) => b[1] - a[1])
-        .map(([short]) => {
-            const m = dd.models[short] || {};
-            return {
-                short,
-                full: 'ollama-cloud/' + short,
-                name: m.name || short,
-                avg_fit: m.avg_fit || 0,
-                agents: m.agents || 0
-            };
-        });
+    // Collect every model named by a current assignment or a real-fit evaluation (the 'code-skeptic' key is skipped)
+    const modelsSeen = new Set();
+    dd.agents.forEach(a => { if (a.model_short) modelsSeen.add(a.model_short); });
+    dd.agents.forEach(a => {
+        if (a.real_evaluations) Object.keys(a.real_evaluations).forEach(m => { if (m && m !== 'code-skeptic') modelsSeen.add(m); });
+    });
+    // Sorted, de-duplicated list of every model collected above (current or real-fit evaluated)
+    const modelList = Array.from(modelsSeen).sort();
 
-    // Render table: rows=agents, cols=models
     const t = document.getElementById('hmTable');
     let h = '<thead><tr><th class="hm-role">Agent</th>';
     modelList.forEach(m => {
-        const color = m.avg_fit >= 85 ? '#00ff94' : m.avg_fit >= 70 ? '#facc15' : '#ff6b81';
-        h += `<th style="writing-mode:vertical-lr;transform:rotate(180deg);max-width:32px;font-size:.56em;padding:3px 1px;">
-            ${esc(m.name)}<br>
-            <span style="color:${color};font-size:.9em;font-weight:700">avg:${m.avg_fit}</span><br>
-            <span style="color:var(--text-muted);font-size:.8em">${m.agents}</span>
-        </th>`;
+        // Average this model's positive real_evaluations scores across dd.agents (0 when there are none)
+        let sum = 0, cnt = 0;
+        dd.agents.forEach(a => { const v = (a.real_evaluations || {})[m]; if (v > 0) { sum += v; cnt++; } });
+        const avg = cnt > 0 ? Math.round(sum / cnt) : 0;
+        const color = avg >= 85 ? '#00ff94' : avg >= 70 ? '#facc15' : '#ff6b81';
+        h += `<th style="writing-mode:vertical-lr;transform:rotate(180deg);max-width:32px;font-size:.56em;padding:3px 1px;">${esc(m)}<br><span style="color:${color};font-size:.9em;font-weight:700">avg:${avg}</span></th>`;
     });
-    h += '</tr></thead><tbody>';
+    h += '<th>Best</th><th>Score</th></tr></thead><tbody>';
 
-    agents.forEach(a => {
+    dd.agents.forEach(a => {
         h += `<tr><td class="hm-r">${esc(a.name)}</td>`;
-        modelList.forEach((m, j) => {
-            const isCurrent = a.model_short === m.short;
-            const score = isCurrent ? a.fit_score : 0; // Only show score for CURRENT model
-            const cur = isCurrent;
-            let marks = '';
-            if (cur) marks += '<span style="border:1px solid var(--accent-cyan);border-radius:50%;padding:1px 3px;font-size:8px">●</span>';
-            const bg = cur ? hmColor(score) : 'transparent';
-            const txt = cur ? hmText(score) : 'var(--text-muted)';
-            h += `<td style="background:${bg};color:${txt};cursor:pointer${cur ? ';box-shadow:inset 0 0 0 2px var(--accent-cyan)' : ''}" class="${cur ? 'hm-cur' : ''}"
-                title="${esc(a.name)} → ${esc(m.name)}: ${isCurrent ? 'fit=' + a.fit_score + ', if=' + a.instruction_following : 'не использует этот модель'}"
-                onmouseover="showTT(event,'${esc(a.name)}','${esc(m.name)}',${isCurrent ? a.fit_score : 0},${isCurrent},${cur},${isCurrent ? a.instruction_following : 0})"
-                onmouseout="hideTT()"
-                onclick="openHmModal(event, '${esc(a.name)}', '${esc(m.name)}', ${isCurrent ? a.fit_score : 0}, ${isCurrent ? a.instruction_following : 0})"
-            >${isCurrent ? a.fit_score : '·'}${marks}</td>`;
+        modelList.forEach(m => {
+            const isCurrent = a.model_short === m;
+            let score = 0;
+            // Prefer the real-fit score; fall back to the current fit_score
+            if (a.real_evaluations && a.real_evaluations[m] > 0) score = Math.round(a.real_evaluations[m]);
+            else if (isCurrent) score = Math.round(a.fit_score || 0);
+
+            let cls = 'na';
+            if (score >= 90) cls = 'high';
+            else if (score >= 75) cls = 'good';
+            else if (score >= 50) cls = 'med';
+            else if (score > 0) cls = 'low';
+
+            const curMark = isCurrent ? ' ●' : '';
+            const curStyle = isCurrent ? 'box-shadow:inset 0 0 0 2px var(--accent-cyan);' : '';
+            const bg = score > 0 ? hmColor(score) : 'transparent';
+            const txt = score >= 75 ? '#0e1219' : 'var(--text-primary)';
+            const display = score > 0 ? score : (isCurrent ? Math.round(a.fit_score || 0) : '·');
+
+            h += `<td class="score ${cls}" style="background:${bg};color:${txt};${curStyle}cursor:pointer" title="${esc(a.name)} → ${esc(m)}: ${score > 0 ? 'real fit=' + score : (isCurrent ? 'fit=' + a.fit_score : 'no data')}" onclick="openHmModal(event,'${esc(a.name)}','${esc(m)}',${score},${a.instruction_following || 0})">${display}${curMark}</td>`;
         });
-        h += '</tr>';
+        const bestModel = a.real_best_model || a.model_short;
+        const bestScore = a.real_best_score ? Math.round(a.real_best_score) : Math.round(a.fit_score || 0);
+        h += `<td>${esc(bestModel)}</td><td style="font-weight:700">${bestScore}</td></tr>`;
     });
     t.innerHTML = h + '</tbody>';
 }
@@ -5511,29 +5510,6 @@ function hmColor(v) {
     return 'rgba(90,104,128,.2)';
 }
 
-function hmText(v) {
-    return v >= 75 ? '#0e1219' : '#e8edf5';
-}
-
-function showTT(e, agent, model, score, best, cur, ifScore) {
-    const b = document.getElementById('ttBox'), o = document.getElementById('ttOverlay');
-    const ifColor = ifScore >= 85 ? '#00ff94' : ifScore >= 75 ? '#facc15' : '#ff6b81';
-    const ifLabel = ifScore >= 85 ? 'Excellent' : ifScore >= 75 ? 'Average' : 'Weak';
-    b.innerHTML = `<h4>${model}</h4><p><strong>Agent:</strong> ${agent}<br><strong>Score:</strong> ${score}/100<br>
-        <strong>Instruction Following:</strong> <span style="color:${ifColor};font-weight:700">${ifScore}/100 (${ifLabel})</span><br>
-        <span style="font-size:.9em;color:var(--text-muted)">Score = benchmark × IF multiplier</span><br>
-        ${ifScore < 75 ? '<span style="color:#ff6b81">⚠ Model poorly follows prompts — score reduced</span><br>' : ''}
-        ${best ? '★ <strong>Best fit</strong><br>' : ''}${cur ? '📌 <strong>Current</strong>' : ''}</p>`;
-    const r = e.target.getBoundingClientRect();
-    b.style.left = Math.min(r.left, window.innerWidth - 320) + 'px';
-    b.style.top = (r.bottom + 6) + 'px';
-    o.classList.add('show');
-}
-
-function hideTT() {
-    document.getElementById('ttOverlay').classList.remove('show');
-}
-
 // Current modal state
 let hmCurrentAgent = null;
 let hmCurrentModel = null;
diff --git a/agent-evolution/real-fit.html b/agent-evolution/real-fit.html
new file mode 100644
index 0000000..d993875
--- /dev/null
+++ b/agent-evolution/real-fit.html
@@ -0,0 +1,460 @@
+<!DOCTYPE html>
+<html lang="ru">
+<head>
+<meta charset="UTF-8">
+<meta name="viewport" content="width=device-width, initial-scale=1.0">
+<title>Real-Fit Matrix — Agent × Model Performance</title>
+<style>
+:root{--bg:#0a0f1a;--bg2:#0f1525;--bg3:#141c2e;--bdr:#1e2d45;--txt:#e8f1ff;--txt2:#8ba3c0;--cyan:#00d4ff;--green:#00ff94;--red:#ff4757;--orange:#ff9f43;--purple:#a855f7;}
+*{margin:0;padding:0;box-sizing:border-box}
+body{font-family:system-ui,-apple-system,sans-serif;background:var(--bg);color:var(--txt);min-height:100vh;padding:24px}
+h1{font-size:1.6rem;background:linear-gradient(90deg,var(--cyan),var(--green));-webkit-background-clip:text;-webkit-text-fill-color:transparent;margin-bottom:8px}
+.sub{color:var(--txt2);font-size:.85rem;margin-bottom:20px}
+table{width:100%;border-collapse:collapse;font-size:.82rem}
+th,td{padding:8px 10px;border:1px solid var(--bdr);text-align:center}
+th{background:var(--bg2);color:var(--txt2);font-size:.72rem;text-transform:uppercase;letter-spacing:.5px;position:sticky;top:0}
+td:first-child{text-align:left;font-weight:700;white-space:nowrap}
+td.score{font-weight:700;font-family:monospace}
+.hm-cur{box-shadow:inset 0 0 0 2px var(--cyan)}
+.high{background:rgba(0,255,148,.18);color:var(--green)}
+.good{background:rgba(0,212,255,.14);color:var(--cyan)}
+.med{background:rgba(168,85,247,.15);color:var(--purple)}
+.low{background:rgba(255,71,87,.1);color:var(--red)}
+.na{background:transparent;color:var(--txt2);font-size:.9rem;cursor:pointer}
+.na:hover{background:rgba(0,212,255,.08)}
+.legend{display:flex;gap:12px;flex-wrap:wrap;margin-top:16px;font-size:.78rem;color:var(--txt2)}
+.legend span{display:flex;align-items:center;gap:4px}
+.dot{width:14px;height:14px;border-radius:3px}
+.meta{font-size:.72rem;color:var(--txt2);margin-top:12px}
+a{color:var(--cyan);text-decoration:none}
+.btn-research{font-size:.9rem;background:none;border:none;cursor:pointer;margin-left:4px;opacity:.7}
+.btn-research:hover{opacity:1}
+.modal{position:fixed;inset:0;background:rgba(0,0,0,.7);display:flex;align-items:center;justify-content:center;z-index:1000;padding:16px}
+.modal.hidden{display:none}
+.modal-panel{background:var(--bg2);border:1px solid var(--cyan);border-radius:12px;max-width:90vw;width:480px;max-height:90vh;overflow-y:auto;padding:20px;position:relative}
+.modal-panel.wide{width:640px}
+.modal-title{font-size:1.1rem;margin-bottom:12px}
+.modal-list{text-align:left;margin:12px 0;max-height:40vh;overflow-y:auto}
+.modal-list label{display:flex;align-items:center;gap:8px;padding:6px 0;cursor:pointer;border-bottom:1px solid var(--bdr)}
+.modal-list input{margin:0}
+.modal-actions{display:flex;gap:8px;justify-content:flex-end;margin-top:16px}
+.btn{padding:6px 14px;border-radius:6px;border:1px solid var(--bdr);background:var(--bg3);color:var(--txt);cursor:pointer;font-size:.85rem}
+.btn.primary{background:linear-gradient(90deg,var(--green),var(--cyan));color:#000;border:none;font-weight:700}
+.progress{margin-top:12px}
+.progress-bar{height:8px;background:var(--bg3);border-radius:4px;overflow:hidden}
+.progress-fill{height:100%;width:0%;background:linear-gradient(90deg,var(--green),var(--cyan));transition:width .3s}
+.progress-text{font-size:.8rem;color:var(--txt2);margin-top:6px;text-align:center}
+.result-table{width:100%;margin-top:12px;font-size:.82rem;border-collapse:collapse}
+.result-table th,.result-table td{padding:6px;border:1px solid var(--bdr)}
+.result-table .best{background:rgba(0,255,148,.25);color:var(--green);font-weight:700}
+.result-table tbody tr{cursor:pointer}
+.result-table tbody tr:hover{background:rgba(0,212,255,.06)}
+.detail-row{margin-bottom:12px}
+.detail-label{font-size:.72rem;color:var(--txt2);text-transform:uppercase;letter-spacing:.5px;margin-bottom:4px}
+.detail-val{font-size:.85rem;white-space:pre-wrap;word-break:break-word}
+.detail-pills{display:flex;flex-wrap:wrap;gap:6px;margin-top:4px}
+.pill{font-size:.72rem;padding:2px 8px;border-radius:4px;background:var(--bg3);border:1px solid var(--bdr);color:var(--txt2)}
+.score-big{font-size:2rem;font-weight:700;margin:4px 0}
+.toggle{color:var(--cyan);cursor:pointer;font-size:.78rem}
+.toggle:hover{text-decoration:underline}
+.dim-bar{display:flex;align-items:center;gap:8px;margin:4px 0}
+.dim-bar>span:first-child{width:120px;font-size:.75rem;color:var(--txt2);white-space:nowrap;overflow:hidden;text-overflow:ellipsis}
+.dim-track{flex:1;height:8px;background:var(--bg3);border-radius:4px;overflow:hidden}
+.dim-fill{height:100%;border-radius:4px}
+.dim-num{width:30px;text-align:right;font-size:.78rem;font-weight:700}
+.v-pass{color:var(--green)}
+.v-marginal{color:var(--orange)}
+.v-fail{color:var(--red)}
+.commentary{font-size:.85rem;padding:10px 12px;background:rgba(0,212,255,.08);border-left:3px solid var(--cyan);border-radius:0 6px 6px 0;color:var(--txt);white-space:pre-wrap;word-break:break-word}
+</style>
+</head>
+<body>
+<h1>Real-Fit Matrix</h1>
+<div class="sub">Real agent × model evaluation scores via live Ollama API (28 calls, 4 models, 7 agents)</div>
+<div id="matrix"></div>
+<div class="legend">
+  <span><span class="dot high"></span> 90+ Excellent</span>
+  <span><span class="dot good"></span> 75–89 Good</span>
+  <span><span class="dot med"></span> 50–74 Average</span>
+  <span><span class="dot low"></span> &lt;50 Weak</span>
+  <span style="margin-left:auto">● = assigned model</span>
+</div>
+<div class="meta">Data source: <a href="data/real-fit-report.json" target="_blank">real-fit-report.json</a> | Updated: <span id="updated"></span></div>
+
+<div id="researchAgentModal" class="modal hidden">
+  <div class="modal-panel">
+    <div class="modal-title" id="agentModalTitle">Research models</div>
+    <div class="modal-list" id="agentModalList"></div>
+    <div class="progress hidden" id="agentProgress">
+      <div class="progress-bar"><div class="progress-fill" id="agentProgressFill"></div></div>
+      <div class="progress-text" id="agentProgressText"></div>
+    </div>
+    <div class="modal-actions">
+      <button class="btn" onclick="closeModal('researchAgentModal')">Close</button>
+      <button class="btn" id="evolveAgentBtn" onclick="startEvolveAgent()">Run Role-Fit Test</button>
+      <button class="btn primary" id="agentStartBtn" onclick="startAgentResearch()">Start Research</button>
+    </div>
+    <div id="agentResults"></div>
+  </div>
+</div>
+
+<div id="researchCellModal" class="modal hidden">
+  <div class="modal-panel">
+    <div class="modal-title" id="cellModalTitle">Evaluate cell</div>
+    <div class="modal-list" id="cellModalList"></div>
+    <div class="progress hidden" id="cellProgress">
+      <div class="progress-bar"><div class="progress-fill" id="cellProgressFill"></div></div>
+      <div class="progress-text" id="cellProgressText"></div>
+    </div>
+    <div class="modal-actions">
+      <button class="btn" onclick="closeModal('researchCellModal')">Close</button>
+      <button class="btn primary" id="cellStartBtn" onclick="startCellResearch()">Evaluate</button>
+    </div>
+    <div id="cellResults"></div>
+  </div>
+</div>
+
+<div id="detailModal" class="modal hidden">
+  <div class="modal-panel wide">
+    <div style="display:flex;justify-content:space-between;align-items:center;margin-bottom:12px">
+      <span style="font-size:1rem;font-weight:700" id="detailTitle"></span>
+      <button class="btn" onclick="closeModal('detailModal')">Close</button>
+    </div>
+    <div id="detailContent"></div>
+  </div>
+</div>
+
+<script>
+let reportData, evoData, allModels=[], allAvailableModels=[];
+const API_BASE='http://localhost:3004';
+const $=id=>document.getElementById(id);
+
+const MODEL_BENCHMARKS={
+  "qwen3.5-122b":91,"qwen3-coder-480b":88,"deepseek-v4-pro-max":89,
+  "deepseek-v4-flash":86,"kimi-k2.6":91,"kimi-k2.5":90,
+  "minimax-m2.5":82,"minimax-m2.7":80,"glm-5.1":90,
+  "glm-5":90,"nemotron-3-super":78,"nemotron-3-nano":68,
+  "gemma4-27b":85,"devstral-2":80,"devstral-small-2":75
+};
+function clsFor(s){if(s>=90)return'score high';if(s>=75)return'score good';if(s>=50)return'score med';return'score low';}
+function scoreColor(s){if(s>=90)return'var(--green)';if(s>=75)return'var(--cyan)';if(s>=50)return'var(--purple)';return'var(--red)';}
+function closeModal(id){$(id).classList.add('hidden');}
+
+async function load(){
+  // Fetches the model list and the fit report (live API first, bundled JSON as fallback), then renders the matrix.
+  try{ const mRes=await fetch(`${API_BASE}/api/models`); if(!mRes.ok) throw new Error('HTTP '+mRes.status); allAvailableModels=(await mRes.json()).models||[]; }
+  catch(e){ allAvailableModels=Object.keys(MODEL_BENCHMARKS); }
+  try{
+    const rRes=await fetch(`${API_BASE}/api/real-fit-report`);
+    if(!rRes.ok) throw new Error('HTTP '+rRes.status); // fetch resolves on 4xx/5xx; an error body is not a report
+    reportData=await rRes.json();
+  }catch(e){
+    const rRes=await fetch('data/real-fit-report.json');
+    if(!rRes.ok) throw new Error('real-fit-report.json: HTTP '+rRes.status);
+    reportData=await rRes.json();
+  }
+  const eRes=await fetch('data/evolution.json');
+  evoData=await eRes.json();
+  reportData.generated = reportData.generated || new Date().toISOString();
+  // API data is no longer mixed with the local cache: stale cached scores would otherwise override live DB data.
+  if (reportData.source && reportData.source.includes('db')) {
+    try { localStorage.removeItem('__researchResults'); } catch(e) {}
+  }
+  $('updated').textContent=new Date(reportData.generated).toLocaleString('ru-RU');
+  const agents=Object.values(reportData.agents).filter(a=>Object.values(a.evaluations).some(s=>s>0));
+  const modelScores={};
+  agents.forEach(a=>{for(const[m,s] of Object.entries(a.evaluations)){modelScores[m]=(modelScores[m]||0)+s;}});
+  allModels=Object.keys(modelScores).filter(m=>modelScores[m]>0).sort();
+  // Cached per-browser results (if any survived the reset above) are layered on top before rendering.
+  mergeCachedResults();
+  renderTable();
+}
+
+function currentModel(agentName){
+  const info=reportData.agents[agentName]?.info||[];
+  return (info[2]||'').split('/').pop();
+}
+
+function modelShort(full){return full.replace('ollama-cloud/','');}
+
+function openAgentModal(agent){
+  $('agentModalTitle').textContent='Research models for '+agent;
+  const cur=currentModel(agent);
+  let html='';
+  allAvailableModels.forEach(full=>{
+    const m=modelShort(full);
+    const checked=m===cur||cur.replace(':','-')===m||m.replace('-',':')===cur?'checked':'';
+    const ifs=MODEL_BENCHMARKS[m]||'—';
+    html+=`<label><input type="checkbox" value="${m}" ${checked}> <span>${m}</span> <span style="color:var(--txt2);margin-left:auto">IF ${ifs}</span></label>`;
+  });
+  $('agentModalList').innerHTML=html||'<p style="color:var(--txt2)">No model data</p>';
+  $('agentResults').innerHTML='';
+  $('agentProgress').classList.add('hidden');
+  $('agentStartBtn').disabled=false;
+  $('evolveAgentBtn').disabled=false;
+  $('researchAgentModal').classList.remove('hidden');
+  window.__activeAgent=agent;
+}
+
+function openCellModal(agent,model){
+  $('cellModalTitle').textContent='Evaluate '+agent+' × '+model;
+  $('cellModalList').innerHTML=`<label><input type="checkbox" value="${model}" checked> <span>${model}</span></label>`;
+  $('cellResults').innerHTML='';
+  $('cellProgress').classList.add('hidden');
+  $('cellStartBtn').disabled=false;
+  $('researchCellModal').classList.remove('hidden');
+  window.__activeAgent=agent; window.__activeModel=model;
+}
+
+async function openDetail(agent,model){
+  // Opens the detail modal for one agent × model pair and fills it from GET /api/evaluation/{agent}/{model}.
+  // Every value taken from the response (prompts, model output, commentary, keys) is HTML-escaped before it is
+  // written to innerHTML, because the evaluated model's text is untrusted input.
+  $('detailTitle').textContent=agent+' × '+model;
+  $('detailContent').innerHTML='<p style="color:var(--txt2)">Loading...</p>';
+  $('detailModal').classList.remove('hidden');
+  let data;
+  try{
+    const res=await fetch(`${API_BASE}/api/evaluation/${encodeURIComponent(agent)}/${encodeURIComponent(model)}`);
+    if(!res.ok) throw new Error(res.status);
+    data=await res.json();
+  }catch(e){
+    $('detailContent').innerHTML='<p style="color:var(--red);margin-top:12px">No detailed evaluation data available for this combination. Run research first.</p>';
+    return;
+  }
+  const s=data.total_score??data.score??0;
+  const esc=v=>String(v??'').replace(/[&<>"']/g,c=>({'&':'&amp;','<':'&lt;','>':'&gt;','"':'&quot;',"'":'&#39;'}[c]));
+  const verdict=(data.verdict||'').toUpperCase();
+  const vClass={PASS:'v-pass',MARGINAL:'v-marginal',FAIL:'v-fail'}[verdict]||'';
+  const verdictHtml=verdict?`<span class="${vClass}" style="font-size:.85rem;font-weight:700;border:1px solid currentColor;padding:2px 8px;border-radius:4px;margin-left:8px">${esc(verdict)}</span>`:'';
+  // Per-dimension bars; the width is clamped so an out-of-range score cannot overflow the track.
+  let scoresHtml='';
+  if(data.scores){
+    scoresHtml='<div class="detail-row"><div class="detail-label">Score Breakdown</div>';
+    for(const [k,v] of Object.entries(data.scores)){
+      const num=typeof v==='number'?v:Number(v)||0;
+      scoresHtml+=`<div class="dim-bar"><span>${esc(k)}</span><div class="dim-track"><div class="dim-fill" style="width:${Math.max(0,Math.min(100,num))}%;background:${scoreColor(num)}"></div></div><span class="dim-num">${Math.round(num)}</span></div>`;
+    }
+    scoresHtml+='</div>';
+  }
+
+  let commentaryHtml='';
+  if(data.explanation){
+    commentaryHtml=`<div class="detail-row"><div class="detail-label">Evaluator Commentary</div><div class="commentary">${esc(data.explanation)}</div></div>`;
+  }
+
+  let rubricHtml='';
+  if(data.rubric){
+    rubricHtml='<div class="detail-row"><div class="detail-label">Rubric Weights</div><div class="detail-pills">';
+    for(const [k,v] of Object.entries(data.rubric)){
+      rubricHtml+=`<span class="pill">${esc(k)}: ${esc(v)}</span>`;
+    }
+    rubricHtml+='</div></div>';
+  }
+
+  let kwHtml='';
+  if(data.expected_keywords?.length){ kwHtml='<div class="detail-pills">'+data.expected_keywords.map(k=>`<span class="pill">${esc(k)}</span>`).join('')+'</div>'; }
+  const resp=(data.response||'').toString();
+  const trunc=resp.length>500?resp.slice(0,500)+'...':resp;
+  const more=resp.length>500;
+  const rid='r'+Math.random().toString(36).slice(2);
+  window.__respCache=window.__respCache||{};
+  window.__respCache[rid]={full:resp,trunc:trunc};
+  let respHtml=`<div class="detail-val" id="${rid}">${esc(trunc)}</div>`;
+  if(more) respHtml+=`<span class="toggle" onclick="const c=window.__respCache['${rid}'];const el=$('${rid}');const isFull=el.dataset.f==='1';el.textContent=isFull?c.trunc:c.full;el.dataset.f=isFull?'0':'1';this.textContent=isFull?'Show more':'Show less'">Show more</span>`;
+  const lat=data.latency_ms;
+  const latTxt=typeof lat==='number'?(lat>=1000?(lat/1000).toFixed(1)+'s':lat+'ms'):'—';
+
+  $('detailContent').innerHTML=`
+    <div class="detail-row"><div class="detail-label">Agent × Model</div><div class="detail-val">${esc(agent)} × ${esc(model)}${verdictHtml}</div></div>
+    <div class="detail-row"><div class="detail-label">Total Score</div><div class="score-big" style="color:${scoreColor(s)}">${Math.round(s)}</div></div>
+    ${scoresHtml}
+    <div class="detail-row"><div class="detail-label">Task</div><div class="detail-val">${esc(data.user_prompt||'—')}</div></div>
+    <div class="detail-row"><div class="detail-label">System Role</div><div class="detail-val">${esc(data.system_prompt||'—')}</div></div>
+    <div class="detail-row"><div class="detail-label">Model Response</div>${respHtml}</div>
+    ${commentaryHtml}
+    ${rubricHtml}
+    <div class="detail-row"><div class="detail-label">Evaluator</div><div class="detail-val">${esc(data.evaluator||'—')}</div></div>
+    <div class="detail-row"><div class="detail-label">Latency</div><div class="detail-val">${latTxt}</div></div>
+    <div class="detail-row"><div class="detail-label">Tokens</div><div class="detail-val">Prompt: ${esc(data.tokens_prompt??0)} / Response: ${esc(data.tokens_response??0)}</div></div>
+    <div class="detail-row"><div class="detail-label">Expected Keywords</div>${kwHtml||'<div class="detail-val">—</div>'}</div>
+    <div class="detail-row"><div class="detail-label">Evaluated At</div><div class="detail-val">${data.evaluated_at?new Date(data.evaluated_at).toLocaleString('ru-RU'):'—'}</div></div>
+  `;
+}
+
+async function animateProgress(pid,label,ms){
+  const bar=$(pid+'Fill'),txt=$(pid+'Text'),wrap=$(pid);
+  wrap.classList.remove('hidden'); txt.textContent=label; bar.style.width='0%';
+  await new Promise(r=>setTimeout(r,50)); bar.style.transition=`width ${ms}ms linear`;
+  await new Promise(r=>setTimeout(r,50)); bar.style.width='100%';
+  await new Promise(r=>setTimeout(r,ms));
+  bar.style.transition='width .3s';
+}
+
+function setProgress(pid,percent,label){
+  const bar=$(pid+'Fill'),txt=$(pid+'Text'),wrap=$(pid);
+  wrap.classList.remove('hidden'); txt.textContent=label; bar.style.width=percent+'%';
+}
+
+function mergeCachedResults(){
+  try{
+    const store=JSON.parse(localStorage.getItem('__researchResults')||'{}');
+    for(const[agent,rec] of Object.entries(store)){
+      if(!reportData.agents[agent]) continue;
+      for(const r of (rec.models||[])){
+        reportData.agents[agent].evaluations[r.model]=r.score;
+        if(!allModels.includes(r.model)) allModels.push(r.model);
+      }
+    }
+    allModels.sort();
+  }catch(e){}
+}
+
+function renderTable(){
+  // Rebuilds the agent × model matrix inside #matrix. Names are HTML-escaped and handed to the click handlers
+  // through data-* attributes, so quotes or markup in an agent/model name cannot break out of the onclick code.
+  const esc=v=>String(v??'').replace(/[&<>"']/g,c=>({'&':'&amp;','<':'&lt;','>':'&gt;','"':'&quot;',"'":'&#39;'}[c]));
+  const agents=Object.values(reportData.agents).filter(a=>Object.values(a.evaluations).some(s=>s>0));
+  let html='<table><thead><tr><th>Agent</th>'+allModels.map(m=>`<th>${esc(m)}</th>`).join('')+'<th>Best</th><th>Score</th></tr></thead><tbody>';
+  agents.forEach(a=>{
+    const name=esc(a.name);
+    html+=`<tr><td>${name} <button class="btn-research" data-agent="${name}" onclick="openAgentModal(this.dataset.agent)" title="Research models">🔬</button></td>`;
+    allModels.forEach(m=>{
+      const score=a.evaluations[m];
+      const isCur=a.info&&a.info[2]&&a.info[2].includes(m);
+      const scored=score!==undefined&&score>0; // scored cells open the detail view, empty cells start an evaluation
+      html+=`<td class="${scored?clsFor(score):'na'}${isCur?' hm-cur':''}" data-agent="${name}" data-model="${esc(m)}" onclick="${scored?'openDetail':'openCellModal'}(this.dataset.agent,this.dataset.model)">${scored?Math.round(score):'—'}${isCur?' ●':''}</td>`;
+    });
+    html+=`<td>${esc(a.best_model??'—')}</td><td style="font-weight:700">${Number.isFinite(Number(a.best_score))?Math.round(a.best_score):'—'}</td></tr>`;
+  });
+  html+='</tbody></table>';
+  $('matrix').innerHTML=html;
+}
+
+function updateCell(agent,model,score){
+  if(reportData.agents[agent]){
+    reportData.agents[agent].evaluations[model]=score;
+  }
+  if(!allModels.includes(model)){
+    allModels.push(model);
+    allModels.sort();
+  }
+  renderTable();
+}
+
+async function pollJob(jobId,pid){
+  for(let i=0;i<60;i++){
+    await new Promise(r=>setTimeout(r,2000));
+    try{
+      const res=await fetch(`${API_BASE}/api/research/${jobId}`);
+      if(!res.ok) continue;
+      const job=await res.json();
+      if(job.status==='pending') setProgress(pid,25,'Waiting in queue...');
+      else if(job.status==='running') setProgress(pid,75,'Running evaluation...');
+      else if(job.status==='done'){ setProgress(pid,100,'Done!'); return job; }
+      else if(job.status==='error'){ setProgress(pid,100,'Error!'); return job; }
+    }catch(e){ console.warn('poll error',e); }
+  }
+  setProgress(pid,100,'Timeout'); return {status:'timeout'};
+}
+
+async function startAgentResearch(){
+  // Runs a research job for the active agent over the checked models, then renders, applies and caches the scores.
+  const esc=v=>String(v??'').replace(/[&<>"']/g,c=>({'&':'&amp;','<':'&lt;','>':'&gt;','"':'&quot;',"'":'&#39;'}[c]));
+  const agent=window.__activeAgent;
+  const models=[...$('agentModalList').querySelectorAll('input:checked')].map(i=>i.value);
+  if(!models.length)return;
+  $('agentStartBtn').disabled=$('evolveAgentBtn').disabled=true;
+  setProgress('agentProgress',10,'Submitting job...');
+  try{
+    let job;
+    try{
+      const res=await fetch(`${API_BASE}/api/research`,{method:'POST',headers:{'Content-Type':'application/json'},body:JSON.stringify({agent,models})});
+      if(!res.ok) throw new Error('API error '+res.status);
+      job=await pollJob((await res.json()).job_id,'agentProgress');
+    }catch(e){
+      $('agentResults').innerHTML='<p style="color:var(--red);margin-top:12px">API unavailable — run real-fit-engine.py to evaluate '+esc(agent)+'</p>';
+      $('agentProgressText').textContent='Error: API unavailable';
+      return;
+    }
+    const results=job.models_scored||[];
+    if(!results.length){
+      // pollJob also resolves for failed and timed-out jobs: report that instead of "Done! Best score: -1".
+      $('agentResults').innerHTML='<p style="color:var(--red);margin-top:12px">No scores returned (job status: '+esc(job.status)+')</p>';
+      $('agentProgressText').textContent='No results ('+job.status+')';
+      return;
+    }
+    const best=results.reduce((b,r)=>r.score>b?r.score:b,-1);
+    const rows=results.map(r=>`<tr class="${r.score>=best-0.1?'best':''}" data-agent="${esc(agent)}" data-model="${esc(r.model)}" onclick="openDetail(this.dataset.agent,this.dataset.model)"><td>${esc(r.model)}</td><td>${Math.round(r.score)}</td></tr>`);
+    $('agentResults').innerHTML='<table class="result-table"><thead><tr><th>Model</th><th>Score</th></tr></thead><tbody>'+rows.join('')+'</tbody></table>';
+    results.forEach(r=>updateCell(agent,r.model,r.score));
+    $('agentProgressText').textContent='Done! Best score: '+Math.round(best);
+    try{
+      const store=JSON.parse(localStorage.getItem('__researchResults')||'{}');
+      store[agent]={models:results,ts:Date.now()};
+      localStorage.setItem('__researchResults',JSON.stringify(store));
+    }catch(e){ console.warn('could not cache research results',e); }
+  }finally{ $('agentStartBtn').disabled=$('evolveAgentBtn').disabled=false; }
+}
+
+async function startEvolveAgent(){
+  const agent=window.__activeAgent;
+  const models=[...$('agentModalList').querySelectorAll('input:checked')].map(i=>i.value);
+  if(!models.length) return;
+  $('evolveAgentBtn').disabled=true;
+  $('agentStartBtn').disabled=true;
+  setProgress('agentProgress',10,'Submitting evolve-agent job...');
+  try{
+    const res=await fetch(`${API_BASE}/api/evolve-agent/start`,{method:'POST',headers:{'Content-Type':'application/json'},body:JSON.stringify({agent,models})});
+    if(!res.ok) throw new Error('API error '+res.status);
+    setProgress('agentProgress',50,'Running role-fit test...');
+    const result=await res.json();
+    if(result.job_id){
+      await pollJob(result.job_id,'agentProgress');
+    }else{
+      await animateProgress('agentProgress','Processing...',2000);
+    }
+    setProgress('agentProgress',100,'Done!');
+  }catch(e){
+    console.error('evolve-agent error',e);
+    setProgress('agentProgress',100,'Error: '+e.message);
+    $('evolveAgentBtn').disabled=false;
+    $('agentStartBtn').disabled=false;
+    return;
+  }
+  await load();
+  closeModal('researchAgentModal');
+  $('evolveAgentBtn').disabled=false;
+  $('agentStartBtn').disabled=false;
+}
+
+async function startCellResearch(){
+  // Evaluates the active agent × model pair, updates its matrix cell and caches the score. A job that returns
+  // no score is reported as such instead of being shown and cached as "Score: 0".
+  const esc=v=>String(v??'').replace(/[&<>"']/g,c=>({'&':'&amp;','<':'&lt;','>':'&gt;','"':'&quot;',"'":'&#39;'}[c]));
+  const agent=window.__activeAgent, model=window.__activeModel;
+  $('cellStartBtn').disabled=true; setProgress('cellProgress',10,'Submitting...');
+  try{
+    let job;
+    try{
+      const res=await fetch(`${API_BASE}/api/research/cell`,{method:'POST',headers:{'Content-Type':'application/json'},body:JSON.stringify({agent,model})});
+      if(!res.ok) throw new Error('API error '+res.status);
+      job=await pollJob((await res.json()).job_id,'cellProgress');
+    }catch(e){
+      $('cellResults').innerHTML='<p style="color:var(--red);margin-top:12px">API unavailable — run real-fit-engine.py to evaluate '+esc(agent)+'</p>';
+      $('cellProgressText').textContent='Error: API unavailable';
+      return;
+    }
+    const result=(job.models_scored||[])[0];
+    if(!result){ $('cellProgressText').textContent='No result (job status: '+job.status+')'; return; }
+    updateCell(agent,result.model,result.score);
+    $('cellResults').innerHTML=`<table class="result-table"><tbody><tr data-agent="${esc(agent)}" data-model="${esc(result.model)}" onclick="openDetail(this.dataset.agent,this.dataset.model)"><td>${esc(result.model)}</td><td>${Math.round(result.score)}</td></tr></tbody></table>`;
+    $('cellProgressText').textContent='Done! Score: '+Math.round(result.score);
+    const store=JSON.parse(localStorage.getItem('__researchResults')||'{}');
+    store[agent]={models:[...((store[agent]||{}).models||[]).filter(m=>m.model!==result.model),result],ts:(store[agent]||{}).ts||Date.now()};
+    localStorage.setItem('__researchResults',JSON.stringify(store));
+  }finally{ $('cellStartBtn').disabled=false; } // the button used to stay disabled after a successful run
+}
+
+load().catch(e=>$('matrix').innerHTML='Error: '+e);
+</script>
+</body>
+</html>
diff --git a/agent-evolution/requirements.txt b/agent-evolution/requirements.txt
new file mode 100644
index 0000000..7854f06
--- /dev/null
+++ b/agent-evolution/requirements.txt
@@ -0,0 +1,4 @@
+fastapi==0.136.3
+uvicorn==0.48.0
+python-multipart==0.0.29
+pydantic==2.13.4
\ No newline at end of file
diff --git a/agent-evolution/scripts/audit-system.cjs b/agent-evolution/scripts/audit-system.cjs
new file mode 100644
index 0000000..a0ea72b
--- /dev/null
+++ b/agent-evolution/scripts/audit-system.cjs
@@ -0,0 +1,138 @@
+const fs = require('fs');
+
+function parseFrontmatter(content) {
+  // Returns the flat `key: value` pairs of a leading `---` front-matter block, or null when there is none.
+  const end = content.startsWith('---') ? content.indexOf('---', 3) : -1;
+  if (end === -1) return null;
+  const data = {};
+  // Split on \r?\n: with CRLF files a trailing \r makes /(.+)$/ fail and silently drops every key.
+  for (const line of content.slice(3, end).trim().split(/\r?\n/)) {
+    const m = line.match(/^(\w+):\s*(.+)$/);
+    if (m) data[m[1]] = m[2].trim();
+  }
+  return data;
+}
+
+function stripComments(str) {
+  // Remove `//` line comments; string literals are matched first and kept, so "https://…" values survive.
+  return str.replace(/"(?:\\.|[^"\\\n])*"|\/\/.*$/gm, m => (m[0] === '"' ? m : ''));
+}
+
+const agents = [];
+const commands = [];
+const issues = [];
+
+// 1. Parse agent .md files
+for (const f of fs.readdirSync('.kilo/agents').filter(f => f.endsWith('.md'))) {
+  const content = fs.readFileSync('.kilo/agents/' + f, 'utf8');
+  const fm = parseFrontmatter(content);
+  if (fm && fm.model) {
+    agents.push({
+      name: f.replace('.md', ''),
+      model: fm.model,
+      mode: fm.mode || 'subagent',
+      source: '.kilo/agents/' + f,
+      description: fm.description || ''
+    });
+  }
+}
+
+// 2. Parse command .md files
+for (const f of fs.readdirSync('.kilo/commands').filter(f => f.endsWith('.md'))) {
+  const content = fs.readFileSync('.kilo/commands/' + f, 'utf8');
+  const fm = parseFrontmatter(content);
+  if (fm && fm.model) {
+    commands.push({
+      name: f.replace('.md', ''),
+      model: fm.model,
+      mode: fm.mode || 'command',
+      source: '.kilo/commands/' + f,
+      description: fm.description || ''
+    });
+  }
+}
+
+// 3. Parse kilo-meta.json
+const meta = JSON.parse(fs.readFileSync('kilo-meta.json', 'utf8'));
+for (const a of agents) {
+  const m = meta.agents?.[a.name];
+  if (m) {
+    a.metaModel = m.model;
+    if (a.model !== m.model) issues.push(`AGENT ${a.name}: .md=${a.model} vs meta=${m.model}`);
+  }
+}
+for (const c of commands) {
+  const m = meta.commands?.[c.name];
+  if (m) {
+    c.metaModel = m.model;
+    if (c.model !== m.model) issues.push(`CMD ${c.name}: .md=${c.model} vs meta=${m.model}`);
+  }
+}
+
+// 4. Parse .kilo/kilo.jsonc
+const dotKiloRaw = stripComments(fs.readFileSync('.kilo/kilo.jsonc', 'utf8'));
+const dotKilo = JSON.parse(dotKiloRaw);
+for (const [name, cfg] of Object.entries(dotKilo.agent || {})) {
+  if (!cfg.model) continue;
+  const agent = agents.find(a => a.name === name);
+  if (agent) {
+    agent.kiloModel = cfg.model;
+    if (agent.model !== cfg.model) issues.push(`AGENT ${name}: .md=${agent.model} vs .kilo/kilo.jsonc=${cfg.model}`);
+  }
+}
+
+// 5. Parse root kilo.jsonc
+const rootKiloRaw = stripComments(fs.readFileSync('kilo.jsonc', 'utf8'));
+const rootKilo = JSON.parse(rootKiloRaw);
+for (const [name, cfg] of Object.entries(rootKilo.agent || {})) {
+  if (!cfg.model) continue;
+  const cmd = commands.find(c => c.name === name);
+  if (cmd) {
+    cmd.rootModel = cfg.model;
+    if (cmd.model !== cfg.model) issues.push(`CMD ${name}: .md=${cmd.model} vs kilo.jsonc=${cfg.model}`);
+  }
+}
+
+// 6. Check non-ollama
+const nonOllama = [];
+for (const a of agents) if (!a.model.startsWith('ollama-cloud/')) nonOllama.push({type:'agent', name:a.name, model:a.model});
+for (const c of commands) if (!c.model.startsWith('ollama-cloud/')) nonOllama.push({type:'command', name:c.name, model:c.model});
+
+// 7. Summary by model
+const modelStats = {};
+for (const a of agents) modelStats[a.model] = (modelStats[a.model] || 0) + 1;
+for (const c of commands) modelStats[c.model] = (modelStats[c.model] || 0) + 1;
+
+const state = {
+  generated: new Date().toISOString(),
+  totalAgents: agents.length,
+  totalCommands: commands.length,
+  allOllama: nonOllama.length === 0,
+  modelDistribution: modelStats,
+  agents: agents.sort((a,b) => a.name.localeCompare(b.name)),
+  commands: commands.sort((a,b) => a.name.localeCompare(b.name)),
+  issues: issues,
+  nonOllama: nonOllama
+};
+
+fs.writeFileSync('agent-evolution/data/real-state.json', JSON.stringify(state, null, 2) + '\n');
+
+// Console report
+console.log('=== REAL SYSTEM STATE ===');
+console.log('Generated:', state.generated);
+console.log('Agents:', state.totalAgents);
+console.log('Commands:', state.totalCommands);
+console.log('All ollama-cloud/:', state.allOllama ? 'YES' : 'NO (' + nonOllama.length + ' exceptions)');
+console.log('\n=== MODEL DISTRIBUTION ===');
+for (const [m, c] of Object.entries(modelStats).sort((a,b) => b[1]-a[1])) {
+  console.log(`  ${m}: ${c}`);
+}
+if (issues.length > 0) {
+  console.log('\n=== ISSUES ===');
+  issues.forEach(i => console.log('  ⚠️', i));
+}
+if (nonOllama.length > 0) {
+  console.log('\n=== NON-OLLAMA ==='); // entries whose model does not start with 'ollama-cloud/'
+  nonOllama.forEach(n => console.log('  ❌', n.type, n.name, n.model));
+}
+console.log('\n✅ State written to agent-evolution/data/real-state.json');
diff --git a/agent-evolution/scripts/merge-real-fit.cjs b/agent-evolution/scripts/merge-real-fit.cjs
new file mode 100644
index 0000000..6477896
--- /dev/null
+++ b/agent-evolution/scripts/merge-real-fit.cjs
@@ -0,0 +1,29 @@
+const fs = require('fs');
+const path = require('path');
+
+const DASH = path.join(__dirname, '../data/dashboard-data.json');
+const REAL = path.join(__dirname, '../data/real-fit-report.json');
+const OUT  = path.join(__dirname, '../data/dashboard-data.json');
+
+const dash = JSON.parse(fs.readFileSync(DASH, 'utf-8'));
+const real = JSON.parse(fs.readFileSync(REAL, 'utf-8'));
+
+// Inject real_evaluations into each agent
+dash.agents.forEach(a => {
+    const r = real.agents?.[a.name];
+    if (r && r.evaluations) {
+        a.real_evaluations = r.evaluations;
+        a.real_best_model = r.best_model;
+        a.real_best_score = r.best_score;
+    } else {
+        a.real_evaluations = {};
+    }
+});
+
+// Add metadata
+dash.real_fit_generated = real.generated;
+dash.real_fit_source = real.source;
+
+fs.writeFileSync(OUT, JSON.stringify(dash, null, 2));
+console.log('Merged real-fit data into ' + OUT);
+console.log('Agents with real evals:', dash.agents.filter(a => Object.keys(a.real_evaluations||{}).length > 0).length);
diff --git a/agent-evolution/scripts/patch-heatmap.js b/agent-evolution/scripts/patch-heatmap.js
new file mode 100644
index 0000000..211767f
--- /dev/null
+++ b/agent-evolution/scripts/patch-heatmap.js
@@ -0,0 +1,121 @@
+// Patch agent-evolution/index.standalone.html so the heatmap renders
+// cross-model scores from data/real-fit-report.json.
+//
+// Patch A replaces the page's renderHeatmap() with the implementation below.
+// Patch B makes the page fetch the real-fit report right after the dashboard
+// data is loaded. Both patches can be re-run on an already patched file.
+const fs = require('fs');
+const path = require('path');
+
+const INDEX = path.join(__dirname, '../index.standalone.html');
+
+// 1. New renderHeatmap that reads real-fit data
+const newRenderHeatmap = `function renderHeatmap() {
+    const esc = str => (str || '').replace(/[&<>"']/g, m => ({'&':'&amp;','<':'&lt;','>':'&gt;','"':'&quot;',"'":'&#39;'}[m]));
+    const dd = window.dashboardData;
+
+    // Merge real-fit if loaded
+    const rf = window.realFitData || {};
+    const realAgents = rf.agents || {};
+
+    if (!dd || !dd.agents) {
+        document.getElementById('hmTable').innerHTML = '<tr><td style="color:var(--text-secondary);padding:20px;text-align:center;">⚠️ No data. Run analysis.</td></tr>';
+        return;
+    }
+
+    // Build model list from real-fit (cross-model) + current dashboard data
+    const modelsSeen = new Set();
+    dd.agents.forEach(a => { modelsSeen.add(a.model_short); });
+    Object.values(realAgents).forEach(a => { Object.keys(a.evaluations || {}).forEach(m => modelsSeen.add(m)); });
+    const modelList = Array.from(modelsSeen).filter(m => m && m !== 'code-skeptic');
+
+    const t = document.getElementById('hmTable');
+    let h = '<thead><tr><th class="hm-role">Agent</th>';
+    modelList.forEach(m => {
+        h += '<th style="writing-mode:vertical-lr;transform:rotate(180deg);max-width:32px;font-size:.56em;padding:3px 1px;">' + esc(m) + '</th>';
+    });
+    h += '<th>Best</th><th>Score</th></tr></thead><tbody>';
+
+    dd.agents.forEach(a => {
+        const realAgent = realAgents[a.name];
+        h += '<tr><td class="hm-r">' + esc(a.name) + '</td>';
+        modelList.forEach(m => {
+            let score = 0;
+            if (realAgent && realAgent.evaluations && realAgent.evaluations[m] > 0) {
+                score = Math.round(realAgent.evaluations[m]);
+            }
+            const isCurrent = a.model_short === m;
+            let cls = 'na';
+            if (score >= 90) cls = 'high';
+            else if (score >= 75) cls = 'good';
+            else if (score >= 50) cls = 'med';
+            else if (score > 0) cls = 'low';
+            const display = score > 0 ? score : (isCurrent ? Math.round(a.fit_score || 0) : '·');
+            const curStyle = isCurrent ? 'box-shadow:inset 0 0 0 2px var(--accent-cyan)' : '';
+            h += '<td class="score ' + cls + '" style="' + curStyle + '">' + display + '</td>';
+        });
+        // Without a real best model, fall back to the current model AND its fit score
+        const hasRealBest = !!(realAgent && realAgent.best_model);
+        const bestModel = hasRealBest ? realAgent.best_model : a.model_short;
+        const bestScore = Math.round((hasRealBest ? realAgent.best_score : a.fit_score) || 0);
+        h += '<td>' + esc(bestModel) + '</td><td style="font-weight:700">' + bestScore + '</td></tr>';
+    });
+    t.innerHTML = h + '</tbody>';
+}`;
+
+// 2. Add loadRealFitData script after dashboard load
+const loadRealFitData = `
+        // Load real-fit report for cross-model evaluation
+        try {
+            const rfRes = await fetch('data/real-fit-report.json');
+            if (rfRes.ok) window.realFitData = await rfRes.json();
+        } catch(e) { console.warn('real-fit-report.json not loaded:', e.message); }
+`;
+
+let html = fs.readFileSync(INDEX, 'utf-8');
+
+/**
+ * Find the end of the brace-delimited block that opens at "openIdx".
+ *
+ * Braces are counted as raw characters, so a "{" or "}" inside a string,
+ * regex or comment of the scanned block is counted too.
+ *
+ * @param {string} src      Text to scan.
+ * @param {number} openIdx  Index of the opening "{".
+ * @returns {number} Index just past the matching "}", or -1 if unbalanced.
+ */
+function findBlockEnd(src, openIdx) {
+    let depth = 0;
+    for (let i = openIdx; i < src.length; i++) {
+        if (src[i] === '{') depth++;
+        else if (src[i] === '}' && --depth === 0) return i + 1;
+    }
+    return -1;
+}
+
+// Patch A: replace renderHeatmap function
+// A regex cannot match nested braces, so the end of the function is found by
+// brace matching; a "// Render Heatmap" comment directly above is replaced too.
+const fnHead = /(?:\/\/ Render Heatmap[^\n]*\n\s*)?function renderHeatmap\(\)\s*\{/.exec(html);
+const fnEnd = fnHead ? findBlockEnd(html, fnHead.index + fnHead[0].length - 1) : -1;
+if (fnEnd !== -1) {
+    html = html.substring(0, fnHead.index) + '// Render Heatmap (real-fit enabled)\n' + newRenderHeatmap + html.substring(fnEnd);
+    console.log('Patched renderHeatmap');
+} else {
+    console.warn('renderHeatmap() not found or unbalanced — heatmap left unchanged');
+}
+
+// Patch B: insert real-fit loading after dashboard load
+// Skipped when the loader is already present so a re-run does not insert it twice.
+const dashLoadPattern = /window\.dashboardData = await dashRes\.json\(\);/;
+if (html.includes("fetch('data/real-fit-report.json')")) {
+    console.log('init() already loads real-fit data');
+} else if (dashLoadPattern.test(html)) {
+    html = html.replace(dashLoadPattern, m => m + '\n' + loadRealFitData.trim());
+    console.log('Patched init() to load real-fit data');
+} else {
+    console.warn('Dashboard load statement not found — real-fit loader not inserted');
+}
+
+fs.writeFileSync(INDEX, html);
+console.log('Done — ' + (fs.statSync(INDEX).size / 1024).toFixed(1) + ' KB');
diff --git a/agent-evolution/scripts/rebuild-report.py b/agent-evolution/scripts/rebuild-report.py
new file mode 100644
index 0000000..4bb4df8
--- /dev/null
+++ b/agent-evolution/scripts/rebuild-report.py
@@ -0,0 +1,173 @@
+#!/usr/bin/env python3
+"""
+Rebuild real-fit-report.json from SQLite DB.
+
+Usage:
+    python3 rebuild-report.py
+    python3 rebuild-report.py --db /path/to/real-fit.db --report /path/to/real-fit-report.json
+"""
+
+import argparse
+import json
+import sqlite3
+import time
+from datetime import datetime, timezone
+from pathlib import Path
+
+
+def _sync_agents_from_meta(db_path: Path) -> None:
+    """Insert agents listed in kilo-meta.json that the DB ``agents`` table lacks.
+
+    The meta file is looked up two directory levels above the folder holding
+    *db_path*; when it does not exist the function returns without opening the DB.
+    """
+    meta_path = db_path.parent.parent.parent / "kilo-meta.json"
+    if not meta_path.exists():
+        return
+    with open(meta_path, encoding="utf-8") as f:
+        meta = json.load(f)
+
+    now = datetime.now(timezone.utc).isoformat()
+    conn = sqlite3.connect(str(db_path))
+    try:  # close the connection even when a statement fails
+        # Only names missing from the table are inserted; existing rows stay as is.
+        existing = {r[0] for r in conn.execute("SELECT name FROM agents")}
+        conn.executemany(
+            "INSERT OR IGNORE INTO agents (name, description, category, current_model, color, updated) VALUES (?, ?, ?, ?, ?, ?)",
+            [
+                (name, info.get("description", ""), info.get("category", "meta"),
+                 info.get("model", ""), info.get("color", "#6B7280"), now)
+                for name, info in meta.get("agents", {}).items()
+                if name not in existing
+            ],
+        )
+        conn.commit()
+    finally:
+        conn.close()
+
+
+def build_report(db_path: Path) -> dict:
+    """Build the real-fit report dict from the evaluations stored in the DB.
+
+    Agents missing from the DB are first imported from kilo-meta.json. For every
+    (agent, model) pair one score is selected: rows with a non-positive score, a
+    ``rubric_v1`` evaluator, an empty response or a response containing
+    ``[HTTP `` are skipped; among the rest ``evolution-skeptic`` is preferred over
+    ``rubric_v2`` over any other evaluator, then the highest score wins.
+
+    Args:
+        db_path: Path to the SQLite DB holding ``agents`` and ``evaluations``.
+
+    Returns:
+        A dict with the keys ``generated`` (UTC timestamp), ``source``,
+        ``total_evaluations`` (number of selected agent-model scores),
+        ``agents`` (per-agent evaluations, info and best model/score) and
+        ``fit_scores`` (best model, score and explanation per evaluated agent).
+    """
+    _sync_agents_from_meta(db_path)
+    conn = sqlite3.connect(str(db_path))
+    conn.row_factory = sqlite3.Row
+    try:  # close the connection even when a query fails
+        cursor = conn.cursor()
+
+        cursor.execute("""
+            SELECT name, description, category, current_model
+            FROM agents
+        """)
+        agents_meta = {row["name"]: dict(row) for row in cursor.fetchall()}
+
+        # Skip HTTP error responses and rubric_v1 rows; order the rest so the
+        # preferred evaluator (then the highest score) comes first per pair.
+        cursor.execute("""
+            SELECT agent_name, model, total_score, evaluator, response
+            FROM evaluations
+            WHERE total_score > 0
+              AND evaluator NOT LIKE '%rubric_v1%'
+              AND (response IS NULL
+                   OR (response NOT LIKE '%[HTTP %' AND response != ''))
+            ORDER BY agent_name, model,
+                CASE evaluator
+                    WHEN 'evolution-skeptic' THEN 0
+                    WHEN 'rubric_v2' THEN 1
+                    ELSE 2
+                END,
+                total_score DESC
+        """)
+        selected_rows = cursor.fetchall()
+    finally:
+        conn.close()
+
+    # Take the first (best preferred evaluator, highest score) per agent-model
+    best_evals = {}
+    for row in selected_rows:
+        agent_scores = best_evals.setdefault(row["agent_name"], {})
+        agent_scores.setdefault(row["model"], row["total_score"])
+
+    # Derive fit_scores from the selected evaluations: one entry per agent that
+    # names its best-scoring model, matching "best_model" in the agents section.
+    fit_scores = {}
+    for agent_name, evals in best_evals.items():
+        best_model = max(evals, key=evals.get)
+        fit_scores[agent_name] = {
+            "model": best_model,
+            "fit": evals[best_model],
+            "explanation": (
+                f"Best model for {agent_name} is {best_model} "
+                f"with avg score {evals[best_model]:.1f}. "
+                "Evaluator preference: evolution-skeptic > rubric_v2 > rubric_v1 (ignored HTTP errors)."
+            ),
+        }
+
+    agents_report = {}
+    for agent_name, meta in agents_meta.items():
+        evals = best_evals.get(agent_name, {})
+        best_model = max(evals, key=evals.get) if evals else ""
+        best_score = evals[best_model] if evals else 0.0
+        agents_report[agent_name] = {
+            "name": agent_name,
+            "evaluations": evals,
+            "info": [
+                meta.get("description") or "",
+                meta.get("category") or "",
+                meta.get("current_model") or "",
+            ],
+            "best_model": best_model,
+            "best_score": best_score,
+        }
+
+    return {
+        "generated": time.strftime("%Y-%m-%dT%H:%M:%SZ", time.gmtime()),
+        "source": "real-fit-engine-db-filtered",
+        "total_evaluations": sum(len(evals) for evals in best_evals.values()),
+        "agents": agents_report,
+        "fit_scores": fit_scores,
+    }
+
+
+def main():
+    """Parse --db/--report, rebuild the report from the DB and write it as JSON."""
+    data_dir = Path(__file__).parent.parent / "data"
+    parser = argparse.ArgumentParser(description="Rebuild real-fit-report.json from DB")
+    parser.add_argument(
+        "--db", type=Path, default=data_dir / "real-fit.db", help="Path to SQLite DB"
+    )
+    parser.add_argument(
+        "--report", type=Path, default=data_dir / "real-fit-report.json",
+        help="Path to report JSON output",
+    )
+    args = parser.parse_args()
+    if not args.db.is_file():
+        # sqlite3.connect() would otherwise create an empty DB at the wrong path
+        parser.error(f"DB not found: {args.db}")
+
+    report = build_report(args.db)
+    args.report.parent.mkdir(parents=True, exist_ok=True)
+    with open(args.report, "w", encoding="utf-8") as f:
+        json.dump(report, f, indent=2)
+
+    print(f"Report rebuilt: {args.report}")
+    print(f"Agents: {len(report['agents'])}, Evaluations: {report['total_evaluations']}")
+
+
+if __name__ == "__main__":
+    main()