fix(config): bulk-remove remaining deepseek-v4-pro-max references
- kilo.jsonc: 2 commands + capability-index entries
- capability-index.yaml: 30+ stale refs in recommended_models lists
- commands/*.md: hotfix, plan, code, feature, evolution, evolve-agent

All normalized to deepseek-v4-pro.
This commit is contained in:
@@ -25,7 +25,7 @@ agents:
|
||||
- ollama-cloud/qwen3-coder:480b
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: low
|
||||
frontend-developer:
|
||||
@@ -169,7 +169,7 @@ agents:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: low
|
||||
go-developer:
|
||||
@@ -199,7 +199,7 @@ agents:
|
||||
- code-skeptic
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- groq/llama-3.1-8b-instant
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
@@ -233,7 +233,7 @@ agents:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: low
|
||||
devops-engineer:
|
||||
@@ -260,7 +260,7 @@ agents:
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/glm-5.1
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: low
|
||||
@@ -290,7 +290,7 @@ agents:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/minimax-m2.5
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: low
|
||||
code-skeptic:
|
||||
@@ -316,7 +316,7 @@ agents:
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/qwen3-coder:480b
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama-cloud/kimi-k2.6
|
||||
failover_strategy: mixed
|
||||
@@ -342,7 +342,7 @@ agents:
|
||||
- release-manager
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/glm-5.1
|
||||
failover_strategy: downgraded
|
||||
@@ -368,7 +368,7 @@ agents:
|
||||
- security-auditor
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/glm-5.1
|
||||
- ollama-cloud/kimi-k2.6
|
||||
failover_strategy: downgraded
|
||||
@@ -395,7 +395,7 @@ agents:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/qwen3-coder:480b
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
failover_strategy: mixed
|
||||
reasoning_effort: medium
|
||||
browser-automation:
|
||||
@@ -418,7 +418,7 @@ agents:
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- groq/llama-3.1-8b-instant
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: downgraded
|
||||
@@ -458,7 +458,7 @@ agents:
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- groq/llama-3.1-8b-instant
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: downgraded
|
||||
@@ -483,7 +483,7 @@ agents:
|
||||
delegates_to: []
|
||||
fallback_models:
|
||||
- ollama-cloud/glm-5.1
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/kimi-k2.6
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: high
|
||||
@@ -507,7 +507,7 @@ agents:
|
||||
- agent-architect
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: downgraded
|
||||
@@ -564,7 +564,7 @@ agents:
|
||||
- architect-indexer
|
||||
fallback_models:
|
||||
- ollama-cloud/glm-5.1
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- groq/llama-3.1-8b-instant
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: mixed
|
||||
@@ -590,7 +590,7 @@ agents:
|
||||
delegates_to:
|
||||
- evaluator
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama-cloud/glm-5
|
||||
@@ -619,7 +619,7 @@ agents:
|
||||
- product-owner
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: downgraded
|
||||
@@ -644,7 +644,7 @@ agents:
|
||||
fallback_models:
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: low
|
||||
product-owner:
|
||||
@@ -669,7 +669,7 @@ agents:
|
||||
- ollama-cloud/glm-5
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
failover_strategy: mixed
|
||||
reasoning_effort: low
|
||||
pipeline-judge:
|
||||
@@ -695,7 +695,7 @@ agents:
|
||||
- prompt-optimizer
|
||||
fallback_models:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- groq/llama-3.1-8b-instant
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: mixed
|
||||
@@ -718,7 +718,7 @@ agents:
|
||||
delegates_to: []
|
||||
fallback_models:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: low
|
||||
@@ -739,7 +739,7 @@ agents:
|
||||
delegates_to:
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/glm-5.1
|
||||
- groq/llama-3.1-8b-instant
|
||||
- ollama/qwen3.5-122b
|
||||
@@ -766,7 +766,7 @@ agents:
|
||||
- system-analyst
|
||||
fallback_models:
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: high
|
||||
@@ -791,7 +791,7 @@ agents:
|
||||
mode: subagent
|
||||
delegates_to: []
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/glm-5.1
|
||||
failover_strategy: downgraded
|
||||
@@ -817,7 +817,7 @@ agents:
|
||||
mode: subagent
|
||||
delegates_to: []
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/glm-5.1
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
failover_strategy: downgraded
|
||||
@@ -844,7 +844,7 @@ agents:
|
||||
delegates_to: []
|
||||
fallback_models:
|
||||
- openrouter/qwen/qwen3.6-plus:free
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/glm-5.1
|
||||
failover_strategy: downgraded
|
||||
reasoning_effort: low
|
||||
@@ -918,7 +918,7 @@ agents:
|
||||
- reflector
|
||||
- planner
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/glm-5.1
|
||||
- ollama-cloud/kimi-k2.6
|
||||
failover_strategy: downgraded
|
||||
@@ -946,7 +946,7 @@ agents:
|
||||
- evolution-skeptic
|
||||
- orchestrator
|
||||
fallback_models:
|
||||
- ollama-cloud/deepseek-v4-pro-max
|
||||
- ollama-cloud/deepseek-v4-pro
|
||||
- ollama-cloud/kimi-k2.6
|
||||
- ollama-cloud/glm-5.1
|
||||
- ollama-cloud/qwen3-coder:480b
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
---
|
||||
description: Generates code for small tasks and hotfixes
|
||||
mode: code
|
||||
model: ollama-cloud/deepseek-v4-pro-max
|
||||
model: ollama-cloud/deepseek-v4-pro
|
||||
color: "#10B981"
|
||||
---
|
||||
|
||||
|
||||
@@ -337,8 +337,8 @@ $ /evolution research
|
||||
|
||||
| Agent | Current | Score | Recommended | Score | Δ | Impact |
|
||||
|-------|---------|-------|-------------|-------|---|--------|
|
||||
| planner | nemotron-3-super | 80 | deepseek-v4-pro-max | 88 | +8 | high |
|
||||
| go-developer | qwen3-coder | 85 | deepseek-v4-pro-max | 88 | +3 | medium |
|
||||
| planner | nemotron-3-super | 80 | deepseek-v4-pro | 88 | +8 | high |
|
||||
| go-developer | qwen3-coder | 85 | deepseek-v4-pro | 88 | +3 | medium |
|
||||
| [built-in] debug | glm-5.1 | 88 | kimi-k2.6 | 90 | +2 | high |
|
||||
|
||||
### Output
|
||||
|
||||
@@ -19,7 +19,7 @@ Evaluate which model is the **BEST FIT** for a specific agent role by generating
|
||||
```bash
|
||||
/evolve-agent # evaluate all agents across all fallback models
|
||||
/evolve-agent --agent code-skeptic # focus on one agent
|
||||
/evolve-agent --agent code-skeptic --models ollama-cloud/gpt-oss:120b,ollama-cloud/deepseek-v4-pro-max
|
||||
/evolve-agent --agent code-skeptic --models ollama-cloud/gpt-oss:120b,ollama-cloud/deepseek-v4-pro
|
||||
/evolve-agent --dry-run # show what would be tested without running
|
||||
/evolve-agent --report # generate comparison table from existing DB data
|
||||
```
|
||||
@@ -126,7 +126,7 @@ Output:
|
||||
|--------|------|-------------|
|
||||
| id | INTEGER PK | Auto-increment |
|
||||
| prompt_id | INTEGER FK | References test_prompts.id |
|
||||
| model | TEXT | Model ID tested (e.g. "ollama-cloud/deepseek-v4-pro-max") |
|
||||
| model | TEXT | Model ID tested (e.g. "ollama-cloud/deepseek-v4-pro") |
|
||||
| response | TEXT | Raw model response (truncated if >16 KB) |
|
||||
| scores | TEXT (JSON) | `{adherence, reasoning, instruction, boundary, output}` |
|
||||
| total_score | REAL | Weighted average across dimensions |
|
||||
@@ -185,13 +185,13 @@ $ /evolve-agent --agent code-skeptic
|
||||
|
||||
| Model | Adherence | Reasoning | Instruction | Boundary | Output | **Fit** | Δ vs Current |
|
||||
|-------|-----------|-----------|-------------|----------|--------|---------|-------------|
|
||||
| ollama-cloud/deepseek-v4-pro-max | 94 | 91 | 89 | 87 | 92 | **91** | +3 |
|
||||
| ollama-cloud/deepseek-v4-pro | 94 | 91 | 89 | 87 | 92 | **91** | +3 |
|
||||
| ollama-cloud/kimi-k2.6 | 91 | 88 | 90 | 85 | 89 | **89** | +1 |
|
||||
| ollama-cloud/gpt-oss:120b | 82 | 79 | 81 | 80 | 84 | **81** | -7 |
|
||||
|
||||
**Best fit**: deepseek-v4-pro-max (91/100)
|
||||
**Best fit**: deepseek-v4-pro (91/100)
|
||||
**Current model**: kimi-k2.6 (89/100)
|
||||
**Recommendation**: Consider upgrading to deepseek-v4-pro-max (+2 points)
|
||||
**Recommendation**: Consider upgrading to deepseek-v4-pro (+2 points)
|
||||
|
||||
### Updated Files
|
||||
- `agent-evolution/data/real-fit-report.json`
|
||||
@@ -227,9 +227,9 @@ $ /evolve-agent --report
|
||||
|
||||
| Agent | Current Model | Best Fallback | Fit Score | Gap |
|
||||
|-------|---------------|---------------|-----------|-----|
|
||||
| code-skeptic | kimi-k2.6 | deepseek-v4-pro-max | 91 | +2 |
|
||||
| planner | deepseek-v4-pro-max | deepseek-v4-pro-max | 88 | 0 |
|
||||
| lead-developer | kimi-k2.6 | deepseek-v4-pro-max | 87 | +3 |
|
||||
| code-skeptic | kimi-k2.6 | deepseek-v4-pro | 91 | +2 |
|
||||
| planner | deepseek-v4-pro | deepseek-v4-pro | 88 | 0 |
|
||||
| lead-developer | kimi-k2.6 | deepseek-v4-pro | 87 | +3 |
|
||||
|
||||
Last DB update: 2026-05-27T18:30:00Z
|
||||
```
|
||||
@@ -249,7 +249,7 @@ When run via Gitea issue:
|
||||
```markdown
|
||||
## /evolve-agent results for code-skeptic
|
||||
|
||||
**Best fit**: deepseek-v4-pro-max (91/100)
|
||||
**Best fit**: deepseek-v4-pro (91/100)
|
||||
**Current**: kimi-k2.6 (89/100)
|
||||
|
||||
| Dimension | Current | Best | Δ |
|
||||
@@ -260,7 +260,7 @@ When run via Gitea issue:
|
||||
| Boundary Awareness | 85 | 87 | +2 |
|
||||
| Output Quality | 89 | 92 | +3 |
|
||||
|
||||
**Recommendation**: Upgrade to deepseek-v4-pro-max
|
||||
**Recommendation**: Upgrade to deepseek-v4-pro
|
||||
**Confidence**: high (3 model sweep, 5 prompts, 15 evaluations)
|
||||
```
|
||||
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
---
|
||||
description: Full feature development pipeline from requirements to release
|
||||
mode: feature
|
||||
model: ollama-cloud/deepseek-v4-pro-max
|
||||
model: ollama-cloud/deepseek-v4-pro
|
||||
color: "#059669"
|
||||
permission:
|
||||
read: allow
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
---
|
||||
description: Quick bug fix workflow for urgent production issues
|
||||
mode: hotfix
|
||||
model: ollama-cloud/deepseek-v4-pro-max
|
||||
model: ollama-cloud/deepseek-v4-pro
|
||||
color: "#DC2626"
|
||||
permission:
|
||||
read: allow
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
---
|
||||
description: Creates detailed task plans with breakdown, estimates, and dependencies
|
||||
mode: plan
|
||||
model: ollama-cloud/deepseek-v4-pro-max
|
||||
model: ollama-cloud/deepseek-v4-pro
|
||||
color: "#3B82F6"
|
||||
permission:
|
||||
read: allow
|
||||
|
||||
@@ -455,7 +455,7 @@
|
||||
"planner": {
|
||||
"description": "Advanced task planner using Chain of Thought, Tree of Thoughts, and Plan-Execute-Reflect",
|
||||
"mode": "subagent",
|
||||
"model": "ollama-cloud/deepseek-v4-pro-max",
|
||||
"model": "ollama-cloud/deepseek-v4-pro",
|
||||
"color": "#F59E0B",
|
||||
"permission": {
|
||||
"read": "allow",
|
||||
@@ -471,7 +471,7 @@
|
||||
"reflector": {
|
||||
"description": "Self-reflection agent using Reflexion pattern - learns from mistakes",
|
||||
"mode": "subagent",
|
||||
"model": "ollama-cloud/deepseek-v4-pro-max",
|
||||
"model": "ollama-cloud/deepseek-v4-pro",
|
||||
"color": "#10B981",
|
||||
"permission": {
|
||||
"read": "allow",
|
||||
|
||||
Reference in New Issue
Block a user