{
  "$schema": "http://json-schema.org/draft-07/schema#",
  "$id": "https://app.kilo.ai/model-research.schema.json",
  "title": "APAW Model Research Output",
  "description": "Schema for automated model research and recommendation output",
  "type": "object",
  "required": ["version", "generated", "source", "models", "recommendations", "heatmap"],
  "properties": {
    "version": { "type": "string", "const": "1.0.0" },
    "generated": { "type": "string", "format": "date-time" },
    "source": {
      "type": "string",
      "description": "What triggered this research (e.g. /evolution, /research, manual)"
    },
    "trigger": {
      "type": "object",
      "properties": {
        "type": {
          "type": "string",
          "enum": ["evolution_cycle", "manual_research", "fitness_below_threshold", "scheduled"]
        },
        "issue": { "type": "integer" },
        "fitness_score": { "type": "number" },
        "reason": { "type": "string" }
      }
    },
    "models": {
      "type": "array",
      "items": {
        "type": "object",
        "required": ["id", "name", "organization", "if_score", "provider"],
        "properties": {
          "id": {
            "type": "string",
            "description": "Full model ID like ollama-cloud/qwen3-coder:480b"
          },
          "name": { "type": "string" },
          "organization": { "type": "string" },
          "parameters": { "type": "string" },
          "context_window": { "type": "string" },
          "swe_bench": { "type": ["number", "null"] },
          "swe_bench_pro": { "type": ["number", "null"] },
          "terminal_bench": { "type": ["number", "null"] },
          "live_codebench": { "type": ["number", "null"] },
          "gpqa": { "type": ["number", "null"] },
          "hle": { "type": ["number", "null"] },
          "browse_comp": { "type": ["number", "null"] },
          "if_score": {
            "type": "number",
            "minimum": 0,
            "maximum": 100,
            "description": "Instruction Following composite score (IFEval + IFBench)"
          },
          "categories": { "type": "array", "items": { "type": "string" } },
          "tags": { "type": "array", "items": { "type": "string" } },
          "provider": {
            "type": "string",
            "enum": ["ollama", "ollama-cloud", "openrouter", "groq", "hybrid"]
          },
          "free": { "type": "boolean" },
          "cost_per_1m_input": { "type": ["number", "string", "null"] },
          "description": { "type": "string" },
          "availability": {
            "type": "object",
            "properties": {
              "rpm": { "type": ["integer", "null"] },
              "rpd": { "type": ["integer", "string", "null"] },
              "tpm": { "type": ["integer", "string", "null"] },
              "tpd": { "type": ["integer", "string", "null"] }
            }
          },
          "speed_tps": { "type": ["number", "string", "null"] }
        }
      }
    },
    "recommendations": {
      "type": "array",
      "items": {
        "type": "object",
        "required": ["agent", "action", "current_model", "recommended_model", "impact", "rationale"],
        "properties": {
          "agent": { "type": "string" },
          "action": {
            "type": "string",
            "enum": ["update_model", "confirm_model", "add_fallback", "redesign_agent"]
          },
          "current_model": { "type": "string" },
          "current_provider": { "type": "string" },
          "recommended_model": { "type": "string" },
          "recommended_provider": { "type": "string" },
          "fallback_model": { "type": "string" },
          "fallback_strategy": { "type": "string" },
          "impact": {
            "type": "string",
            "enum": ["critical", "high", "medium", "low"]
          },
          "expected_improvement": {
            "type": "object",
            "properties": {
              "quality": { "type": "string" },
              "speed": { "type": "string" },
              "context_window": { "type": "string" }
            }
          },
          "score_before": { "type": "number" },
          "score_after": { "type": "number" },
          "score_delta": { "type": "number" },
          "rationale": { "type": "string" },
          "applied": { "type": "boolean", "default": false },
          "applied_date": { "type": ["string", "null"], "format": "date-time" }
        }
      }
    },
    "heatmap": {
      "type": "object",
      "description": "Agent × Model compatibility matrix with IF adjustment",
      "required": ["models", "agents"],
      "properties": {
        "models": {
          "type": "array",
          "items": {
            "type": "object",
            "required": ["id", "if_score"],
            "properties": {
              "id": { "type": "string" },
              "display_name": { "type": "string" },
              "provider": { "type": "string" },
              "if_score": {
                "type": "number",
                "minimum": 0,
                "maximum": 100,
                "description": "Instruction Following score used for the IF adjustment (0-100)"
              }
            }
          }
        },
        "agents": {
          "type": "array",
          "items": {
            "type": "object",
            "required": ["agent", "reasoning_effort", "scores"],
            "properties": {
              "agent": { "type": "string" },
              "current_model": { "type": "string" },
              "reasoning_effort": { "type": "string", "enum": ["L", "M", "H"] },
              "scores": {
                "type": "object",
                "additionalProperties": {
                  "type": "number",
                  "minimum": 0,
                  "maximum": 100
                },
                "description": "Model ID → compatibility score (0-100, IF-adjusted)"
              }
            }
          }
        },
        "if_adjustment_formula": {
          "type": "string",
          "default": "score * (0.7 + 0.3 * IF/100)"
        }
      }
    },
    "closed_source_comparison": {
      "type": "object",
      "description": "APAW pipeline models vs top closed-source models",
      "properties": {
        "benchmarks": { "type": "array" },
        "models": { "type": "array" },
        "apaw_best_per_benchmark": { "type": "object" },
        "closed_best_per_benchmark": { "type": "object" }
      }
    },
    "capability_index_patch": {
      "type": "array",
      "description": "Ready-to-apply patches to capability-index.yaml",
      "items": {
        "type": "object",
        "required": ["agent", "set"],
        "properties": {
          "agent": { "type": "string" },
          "set": { "type": "object", "additionalProperties": true }
        }
      }
    },
    "summary": {
      "type": "object",
      "properties": {
        "avg_quality_improvement": { "type": "string" },
        "providers_used": { "type": "array", "items": { "type": "string" } },
        "key_models": { "type": "array", "items": { "type": "string" } },
        "total_recommendations": { "type": "integer" },
        "applied_count": { "type": "integer" },
        "pending_count": { "type": "integer" }
      }
    }
  }
}