@echo off
REM ---------------------------------------------------------------------------
REM Evolution Test Runner for Windows
REM Runs pipeline-judge tests with precise measurements
REM
REM Usage:  <this script> [workflow]
REM   workflow  Selects the compose service "evolution-<workflow>".
REM             Defaults to "feature". The special value "all" brings up
REM             every service in the compose file and then runs the
REM             "fitness-aggregator" service.
REM
REM Exit code:
REM   0  everything ran
REM   1  Docker missing, Docker daemon not running, image build failed,
REM      or a "docker-compose up" invocation returned a non-zero status
REM
REM All paths are relative to the current working directory.
REM ---------------------------------------------------------------------------

REM Delayed expansion is explicitly disabled: no !var! syntax is used below,
REM and with it enabled cmd.exe would strip the "!" from "echo Done!".
setlocal disabledelayedexpansion

REM Not named COMPOSE_FILE on purpose: docker-compose itself reads that
REM environment variable, and child processes inherit this environment.
set "COMPOSE_YML=docker/evolution-test/docker-compose.yml"

REM Becomes 1 as soon as any "docker-compose up" reports a failure.
set "RUN_STATUS=0"

echo === Evolution Test Runner ===
echo.

REM Check Docker
where docker >nul 2>&1
if %errorlevel% neq 0 (
    echo Error: Docker not found
    echo Please install Docker Desktop first:
    echo  winget install Docker.DockerDesktop
    echo.
    echo Or run tests locally ^(less precise^):
    echo  bun test --reporter=json --coverage
    exit /b 1
)

REM Check Docker daemon
docker info >nul 2>&1
if %errorlevel% neq 0 (
    echo Warning: Docker daemon not running
    echo Please start Docker Desktop and try again
    exit /b 1
)

REM Get workflow type. %~1 drops surrounding quotes so a quoted argument
REM cannot break the string comparisons below.
set "WORKFLOW=%~1"
if not defined WORKFLOW set "WORKFLOW=feature"

echo Running evolution test for: %WORKFLOW%
echo.

REM Build container. Stop here on failure rather than running tests against
REM an image that was not (re)built.
echo Building evolution test container...
docker-compose -f "%COMPOSE_YML%" build
if %errorlevel% neq 0 (
    echo Error: Failed to build evolution test container
    exit /b 1
)

REM Run test. "||" is used instead of %errorlevel% because %errorlevel% inside
REM a parenthesised block is expanded when the block is parsed, not when the
REM command finishes.
if "%WORKFLOW%"=="all" (
    echo Running ALL workflow tests in parallel...
    docker-compose -f "%COMPOSE_YML%" up || set "RUN_STATUS=1"
    docker-compose -f "%COMPOSE_YML%" up fitness-aggregator || set "RUN_STATUS=1"
) else (
    docker-compose -f "%COMPOSE_YML%" up evolution-%WORKFLOW% || set "RUN_STATUS=1"
)

REM Show results: print the last 4 entries of the fitness history, one line
REM per JSON record.
echo.
echo === Test Results ===
if exist .kilo\logs\fitness-history.jsonl (
    echo Latest fitness scores:
    powershell -Command "Get-Content .kilo\logs\fitness-history.jsonl -Tail 4 | ForEach-Object { $j = $_ | ConvertFrom-Json; Write-Host (' ' + $j.workflow + ': fitness=' + $j.fitness + ', time=' + $j.time_ms + 'ms, tokens=' + $j.tokens) }"
) else (
    echo No fitness history found
)

REM Cleanup always runs once the build succeeded, even when a test run
REM failed. Errors from "down" are intentionally silenced (best effort).
echo.
echo Cleaning up...
docker-compose -f "%COMPOSE_YML%" down -v 2>nul

if not "%RUN_STATUS%"=="0" echo Warning: docker-compose reported a failure while running tests
echo Done!
exit /b %RUN_STATUS%