// Kova/src/selfcheck.mjs

import { chmod, mkdir, mkdtemp, readFile, rm, stat, utimes, writeFile } from "node:fs/promises";
import { tmpdir } from "node:os";
import { join } from "node:path";
import { quoteShell, runCommand } from "./commands.mjs";
import { runCleanupCommand } from "./cleanup.mjs";
import { summarizeCpuProfiles } from "./collectors/node-profiles.mjs";
import { summarizeHeapProfiles } from "./collectors/heap.mjs";
import { evaluateRecord } from "./evaluator.mjs";
import { evaluateGate } from "./matrix/gate.mjs";
import {
  comparePerformanceToBaseline,
  loadBaselineStore,
  reviewBaselineUpdate,
  saveBaselineStore,
  updateBaselineStore
} from "./performance/baselines.mjs";
import { buildPerformanceSummary } from "./performance/stats.mjs";
import { loadProcessRoles } from "./registries/process-roles.mjs";
import { validateProfileShape } from "./registries/profiles.mjs";
import { validateScenarioShape } from "./registries/scenarios.mjs";
import { validateStateShape } from "./registries/states.mjs";
import { validateRegistryReferences } from "./registries/validate.mjs";
import { assertSafeScenarioCommand } from "./safety.mjs";
import { parseTimelineText } from "./collectors/timeline.mjs";
import {
  summarizeEmbeddedRunTraces,
  summarizeLivenessWarnings,
  summarizeRuntimeDepsLogs
} from "./collectors/logs.mjs";
import {
  buildAgentTurnBreakdown,
  summarizeAgentTurnBreakdownForMarkdown
} from "./collectors/agent-turns.mjs";
import { buildAgentCliPreProviderAttribution } from "./collectors/agent-cli-attribution.mjs";
import {
  attributedSpanIntervals,
  buildGatewaySessionPreProviderAttribution
} from "./collectors/gateway-session-turn-attribution.mjs";
import {
  computeProviderTurnAttribution,
  parseProviderRequestLog,
  parseTimelineProviderRequestLog
} from "./collectors/provider.mjs";
import { captureProcessSnapshot, classifyRegistryRolesForProcess, classifySnapshotRolesForProcess, diffProcessSnapshots, summarizeResourceSamples } from "./collectors/resources.mjs";
import { renderMarkdownReport, renderPasteSummary, renderReportSummary } from "./reporting/report.mjs";
import { compareReports, renderCompareSummary } from "./reporting/compare.mjs";
import {
  ocmAt,
  ocmEnvDestroy,
  ocmEnvExec,
  ocmEnvExecShell,
  ocmLogs,
  ocmRuntimeBuildLocal,
  ocmRuntimeRemoveJson,
  ocmServiceStatusJson,
  ocmTargetSelector
} from "./ocm/commands.mjs";
import {
  checkAggregateThreshold,
  checkDuration,
  checkEvidenceThreshold,
  checkRoleThresholds,
  checkTurnThreshold
} from "./evaluation/violations.mjs";

/**
 * Runs the Kova self-check suite and reports the outcome.
 *
 * Creates a temporary directory, runs each check in sequence while collecting
 * the returned check objects into a list, and always removes the temporary
 * directory afterwards. The result is printed either as a pretty-printed JSON
 * document (schema `kova.selfcheck.v1`) or as one `STATUS id: message` line
 * per check.
 *
 * The order of the `checks.push(...)` calls is the order of the reported
 * checks, so statements here should not be reordered casually.
 *
 * NOTE(review): `commandCheck`, `jsonCommandCheck`, `failingCommandCheck`, the
 * `assert*` helpers and the individual `*Check` functions are defined outside
 * this function; the comments below describe only what is visible at the call
 * sites.
 *
 * @param {object} [flags] - Options object; only `flags.json` is read here.
 * @param {boolean} [flags.json] - When truthy, print the result as JSON instead of text lines.
 * @returns {Promise<void>}
 * @throws {Error} "self-check failed" when at least one check's status is not "PASS".
 */
export async function runSelfCheck(flags = {}) {
  const checks = [];
  // Scratch directory shared by the checks below (report dirs, fake homes, ...).
  const tmp = await mkdtemp(join(tmpdir(), "kova-self-check-"));

  try {
    // `node --check` the CLI entry point and every .mjs file found under src.
    checks.push(await commandCheck(
      "syntax",
      "for f in bin/kova.mjs $(find src -name '*.mjs' -type f | sort); do node --check \"$f\" || exit 1; done"
    ));
    // CLI version / setup JSON contracts.
    checks.push(await jsonCommandCheck("version-json", "node bin/kova.mjs version --json", (data) => {
      assertEqual(data.schemaVersion, "kova.version.v1", "version schema");
      assertString(data.version, "version");
    }));
    checks.push(await jsonCommandCheck("setup-json", "node bin/kova.mjs setup --ci --json", (data) => {
      assertEqual(data.schemaVersion, "kova.setup.v1", "setup schema");
      assertEqual(data.ok, true, "setup ok");
      assertEqual(data.auth?.method, "mock", "setup auth default");
      assertArrayNotEmpty(data.checks, "setup checks");
    }));
    // NOTE(review): failingCommandCheck presumably expects the command to fail
    // with output containing the given message — confirm in its definition.
    checks.push(await failingCommandCheck(
      "setup-non-tty-requires-mode",
      "node bin/kova.mjs setup --json",
      "kova setup requires --non-interactive or --ci when stdin is not a TTY"
    ));
    // Auth / credential setup checks; each helper receives the scratch dir.
    checks.push(await credentialStoreSelfCheck(tmp));
    checks.push(await failingCommandCheck(
      "live-auth-requires-credentials",
      `KOVA_HOME=${quoteShell(join(tmp, "empty-auth-home"))} node bin/kova.mjs run --target runtime:stable --scenario fresh-install --auth live --json`,
      "--auth live requires configured live credentials"
    ));
    checks.push(await interactiveSetupChoiceCheck(tmp));
    checks.push(await externalCliSetupCheck(tmp));
    checks.push(await externalCliOpenClawConfigCheck(tmp));
    checks.push(await anthropicApiKeyOpenClawConfigCheck(tmp));
    checks.push(await mockAuthOpenClawConfigCheck(tmp));
    checks.push(await claudeCliOpenClawConfigCheck(tmp));
    checks.push(await liveApiKeyExecutionCheck(tmp));
    checks.push(await liveExternalCliDryRunCheck(tmp));
    checks.push(await liveAnthropicExternalCliDryRunCheck(tmp));
    checks.push(await liveExternalCliFallbackCheck(tmp));
    checks.push(await failingCommandCheck(
      "setup-custom-provider-rejects-external-cli",
      `KOVA_HOME=${quoteShell(join(tmp, "custom-external-cli-home"))} node bin/kova.mjs setup --non-interactive --provider custom-openai --auth external-cli --json`,
      "external-cli auth is only supported for provider openai or anthropic"
    ));
    // HOME and KOVA_HOME both point into the scratch dir for this command.
    checks.push(await failingCommandCheck(
      "setup-external-cli-verifies-auth",
      `HOME=${quoteShell(join(tmp, "no-codex-auth"))} KOVA_HOME=${quoteShell(join(tmp, "missing-external-cli-auth-home"))} node bin/kova.mjs setup --non-interactive --provider openai --auth external-cli --json`,
      "external-cli codex is not usable"
    ));
    checks.push(await externalCliRunAuthVerificationCheck(tmp));
    checks.push(await commandTimeoutContractCheck());
    checks.push(ocmCommandBuildersCheck());
    checks.push(evaluationViolationHelpersCheck());
    checks.push(localBuildTargetSetupResourceExclusionCheck());
    // Plan output: registries must be non-empty, the release profile must carry
    // coverage and calibration data, and the official-plugin surface/state/scenario
    // must be present.
    checks.push(await jsonCommandCheck("plan-json", "node bin/kova.mjs plan --json", (data) => {
      assertEqual(data.schemaVersion, "kova.plan.v1", "plan schema");
      assertArrayNotEmpty(data.surfaces, "plan surfaces");
      assertArrayNotEmpty(data.processRoles, "plan process roles");
      assertArrayNotEmpty(data.metrics, "plan metrics");
      assertArrayNotEmpty(data.scenarios, "plan scenarios");
      assertArrayNotEmpty(data.states, "plan states");
      assertArrayNotEmpty(data.profiles, "profiles");
      assertEqual(data.coverage?.schemaVersion, "kova.coverage.v1", "coverage schema");
      assertArrayNotEmpty(data.coverage?.scenarioSurfaceMap, "scenario surface map");
      const releaseCoverage = data.coverage?.profiles?.find((profile) => profile.id === "release");
      const releaseProfile = data.profiles?.find((profile) => profile.id === "release");
      assertArrayNotEmpty(releaseCoverage?.required?.platforms, "release required platform coverage");
      assertArrayNotEmpty(releaseCoverage?.required?.requirements, "release required requirement coverage");
      assertArrayNotEmpty(releaseCoverage?.currentPlatformKeys, "current platform coverage keys");
      assertEqual(releaseProfile?.purpose, "release", "release profile purpose");
      assertEqual((releaseProfile?.calibration?.surfaceCount ?? 0) > 0, true, "release profile calibrated surfaces");
      assertEqual((releaseProfile?.calibration?.roleCount ?? 0) > 0, true, "release profile calibrated roles");
      const officialSurface = data.surfaces.find((surface) => surface.id === "official-plugin-install");
      assertEqual(Boolean(officialSurface), true, "official plugin surface present");
      assertArrayNotEmpty(officialSurface?.purposes, "official plugin surface purposes");
      assertArrayNotEmpty(officialSurface?.requirements, "official plugin surface requirements");
      assertEqual(data.states.some((state) => state.id === "official-plugins"), true, "official plugins state present");
      assertEqual(data.scenarios.some((scenario) => scenario.id === "official-plugin-install" && scenario.surface === "official-plugin-install"), true, "official plugin scenario present");
      // Every scenario needs a non-empty string surface and a non-empty `proves` array.
      if (data.scenarios.some((scenario) => typeof scenario.surface !== "string" || scenario.surface.length === 0)) {
        throw new Error("every scenario must expose a surface");
      }
      if (data.scenarios.some((scenario) => !Array.isArray(scenario.proves) || scenario.proves.length === 0)) {
        throw new Error("every scenario must declare the surface requirement ids it proves");
      }
    }));
    checks.push(await inventoryPlanCheck(tmp));
    // Matrix plan checks: filters, controls, and target validation.
    checks.push(await jsonCommandCheck("matrix-plan-json", "node bin/kova.mjs matrix plan --profile smoke --target runtime:stable --include scenario:fresh-install --parallel 2 --json", (data) => {
      assertEqual(data.schemaVersion, "kova.matrix.plan.v1", "matrix plan schema");
      assertEqual(data.profile?.id, "smoke", "matrix profile id");
      assertArrayNotEmpty(data.entries, "matrix entries");
      assertEqual(data.resolvedCoverage?.schemaVersion, "kova.resolvedCoverage.v1", "resolved coverage schema");
      assertEqual(data.resolvedCoverage?.statuses?.planned, 1, "resolved planned obligation count");
      assertEqual(data.resolvedCoverage?.warnings?.length, 0, "resolved coverage migration warnings");
      assertEqual(data.resolvedCoverage?.obligations?.[0]?.surface, "fresh-install", "resolved obligation surface");
      assertEqual(data.resolvedCoverage?.obligations?.[0]?.requirement, "baseline", "resolved obligation requirement");
      assertEqual(data.entries.length, 1, "matrix include filter count");
      assertEqual(data.controls?.requestedParallel, 2, "matrix requested parallel");
    }));
    checks.push(await jsonCommandCheck("matrix-plan-repeat-json", "node bin/kova.mjs matrix plan --profile smoke --target runtime:stable --include scenario:fresh-install --repeat 3 --json", (data) => {
      assertEqual(data.controls?.repeat, 3, "matrix repeat control");
    }));
    checks.push(await jsonCommandCheck("channel-upgrade-plan-json", "node bin/kova.mjs matrix plan --profile channel-upgrade --target channel:beta --json", (data) => {
      assertEqual(data.profile?.id, "channel-upgrade", "channel upgrade profile id");
      assertEqual(data.target, "channel:beta", "channel upgrade target");
      assertEqual(data.entries?.[0]?.scenario?.id, "upgrade-stable-channel-to-beta", "channel upgrade scenario");
    }));
    checks.push(await failingCommandCheck(
      "channel-upgrade-rejects-wrong-target-value",
      "node bin/kova.mjs matrix plan --profile channel-upgrade --target channel:stable --json",
      "upgrade-stable-channel-to-beta supports target value beta, got stable"
    ));
    checks.push(await jsonCommandCheck("local-build-upgrade-plan-json", "node bin/kova.mjs matrix plan --profile local-build-upgrade --target local-build:/tmp/openclaw --include scenario:upgrade-stable-channel-to-local-build --json", (data) => {
      assertEqual(data.profile?.id, "local-build-upgrade", "local-build upgrade profile id");
      assertEqual(data.entries?.[0]?.scenario?.id, "upgrade-stable-channel-to-local-build", "local-build stable upgrade scenario");
    }));
    // `run` checks without --execute: the receipt's `jsonPath` is read back from
    // disk and the first record's phases/commands are inspected.
    checks.push(await jsonCommandCheck("channel-upgrade-dry-run-json", `node bin/kova.mjs run --target channel:beta --scenario upgrade-stable-channel-to-beta --state stable-channel-user --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      const commands = (record?.phases ?? []).flatMap((phase) => phase.commands ?? []);
      assertEqual(commands.some((command) => command.includes("ocm start") && command.includes("--channel stable")), true, "stable start command present");
      // The regex accepts the channel value with or without single quotes.
      assertEqual(commands.some((command) => command.includes("ocm upgrade") && /--channel '?beta'?/.test(command)), true, "beta upgrade command present");
    }));
    checks.push(await jsonCommandCheck("durable-clone-local-build-dry-run-json", `node bin/kova.mjs run --target local-build:/tmp/openclaw --scenario upgrade-durable-clone-to-local-build --state plugin-index --source-env 'Team Env' --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      const commands = (record?.phases ?? []).flatMap((phase) => phase.commands ?? []);
      assertEqual(commands.some((command) => command.includes("ocm env clone 'Team Env'")), true, "quoted source env clone command present");
      assertEqual(commands.some((command) => command.includes("ocm upgrade") && /--runtime '?kova-local-/.test(command)), true, "local-build runtime upgrade command present");
    }));
    // Auth mode resolution: default mock, state-driven "missing", and live via --source-env.
    checks.push(await jsonCommandCheck("run-auth-default-mock-json", `node bin/kova.mjs run --target runtime:stable --scenario fresh-install --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      assertEqual(record?.auth?.mode, "mock", "default auth mode");
      const phaseIds = record?.phases?.map((phase) => phase.id) ?? [];
      if (!phaseIds.includes("auth-prepare") || !phaseIds.includes("auth-setup") || !phaseIds.includes("auth-cleanup")) {
        throw new Error(`default mock auth phases missing: ${phaseIds.join(", ")}`);
      }
    }));
    checks.push(await jsonCommandCheck("run-auth-missing-override-json", `node bin/kova.mjs run --target runtime:stable --scenario provider-models --state model-auth-missing --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      assertEqual(record?.auth?.mode, "missing", "missing auth override mode");
      const phaseIds = record?.phases?.map((phase) => phase.id) ?? [];
      if (phaseIds.includes("auth-prepare") || phaseIds.includes("auth-setup")) {
        throw new Error(`missing auth override should not inject auth phases: ${phaseIds.join(", ")}`);
      }
    }));
    checks.push(await jsonCommandCheck("run-auth-live-source-env-json", `node bin/kova.mjs run --auth live --target runtime:stable --scenario gateway-session-send-turn-existing-user --source-env 'Team Env' --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      assertEqual(record?.auth?.mode, "live", "source-env live auth mode");
      assertEqual(record?.auth?.source, "source-env", "source-env live auth source");
      assertEqual(record?.auth?.setup, false, "source-env live auth does not patch config");
      const phaseIds = record?.phases?.map((phase) => phase.id) ?? [];
      if (phaseIds.includes("auth-setup") || phaseIds.includes("auth-prepare")) {
        throw new Error(`source-env live auth should not inject auth phases: ${phaseIds.join(", ")}`);
      }
      const commands = record?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
      assertEqual(commands.some((command) => command.includes("ocm env clone 'Team Env'")), true, "source env clone command present");
      assertEqual(commands.some((command) => command.includes("run-gateway-session-send-turn.mjs")), true, "gateway session helper command present");
    }));
    // One check per message-ingress scenario. Each tuple is
    // [scenario id, expected record surface, substring expected in some phase command].
    for (const item of [
      ["agent-gateway-rpc-turn", "agent-gateway-rpc-turn", "ocm @"],
      ["gateway-session-send-turn", "gateway-session-send-turn", "run-gateway-session-send-turn.mjs"],
      ["tui-message-turn", "tui-message-turn", "run-tui-message-turn.mjs"],
      ["openai-compatible-turn", "openai-compatible-turn", "run-openai-compatible-turn.mjs"]
    ]) {
      const [scenarioId, surfaceId, expectedCommand] = item;
      checks.push(await jsonCommandCheck(`message-ingress-${scenarioId}-dry-run-json`, `node bin/kova.mjs run --target runtime:stable --scenario ${scenarioId} --state mock-openai-provider --report-dir ${quoteShell(tmp)} --json`, async (data) => {
        const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
        const record = report.records?.[0];
        assertEqual(record?.surface, surfaceId, `${scenarioId} surface`);
        assertEqual(record?.auth?.mode, "mock", `${scenarioId} mock auth mode`);
        const commands = record?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
        assertEqual(commands.some((command) => command.includes(expectedCommand)), true, `${scenarioId} ingress command`);
      }));
    }
    checks.push(await jsonCommandCheck("run-profiling-dry-run-json", `node bin/kova.mjs run --target runtime:stable --scenario fresh-install --node-profile --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      assertEqual(report.records?.[0]?.profiling?.enabled, true, "profiling marker");
      assertEqual(report.performance?.profiledRunCount, 1, "profiled run count");
    }));
    // Surface-specific checks: expected surface id, helper command arguments,
    // and thresholds recorded on the first report record.
    checks.push(await jsonCommandCheck("workspace-scan-dry-run-json", `node bin/kova.mjs run --target runtime:stable --scenario workspace-scan-pressure --state large-workspace --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      assertEqual(record?.surface, "workspace-scan", "workspace scan surface");
      const phaseIds = record?.phases?.map((phase) => phase.id) ?? [];
      if (!phaseIds.includes("state-start")) {
        throw new Error(`large workspace state setup after start missing: ${phaseIds.join(", ")}`);
      }
      const commands = record?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
      assertEqual(commands.some((command) => command.includes("kova-large")), true, "large workspace fixture command");
      assertEqual(commands.some((command) => command.includes("ocm service restart")), true, "workspace restart command");
      assertEqual(commands.some((command) => command.includes("run-soak-loop.mjs") && command.includes("--duration-ms 15000")), true, "workspace repeated command loop");
    }));
    checks.push(await jsonCommandCheck("mcp-runtime-dry-run-json", `node bin/kova.mjs run --target runtime:stable --scenario mcp-runtime-start-stop --state fresh --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      assertEqual(record?.surface, "mcp-runtime", "MCP runtime surface");
      const commands = record?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
      // Falls back to "" so the includes() assertions below fail cleanly when the command is absent.
      const bridgeCommand = commands.find((command) => command.includes("mcp-bridge-smoke.mjs")) ?? "";
      assertEqual(bridgeCommand.includes("--artifact-dir '"), true, "MCP bridge helper receives quoted artifact dir");
      assertEqual(commands.some((command) => command.includes("ocm start") && command.includes("--json")), true, "MCP gateway start command");
      assertEqual(record?.thresholds?.mcpProcessLeaks, 0, "MCP process leak threshold");
    }));
    // The inline script exits 1 if the MCP role lists the bare pattern 'mcp' as a
    // command or process pattern, or has a process pattern containing 'modelcontextprotocol'.
    checks.push(await commandCheck(
      "mcp-runtime-role-patterns",
      "node -e \"const role=require('./process-roles/mcp-runtime.json'); if (role.commandPatterns.includes('mcp') || role.processPatterns.includes('mcp') || role.processPatterns.some((p)=>p.includes('modelcontextprotocol'))) process.exit(1);\""
    ));
    checks.push(await jsonCommandCheck("browser-automation-dry-run-json", `node bin/kova.mjs run --target runtime:stable --scenario browser-automation-smoke --state fresh --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      assertEqual(record?.surface, "browser-automation", "browser automation surface");
      const commands = record?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
      const browserCommand = commands.find((command) => command.includes("browser-automation-smoke.mjs")) ?? "";
      assertEqual(browserCommand.includes("--artifact-dir '"), true, "browser helper receives quoted artifact dir");
      assertEqual(record?.thresholds?.browserProcessLeaks, 0, "browser process leak threshold");
    }));
    checks.push(await jsonCommandCheck("media-understanding-dry-run-json", `node bin/kova.mjs run --target runtime:stable --scenario media-understanding-timeout --state fresh --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      assertEqual(record?.surface, "media-understanding", "media understanding surface");
      const commands = record?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
      const mediaCommand = commands.find((command) => command.includes("media-understanding-timeout.mjs")) ?? "";
      assertEqual(mediaCommand.includes("--artifact-dir '"), true, "media helper receives quoted artifact dir");
      assertEqual(mediaCommand.includes("--timeout-ms 1200"), true, "media helper receives provider timeout");
      assertEqual(mediaCommand.includes("--max-command-ms 45000"), true, "media helper allows cold CLI evidence before outer timeout");
      assertEqual(record?.auth?.mockProvider?.mode, "timeout", "media scenario mock timeout mode");
      assertEqual(record?.thresholds?.mediaTimeoutObserved, 1, "media timeout threshold");
      assertEqual(record?.thresholds?.providerRequestCountMin, 1, "media provider request threshold");
    }));
    checks.push(await jsonCommandCheck("network-offline-dry-run-json", `node bin/kova.mjs run --target runtime:stable --scenario agent-network-offline --state fresh --report-dir ${quoteShell(tmp)} --json`, async (data) => {
      const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
      const record = report.records?.[0];
      assertEqual(record?.surface, "network-offline", "network offline surface");
      assertEqual(record?.auth?.mode, "none", "network offline opts out of default mock auth");
      const phaseIds = record?.phases?.map((phase) => phase.id) ?? [];
      if (phaseIds.includes("auth-prepare") || phaseIds.includes("auth-setup")) {
        throw new Error(`network offline must not start mock auth phases: ${phaseIds.join(", ")}`);
      }
      const commands = record?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
      const networkCommand = commands.find((command) => command.includes("agent-network-offline.mjs")) ?? "";
      assertEqual(networkCommand.includes("--artifact-dir '"), true, "network helper receives quoted artifact dir");
      assertEqual(networkCommand.includes("--max-command-ms 45000"), true, "network helper allows cold CLI evidence before outer timeout");
      assertEqual(record?.thresholds?.networkFailureObserved, 1, "network failure threshold");
    }));
    checks.push(await jsonCommandCheck("diagnostic-profile-plan-json", "node bin/kova.mjs matrix plan --profile diagnostic --target local-build:/tmp/openclaw --include scenario:release-runtime-startup --json", (data) => {
      assertEqual(data.schemaVersion, "kova.matrix.plan.v1", "diagnostic matrix plan schema");
      assertEqual(data.profile?.id, "diagnostic", "diagnostic profile id");
      assertEqual(data.profile?.diagnostics?.timelineRequired, true, "diagnostic timeline required");
      assertArrayNotEmpty(data.entries, "diagnostic entries");
    }));
    // Flag / argument validation: each command is paired with the message it is expected to report.
    checks.push(await failingCommandCheck(
      "diagnostic-profile-rejects-non-local-build",
      "node bin/kova.mjs matrix plan --profile diagnostic --target runtime:stable --json",
      "profile 'diagnostic' requires target kind local-build"
    ));
    checks.push(await failingCommandCheck(
      "invalid-parallel-rejected",
      "node bin/kova.mjs matrix plan --profile smoke --target runtime:stable --parallel nope --json",
      "--parallel must be a positive integer"
    ));
    checks.push(await failingCommandCheck(
      "invalid-timeout-rejected",
      "node bin/kova.mjs run --target runtime:stable --scenario fresh-install --timeout-ms 0 --json",
      "--timeout-ms must be a positive integer"
    ));
    checks.push(await failingCommandCheck(
      "baseline-requires-execute",
      "node bin/kova.mjs run --target runtime:stable --scenario fresh-install --baseline --json",
      "--baseline and --save-baseline require --execute"
    ));
    checks.push(await failingCommandCheck(
      "save-baseline-requires-reviewed-good",
      "node bin/kova.mjs run --target runtime:stable --scenario fresh-install --execute --save-baseline --json",
      "--save-baseline requires --reviewed-good"
    ));
    checks.push(await failingCommandCheck(
      "exhaustive-execute-requires-explicit-flag",
      "node bin/kova.mjs matrix run --profile exhaustive --target runtime:stable --execute --json",
      "executing profile 'exhaustive' requires --allow-exhaustive"
    ));
    checks.push(await jsonCommandCheck("cleanup-json", "node bin/kova.mjs cleanup envs --json", (data) => {
      assertEqual(data.schemaVersion, "kova.cleanup.envs.v1", "cleanup schema");
      assertEqual(data.execute, false, "cleanup execute flag");
      assertArray(data.envs, "cleanup envs");
    }));
    // Checks implemented by helper functions defined outside this function.
    // Awaited helpers are async; the others return their check object synchronously.
    checks.push(await cleanupArtifactsCheck(tmp));
    checks.push(await diagnosticsTimelineCheck());
    checks.push(await diagnosticsOpenSpanCheck());
    checks.push(diagnosticsTimelineEvaluationCheck());
    checks.push(runtimeDepsLogParserCheck());
    checks.push(embeddedRunLogParserCheck());
    checks.push(runtimeDepsWarmReuseEvaluationCheck());
    checks.push(await performanceBaselineCheck(tmp));
    checks.push(markdownFailureCardsCheck());
    checks.push(reportRecommendedNextScenarioCheck());
    checks.push(readinessClassificationCheck());
    checks.push(healthReadinessModelCheck());
    checks.push(agentContainmentHealthScopeCheck());
    checks.push(await resourceRoleAttributionCheck(tmp));
    checks.push(await resourceRootCommandRoleBoundaryCheck());
    checks.push(await resourceRolePollutionCheck());
    checks.push(await gatewaySessionSurfaceContractCheck());
    checks.push(await processSnapshotCheck(tmp));
    checks.push(roleThresholdEvaluationCheck());
    checks.push(thresholdPolicyCalibrationCheck());
    checks.push(await cleanupRetryCheck(tmp));
    checks.push(stateRegistryValidationCheck());
    checks.push(scenarioCloneFirstValidationCheck());
    checks.push(scenarioHealthScopeValidationCheck());
    checks.push(scenarioStateCompatibilityCheck());
    checks.push(await cpuProfileParserCheck());
    checks.push(await heapProfileParserCheck());
    checks.push(await providerEvidenceParserCheck());
    checks.push(agentTurnBreakdownCheck());
    checks.push(gatewaySessionTurnEvaluationCheck());
    checks.push(gatewaySessionPreProviderAttributionCheck());
    checks.push(agentCliPreProviderAttributionCheck());
    checks.push(await mockProviderBehaviorCheck(tmp));
    checks.push(providerFailureEvaluationCheck());
    checks.push(agentColdWarmEvaluationCheck());
    checks.push(sourceReleaseCompareCheck());
    checks.push(await concurrentAgentRunnerCheck(tmp));
    checks.push(providerConcurrentEvaluationCheck());
    checks.push(agentAuthFailureEvaluationCheck());
    checks.push(await soakLoopRunnerCheck(tmp));
    checks.push(soakTrendEvaluationCheck());
    checks.push(mcpBridgeEvidenceEvaluationCheck());
    checks.push(browserAutomationEvidenceEvaluationCheck());
    checks.push(mediaUnderstandingEvidenceEvaluationCheck());
    checks.push(networkOfflineEvidenceEvaluationCheck());
    checks.push(await officialPluginInstallRunnerCheck(tmp));
    // The state's lifecycle command (rm -f of plugins/installs.json) must appear in the report.
    checks.push(await jsonCommandCheck(
      "dry-run-state-lifecycle-json",
      `node bin/kova.mjs run --target runtime:stable --scenario fresh-install --state missing-plugin-index --report-dir ${quoteShell(tmp)} --json`,
      async (data) => {
        assertEqual(data.schemaVersion, "kova.run.receipt.v1", "state dry-run receipt schema");
        const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
        const commands = report.records?.[0]?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
        if (!commands.some((command) => command.includes("rm -f") && command.includes("plugins/installs.json"))) {
          throw new Error("state lifecycle command missing from dry-run report");
        }
      }
    ));
    checks.push(await jsonCommandCheck(
      "official-plugin-install-dry-run-json",
      `node bin/kova.mjs run --target runtime:stable --scenario official-plugin-install --state official-plugins --report-dir ${quoteShell(tmp)} --json`,
      async (data) => {
        const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
        const commands = report.records?.[0]?.phases?.flatMap((phase) => phase.commands ?? []) ?? [];
        assertEqual(commands.some((command) => command.includes("run-official-plugin-install.mjs") && command.includes("states/official-plugins.json")), true, "official plugin state-backed command present");
      }
    ));
    // A source env name containing a space must appear single-quoted in the clone command.
    checks.push(await jsonCommandCheck(
      "dry-run-source-env-quoting-json",
      `node bin/kova.mjs run --target runtime:stable --scenario upgrade-existing-user --source-env 'Team Env' --report-dir ${quoteShell(tmp)} --json`,
      async (data) => {
        const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
        const command = report.records?.[0]?.phases
          ?.flatMap((phase) => phase.commands ?? [])
          ?.find((item) => item.includes("ocm env clone")) ?? "";
        if (!command.includes("ocm env clone 'Team Env'")) {
          throw new Error(`source env was not shell-quoted: ${command}`);
        }
      }
    ));
    checks.push(await localBuildRuntimeCleanupCheck(tmp));
    checks.push(await localBuildRuntimeAlreadyAbsentCleanupCheck(tmp));

    // Kept in a variable: its `status` and `data.jsonPath` drive the report
    // validation, compare, and bundle checks further down.
    const receiptCheck = await jsonCommandCheck(
      "dry-run-report-json",
      `node bin/kova.mjs run --target runtime:stable --scenario fresh-install --repeat 2 --report-dir ${quoteShell(tmp)} --json`,
      (data) => {
        assertEqual(data.schemaVersion, "kova.run.receipt.v1", "run receipt schema");
        assertEqual(data.mode, "dry-run", "run mode");
        assertEqual(data.summary?.statuses?.["DRY-RUN"], 2, "dry-run repeat count");
        assertEqual(data.performance?.repeat, 2, "run receipt repeat");
        assertString(data.jsonPath, "json report path");
      }
    );
    checks.push(receiptCheck);

    checks.push(await jsonCommandCheck(
      "matrix-dry-run-json",
      `node bin/kova.mjs matrix run --profile smoke --target runtime:stable --include tag:plugins --exclude state:stale-runtime-deps --parallel 2 --report-dir ${quoteShell(tmp)} --json`,
      (data) => {
        assertEqual(data.schemaVersion, "kova.matrix.run.receipt.v1", "matrix run receipt schema");
        assertEqual(data.mode, "dry-run", "matrix dry-run mode");
        assertString(data.jsonPath, "matrix json report path");
        assertString(data.bundlePath, "matrix bundle path");
        // The bundle must be written under the --report-dir passed above.
        if (!data.bundlePath.startsWith(tmp)) {
          throw new Error(`matrix bundle path should use report dir: ${data.bundlePath}`);
        }
        assertEqual(data.summary?.statuses?.["DRY-RUN"], 5, "filtered matrix dry-run count");
      }
    ));
    // Release gate and safety guard checks.
    checks.push(await gateDryRunCheck(tmp));
    checks.push(gatePartialFailureCheck());
    checks.push(gatePartialPassCheck());
    checks.push(gatePlatformCoverageCheck());
    checks.push(gateNonReleaseOutcomeCheck());
    checks.push(gateRequirementCoverageCheck());
    checks.push(gateSubsystemSummaryCheck());
    checks.push(safetyGuardCheck());
    checks.push(await failingCommandCheck(
      "gate-preflight-source-env",
      `node bin/kova.mjs matrix run --profile release --target runtime:stable --execute --gate --report-dir ${quoteShell(tmp)} --json`,
      "release gate preflight failed: --source-env <env> is required"
    ));

    // The report-level checks need the JSON report written by the receipt check,
    // so they are skipped entirely when that check did not pass.
    if (receiptCheck.status === "PASS") {
      const report = JSON.parse(await readFile(receiptCheck.data.jsonPath, "utf8"));
      checks.push(validateReport(report));
      // Comparing a report against itself must yield no regressions.
      checks.push(await jsonCommandCheck(
        "report-compare-json",
        `node bin/kova.mjs report compare ${quoteShell(receiptCheck.data.jsonPath)} ${quoteShell(receiptCheck.data.jsonPath)} --json`,
        (data) => {
          assertEqual(data.schemaVersion, "kova.compare.v1", "compare schema");
          assertEqual(data.ok, true, "compare ok");
          assertEqual(data.regressionCount, 0, "compare regression count");
        }
      ));
      checks.push(await jsonCommandCheck(
        "report-bundle-json",
        `node bin/kova.mjs report bundle ${quoteShell(receiptCheck.data.jsonPath)} --output-dir ${quoteShell(tmp)} --json`,
        (data) => {
          assertEqual(data.schemaVersion, "kova.artifact.bundle.v1", "bundle schema");
          assertString(data.outputPath, "bundle output path");
          assertString(data.checksumPath, "bundle checksum path");
          assertString(data.sha256, "bundle sha256");
          assertEqual(data.included?.artifactIndex, true, "bundle includes artifact index");
          assertEqual(data.artifactIndex?.path, "artifact-index.json", "artifact index path");
          assertEqual((data.artifactIndex?.fileCount ?? 0) > 0, true, "artifact index file count");
        }
      ));
    }
  } finally {
    // Always remove the scratch directory, including when a check threw.
    await rm(tmp, { recursive: true, force: true });
  }

  // The suite passes only if every collected check reports PASS.
  const ok = checks.every((check) => check.status === "PASS");
  const result = {
    schemaVersion: "kova.selfcheck.v1",
    generatedAt: new Date().toISOString(),
    ok,
    // Drop each check's `data` payload so it is not included in the reported result.
    checks: checks.map(({ data, ...check }) => check)
  };

  if (flags.json) {
    console.log(JSON.stringify(result, null, 2));
  } else {
    // Text mode: one line per check, with the message appended only when present.
    for (const check of result.checks) {
      console.log(`${check.status} ${check.id}${check.message ? `: ${check.message}` : ""}`);
    }
  }

  // Thrown after the results have been printed so the caller still sees the full listing.
  if (!ok) {
    throw new Error("self-check failed");
  }
}

/**
 * Self-check for the OCM command-string builders.
 *
 * Every case renders one command through a builder and compares it with the
 * exact expected text. The cases cover the target selectors for each target
 * kind and single-quote shell quoting of values containing spaces and
 * apostrophes.
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when every case matches, otherwise a FAIL row carrying the
 *   message of the first error thrown.
 */
function ocmCommandBuildersCheck() {
  const id = "ocm-command-builders";
  const command = "validate centralized OCM command builders";

  // Each builder call is wrapped in a thunk so it runs immediately before its
  // own comparison; a throwing builder therefore stops the run at that case.
  const cases = [
    [() => ocmTargetSelector({ kind: "npm", value: "2026.4.27" }), "--version '2026.4.27'", "npm selector"],
    [() => ocmTargetSelector({ kind: "channel", value: "beta" }), "--channel 'beta'", "channel selector"],
    [() => ocmTargetSelector({ kind: "runtime", value: "stable" }), "--runtime 'stable'", "runtime selector"],
    [
      () => ocmTargetSelector({ kind: "local-build", value: "/tmp/openclaw", runtimeName: "kova-local-test" }),
      "--runtime 'kova-local-test'",
      "local-build selector"
    ],
    [() => ocmServiceStatusJson("Team Env"), "ocm service status 'Team Env' --json", "quoted service status"],
    [() => ocmLogs("Team Env", { tail: 25, raw: true }), "ocm logs 'Team Env' --tail '25' --raw", "quoted logs"],
    [() => ocmEnvDestroy("Team Env"), "ocm env destroy 'Team Env' --yes", "quoted env destroy"],
    [() => ocmAt("Team Env", ["status"]), "ocm @'Team Env' -- 'status'", "quoted at command"],
    [
      () => ocmEnvExec("Team Env", ["node", "support/script.mjs", "--name", "O'Hara"]),
      "ocm env exec 'Team Env' -- 'node' 'support/script.mjs' '--name' 'O'\\''Hara'",
      "quoted env exec args"
    ],
    [
      () => ocmEnvExecShell("Team Env", "printf '%s\\n' ok"),
      "ocm env exec 'Team Env' -- 'sh' '-lc' 'printf '\\''%s\\n'\\'' ok'",
      "quoted env exec shell"
    ],
    [
      () => ocmRuntimeBuildLocal("kova-local-test", "/tmp/Open Claw"),
      "ocm runtime build-local 'kova-local-test' --repo '/tmp/Open Claw' --force",
      "quoted local runtime build"
    ],
    [() => ocmRuntimeRemoveJson("kova-local-test"), "ocm runtime remove 'kova-local-test' --json", "quoted runtime remove"]
  ];

  try {
    for (const [render, expected, label] of cases) {
      assertEqual(render(), expected, label);
    }
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check for the evaluation violation helpers.
 *
 * Feeds each helper one input that sits just above its threshold, all sharing
 * a single collector array, then checks the total number of collected
 * violations and that role-RSS and turn-level entries are present.
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function evaluationViolationHelpersCheck() {
  const id = "evaluation-violation-helpers";
  const command = "validate evaluation violation helper contract";

  try {
    const collected = [];
    const statusRuns = [{ command: "openclaw status", durationMs: 51 }];
    const measuredRoles = { gateway: { peakRssMb: 901, maxCpuPercent: 41 } };
    const roleLimits = { gateway: { peakRssMb: 900, maxCpuPercent: 40 } };
    const slowTurn = { phaseId: "turn", preProviderMs: 301 };

    checkDuration(collected, statusRuns, "statusMs", 50, (command) => command.includes("status"));
    checkEvidenceThreshold(collected, "media", "mediaDescribeMs", 101, 100, "Media describe");
    checkRoleThresholds(collected, measuredRoles, roleLimits);
    checkAggregateThreshold(collected, 201, "agentTurnP95Ms", 200);
    checkTurnThreshold(collected, slowTurn, "preProviderMs", 300, "pre-provider latency was 301ms");

    assertEqual(collected.length, 6, "violation helper count");

    const reportsRoleRss = collected.some((violation) => violation.metric === "resourceByRole.gateway.peakRssMb");
    assertEqual(reportsRoleRss, true, "role RSS violation");

    const reportsTurn = collected.some((violation) => violation.phaseId === "turn");
    assertEqual(reportsTurn, true, "turn threshold violation");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check: resource usage recorded in harness and cleanup phases must not
 * count against a local-build record's product measurements.
 *
 * Builds a synthetic record whose harness and cleanup phases carry very large
 * RSS/CPU samples while the product phase carries small gateway samples plus
 * a larger helper-process sample. It passes the record to `evaluateRecord`
 * with a 200 MB RSS threshold and "gateway" as the primary resource role,
 * then asserts on the status and measurements found on the record afterwards.
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function localBuildTargetSetupResourceExclusionCheck() {
  const id = "local-build-target-setup-resource-exclusion";
  const command = "evaluate local-build target setup resource exclusion";

  try {
    // One successful command result with synthetic resource samples attached.
    const ran = (commandLine, durationMs, peakRssMb, maxCpuPercent, role) => ({
      command: commandLine,
      status: 0,
      durationMs,
      resourceSamples: syntheticResourceSamples({ peakRssMb, maxCpuPercent, role })
    });
    const phase = (phaseId, measurementScope, results) => ({ id: phaseId, measurementScope, results });

    const phases = [
      phase("target-setup", "harness", [
        ran("ocm runtime build-local kova-local-test --repo /tmp/openclaw --force", 60000, 2500, 350, "build-tooling")
      ]),
      phase("auth-prepare", "harness", [
        ran("node support/mock-openai-server.mjs", 500, 1900, 320, "mock-provider")
      ]),
      phase("scenario-command", "product", [
        ran("ocm @kova-self-check -- status", 100, 100, 20, "gateway"),
        ran("node support/kova-helper.mjs", 100, 600, 30, "command-tree")
      ]),
      phase("auth-cleanup", "cleanup", [
        ran("kill $(cat mock/pid)", 50, 1800, 300, "mock-provider")
      ])
    ];
    const record = {
      scenario: "local-build-runtime-resources",
      status: "PASS",
      phases,
      finalMetrics: {
        service: { gatewayState: "disabled" },
        logs: zeroLogMetrics()
      }
    };
    const scenario = { thresholds: { peakRssMb: 200 } };
    const context = {
      surface: { thresholds: {}, resourcePrimaryRole: "gateway" },
      targetPlan: { kind: "local-build" }
    };

    // The assertions below read fields that evaluateRecord is expected to have
    // written onto the record (status, measurements, violations).
    evaluateRecord(record, scenario, context);

    assertEqual(record.status, "PASS", "local-build target setup resources ignored status");
    const measured = record.measurements;
    assertEqual(measured.peakRssMb, 100, "local-build target setup resources ignored RSS");
    assertEqual(measured.resourcePeakTrackedRssMb, 600, "tracked product helper RSS retained separately");
    assertEqual(measured.resourcePrimaryRole, "gateway", "primary resource role retained");
    const byRole = measured.resourceByRole;
    assertEqual(byRole.gateway.peakRssMb, 100, "scenario role RSS retained");
    assertEqual(byRole["build-tooling"], undefined, "target setup role excluded");
    assertEqual(byRole["mock-provider"], undefined, "harness auth resources excluded");
    const scopeSummary = measured.measurementScopeSummary;
    assertEqual(scopeSummary.harnessCommandCount, 2, "harness command count");
    assertEqual(scopeSummary.cleanupCommandCount, 1, "cleanup command count");
    assertEqual(record.violations, undefined, "no-service local-build record has no gateway violation");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Builds a one-sample resource summary in which a single role accounts for
 * all usage.
 *
 * @param {{ peakRssMb: number, maxCpuPercent: number, role: string }} usage
 *   Peak RSS, peak CPU percentage and the role name the usage is filed under.
 * @returns {object} Summary whose totals and command-tree peak equal the given
 *   values, whose gateway peak equals `peakRssMb` only when `role` is
 *   "gateway" (otherwise 0), and whose per-process top lists are empty.
 */
function syntheticResourceSamples({ peakRssMb, maxCpuPercent, role }) {
  // A fresh entry per list so the two "top roles" arrays never share an object.
  const topRoleEntry = () => ({ role, peakRssMb, maxCpuPercent });

  let peakGatewayRssMb = 0;
  if (role === "gateway") {
    peakGatewayRssMb = peakRssMb;
  }

  const byRole = {};
  byRole[role] = { peakRssMb, maxCpuPercent, peakProcessCount: 1 };

  return {
    sampleCount: 1,
    peakTotalRssMb: peakRssMb,
    maxTotalCpuPercent: maxCpuPercent,
    peakCommandTreeRssMb: peakRssMb,
    peakGatewayRssMb,
    byRole,
    topRolesByRss: [topRoleEntry()],
    topRolesByCpu: [topRoleEntry()],
    topByRss: [],
    topByCpu: []
  };
}

/**
 * Self-check: a failing record in a partially-run gate must still yield a
 * DO_NOT_SHIP verdict.
 *
 * The synthetic report contains one FAIL record for `release-runtime-startup`
 * and an include filter for that scenario only, while the profile's gate also
 * lists `fresh-install` as blocking. The check expects the gate to be marked
 * partial and incomplete, to count one missing required entry, and to expose
 * a "filtered-required-scenario" card.
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function gatePartialFailureCheck() {
  const id = "gate-partial-failure-do-not-ship";
  const command = "evaluate synthetic partial release gate failure";

  try {
    const failedStartup = {
      scenario: "release-runtime-startup",
      state: { id: "fresh" },
      status: "FAIL",
      title: "Release Runtime Startup",
      likelyOwner: "OpenClaw",
      violations: [{ message: "gateway became healthy after 47100ms, beyond the 30000ms threshold" }],
      phases: []
    };
    const report = {
      mode: "execution",
      controls: { include: ["scenario:release-runtime-startup"], exclude: [] },
      records: [failedStartup]
    };
    const profile = {
      id: "release",
      gate: {
        id: "test-release-gate",
        blocking: [
          { scenario: "release-runtime-startup", state: "fresh" },
          { scenario: "fresh-install", state: "fresh" }
        ]
      }
    };

    const gate = evaluateGate(report, profile);

    assertEqual(gate.verdict, "DO_NOT_SHIP", "partial gate failure verdict");
    assertEqual(gate.partial, true, "partial gate marker");
    assertEqual(gate.complete, false, "partial gate completeness");
    assertEqual(gate.missingRequiredCount, 1, "partial gate missing count");
    const showsFilteredCard = gate.cards.some((card) => card.kind === "filtered-required-scenario");
    assertEqual(showsFilteredCard, true, "filtered required card");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check: a passing record in a partially-run gate must yield a PARTIAL
 * verdict, not a ship decision.
 *
 * Uses the same shape as the partial-failure case, but the single included
 * record has status PASS. The gate is expected to report verdict "PARTIAL",
 * `ok` false, `complete` false and `partial` true.
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function gatePartialPassCheck() {
  const id = "gate-partial-pass";
  const command = "evaluate synthetic partial release gate pass";

  try {
    const passedStartup = {
      scenario: "release-runtime-startup",
      state: { id: "fresh" },
      status: "PASS",
      title: "Release Runtime Startup",
      likelyOwner: "OpenClaw",
      phases: []
    };
    const report = {
      mode: "execution",
      controls: { include: ["scenario:release-runtime-startup"], exclude: [] },
      records: [passedStartup]
    };
    const profile = {
      id: "release",
      gate: {
        id: "test-release-gate",
        blocking: [
          { scenario: "release-runtime-startup", state: "fresh" },
          { scenario: "fresh-install", state: "fresh" }
        ]
      }
    };

    const gate = evaluateGate(report, profile);

    assertEqual(gate.verdict, "PARTIAL", "partial gate pass verdict");
    assertEqual(gate.ok, false, "partial gate not ok");
    assertEqual(gate.complete, false, "partial gate completeness");
    assertEqual(gate.partial, true, "partial gate marker");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check for platform coverage handling in the gate.
 *
 * The synthetic report declares a darwin/arm64 platform. The profile requires
 * `darwin-arm64` as blocking platform coverage and lists `linux-x64` as
 * warning-level coverage. The check expects a complete SHIP result, no
 * platform card for `darwin-arm64`, and a warning-severity platform card for
 * `linux-x64`.
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function gatePlatformCoverageCheck() {
  const id = "gate-platform-coverage";
  const command = "evaluate synthetic release gate platform coverage";

  try {
    const report = {
      mode: "execution",
      controls: { include: [], exclude: [] },
      platform: { os: "darwin", arch: "arm64", release: "25.3.0", node: "v24.13.0" },
      records: [{
        scenario: "release-runtime-startup",
        state: { id: "fresh" },
        status: "PASS",
        title: "Release Runtime Startup",
        likelyOwner: "OpenClaw",
        phases: []
      }]
    };
    const profile = {
      id: "release",
      gate: {
        id: "test-release-gate",
        coverage: {
          platforms: { blocking: ["darwin-arm64"], warning: ["linux-x64"] }
        },
        blocking: [{ scenario: "release-runtime-startup", state: "fresh" }]
      }
    };

    const gate = evaluateGate(report, profile);

    assertEqual(gate.verdict, "SHIP", "current required platform coverage should pass");
    assertEqual(gate.outcome, "SHIP", "release gate outcome matches ship verdict");
    assertEqual(gate.complete, true, "platform-covered gate completeness");

    const darwinFlagged = gate.cards.some((card) => {
      return card.coverage === "platform" && card.expected === "platform coverage darwin-arm64";
    });
    assertEqual(darwinFlagged, false, "darwin-arm64 should not be missing");

    const linuxWarned = gate.cards.some((card) => {
      return card.coverage === "platform"
        && card.expected === "platform coverage linux-x64"
        && card.severity === "warning";
    });
    assertEqual(linuxWarned, true, "linux warning platform should remain visible");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check for gate outcome naming on a non-release profile.
 *
 * Evaluates one passing `gateway-performance` record against a profile with
 * id "benchmark" and purpose "performance". The check expects the verdict to
 * stay "SHIP" while the outcome reads "PASS" and the purpose is carried
 * through as "performance".
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function gateNonReleaseOutcomeCheck() {
  const id = "gate-non-release-outcome";
  const command = "evaluate synthetic non-release gate outcome";

  try {
    const report = {
      mode: "execution",
      controls: { include: [], exclude: [] },
      records: [{
        scenario: "gateway-performance",
        surface: "gateway-performance",
        state: { id: "many-bundled-plugins" },
        status: "PASS",
        title: "Gateway Performance",
        likelyOwner: "OpenClaw",
        phases: []
      }]
    };
    const profile = {
      id: "benchmark",
      purpose: "performance",
      gate: {
        id: "test-performance-gate",
        blocking: [{ scenario: "gateway-performance", state: "many-bundled-plugins" }]
      }
    };

    const gate = evaluateGate(report, profile);

    assertEqual(gate.verdict, "SHIP", "non-release gate keeps compatibility verdict");
    assertEqual(gate.outcome, "PASS", "non-release gate maps ship verdict to pass outcome");
    assertEqual(gate.purpose, "performance", "non-release gate purpose");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check for requirement coverage handling in the gate.
 *
 * The profile requires `release-runtime-startup:baseline` as blocking
 * requirement coverage and lists `fresh-install:baseline` as warning-level.
 * A resolved-coverage obligation for the blocking requirement is passed as
 * the third argument to `evaluateGate`. The check expects a SHIP verdict, no
 * requirement card for the covered requirement, and a warning-severity
 * requirement card for the uncovered one.
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function gateRequirementCoverageCheck() {
  const id = "gate-requirement-coverage";
  const command = "evaluate synthetic release gate requirement coverage";

  try {
    const profile = {
      id: "release",
      gate: {
        id: "test-release-gate",
        coverage: {
          requirements: {
            blocking: ["release-runtime-startup:baseline"],
            warning: ["fresh-install:baseline"]
          }
        },
        blocking: [{ scenario: "release-runtime-startup", state: "fresh" }]
      }
    };
    const report = {
      mode: "execution",
      controls: { include: [], exclude: [] },
      records: [{
        scenario: "release-runtime-startup",
        surface: "release-runtime-startup",
        state: { id: "fresh" },
        status: "PASS",
        title: "Release Runtime Startup",
        likelyOwner: "OpenClaw",
        phases: []
      }]
    };
    const plannedObligation = {
      surface: "release-runtime-startup",
      requirement: "baseline",
      scenario: "release-runtime-startup",
      state: "fresh",
      status: "planned"
    };

    const gate = evaluateGate(report, profile, {
      resolvedCoverage: { obligations: [plannedObligation] }
    });

    assertEqual(gate.verdict, "SHIP", "required requirement coverage should pass");

    const coveredFlagged = gate.cards.some((card) => {
      return card.coverage === "requirement"
        && card.expected === "requirement coverage release-runtime-startup:baseline";
    });
    assertEqual(coveredFlagged, false, "covered requirement should not be missing");

    const uncoveredWarned = gate.cards.some((card) => {
      return card.coverage === "requirement"
        && card.expected === "requirement coverage fresh-install:baseline"
        && card.severity === "warning";
    });
    assertEqual(uncoveredWarned, true, "missing warning requirement should remain visible");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check for per-subsystem summaries on a failing gate.
 *
 * Evaluates two FAIL records with different `likelyOwner` values, both listed
 * as blocking. The check expects a DO_NOT_SHIP verdict, two subsystem
 * entries, two fixer summaries, and a first fixer prompt that contains the
 * phrase "Use the JSON report card measurements".
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function gateSubsystemSummaryCheck() {
  const id = "gate-subsystem-summary";
  const command = "evaluate synthetic gate subsystem summaries";

  try {
    const gatewayFailure = {
      scenario: "gateway-performance",
      state: { id: "many-bundled-plugins" },
      status: "FAIL",
      title: "Gateway Performance",
      likelyOwner: "gateway-runtime",
      violations: [{ message: "gateway RSS 1200 MB exceeded threshold 900 MB" }],
      phases: []
    };
    const providerFailure = {
      scenario: "agent-provider-timeout",
      state: { id: "mock-openai-provider" },
      status: "FAIL",
      title: "Agent Provider Timeout",
      likelyOwner: "agent-runtime/provider",
      violations: [{ message: "provider timeout was not contained" }],
      phases: []
    };
    const report = {
      mode: "execution",
      controls: { include: [], exclude: [] },
      records: [gatewayFailure, providerFailure]
    };
    const profile = {
      id: "release",
      gate: {
        id: "test-release-gate",
        blocking: [
          { scenario: "gateway-performance", state: "many-bundled-plugins" },
          { scenario: "agent-provider-timeout", state: "mock-openai-provider" }
        ]
      }
    };

    const gate = evaluateGate(report, profile);

    assertEqual(gate.verdict, "DO_NOT_SHIP", "subsystem gate verdict");
    assertEqual(gate.subsystems?.length, 2, "subsystem count");
    assertEqual(gate.fixerSummaries?.length, 2, "fixer summary count");
    // A missing first summary short-circuits to undefined, which then fails the comparison.
    const promptHasGuidance = gate.fixerSummaries[0]?.fixerPrompt.includes("Use the JSON report card measurements");
    assertEqual(promptHasGuidance, true, "fixer prompt evidence guidance");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check for the performance baseline workflow, using synthetic reports.
 *
 * Steps, in order:
 *  1. Build a three-run baseline report and confirm an update is refused
 *     without review, for a report with a FAIL record, and for a report
 *     whose record is marked as a profiled run.
 *  2. Store the baseline in `<tmp>/baselines.json`, reload it, and confirm the
 *     entry key contains the target value and that a different target value
 *     finds no baseline.
 *  3. Confirm a report flagged as parallel is refused as a baseline.
 *  4. Build a slower three-run report, check its median and p95 readiness
 *     values, compare it with the stored baseline using 10% regression
 *     thresholds, and confirm the regression blocks both a baseline update
 *     and the gate verdict.
 *
 * @param {string} tmp Directory in which the baseline store file is written.
 * @returns {Promise<{ id: string, status: string, command: string, durationMs: number, message?: string }>}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
async function performanceBaselineCheck(tmp) {
  const id = "performance-baseline-regression";
  const command = "evaluate synthetic repeat performance baseline";

  try {
    const platform = { os: "darwin", arch: "arm64", release: "test", node: "v24.0.0" };
    const targetPlan = { kind: "local-build", value: "/tmp/openclaw" };
    const target = "local-build:/tmp/openclaw";

    // One synthetic run: health measurement first, then the remaining metrics.
    const runSample = (index, healthReadyAtMs, metrics) => syntheticPerformanceRecord(index, {
      health: syntheticHealthMeasurement({ healthReadyAtMs }),
      ...metrics
    });
    // A synthetic report with its performance summary attached.
    const reportFor = (runId, records, repeat) => {
      const report = syntheticPerformanceReport({ runId, platform, target, records });
      report.performance = buildPerformanceSummary(report.records, { repeat });
      return report;
    };
    const blockedBy = (review, kind) => review.blockers.some((blocker) => blocker.kind === kind);

    const baselineReport = reportFor("baseline", [
      runSample(1, 1000, { peakRssMb: 400, cpuPercentMax: 20, eventLoopDelayMs: 100, agentTurnMs: 2000 }),
      runSample(2, 1200, { peakRssMb: 420, cpuPercentMax: 22, eventLoopDelayMs: 110, agentTurnMs: 2200 }),
      runSample(3, 1100, { peakRssMb: 410, cpuPercentMax: 21, eventLoopDelayMs: 105, agentTurnMs: 2100 })
    ], 3);

    const baselinePath = join(tmp, "baselines.json");
    const unreviewed = reviewBaselineUpdate(baselineReport, { reviewedGood: false });
    assertEqual(unreviewed.ok, false, "baseline update requires review");
    assertEqual(blockedBy(unreviewed, "review-required"), true, "baseline review-required blocker");

    const failingReport = reportFor("failing", [
      {
        ...runSample(1, 1000, { peakRssMb: 400 }),
        status: "FAIL",
        violations: [{ message: "gateway readiness exceeded threshold" }]
      }
    ], 1);
    const failingReview = reviewBaselineUpdate(failingReport, { reviewedGood: true });
    assertEqual(failingReview.ok, false, "failing report rejected for baseline");
    assertEqual(blockedBy(failingReview, "non-passing-records"), true, "non-passing blocker");

    const profiledReport = reportFor("profiled", [
      {
        ...runSample(1, 1000, { peakRssMb: 400 }),
        profiling: { enabled: true, interpretation: "instrumented run", baselineEligible: false }
      }
    ], 1);
    const profiledReview = reviewBaselineUpdate(profiledReport, { reviewedGood: true });
    assertEqual(profiledReview.ok, false, "profiled report rejected for baseline");
    assertEqual(blockedBy(profiledReview, "profiled-run"), true, "profiled-run blocker");

    const initialStore = await loadBaselineStore(baselinePath);
    const savedStore = updateBaselineStore(initialStore, baselineReport, { targetPlan, reviewedGood: true });
    await saveBaselineStore(baselinePath, savedStore);
    const loadedStore = await loadBaselineStore(baselinePath);
    const storedKeys = Object.keys(loadedStore.entries);
    assertEqual(storedKeys.length, 1, "baseline entry count");
    assertEqual(storedKeys[0].includes("/tmp/openclaw"), true, "baseline key includes target value");

    const otherTargetComparison = comparePerformanceToBaseline(baselineReport, loadedStore, {
      targetPlan: { kind: "local-build", value: "/tmp/other-openclaw" }
    });
    assertEqual(otherTargetComparison.missingBaselineCount, 1, "different target value misses baseline");

    const parallelReport = {
      ...baselineReport,
      controls: { parallel: 2 },
      performance: { ...baselineReport.performance, parallel: 2, parallelContaminated: true }
    };
    const parallelReview = reviewBaselineUpdate(parallelReport, { reviewedGood: true });
    assertEqual(parallelReview.ok, false, "parallel report rejected for baseline");
    assertEqual(blockedBy(parallelReview, "parallel-performance"), true, "parallel-performance blocker");

    const currentReport = reportFor("current", [
      runSample(1, 1800, { peakRssMb: 500, cpuPercentMax: 30, eventLoopDelayMs: 180, agentTurnMs: 3000 }),
      runSample(2, 1900, { peakRssMb: 510, cpuPercentMax: 31, eventLoopDelayMs: 190, agentTurnMs: 3100 }),
      runSample(3, 2000, { peakRssMb: 520, cpuPercentMax: 32, eventLoopDelayMs: 200, agentTurnMs: 3200 })
    ], 3);
    assertEqual(currentReport.performance.groups[0].metrics.readinessHealthReadyMs.median, 1900, "performance median");
    assertEqual(currentReport.performance.groups[0].metrics.readinessHealthReadyMs.p95, 1990, "performance p95");

    const regressionThresholds = {
      startupRegressionPercent: 10,
      rssRegressionPercent: 10,
      cpuRegressionPercent: 10,
      eventLoopRegressionPercent: 10,
      agentLatencyRegressionPercent: 10
    };
    const comparison = comparePerformanceToBaseline(currentReport, loadedStore, { targetPlan, regressionThresholds });
    assertEqual(comparison.ok, false, "baseline comparison regression");
    const startupRegressed = comparison.regressions.some((regression) => regression.metric === "readinessHealthReadyMs");
    assertEqual(startupRegressed, true, "startup regression present");

    const regressedReview = reviewBaselineUpdate(
      { ...currentReport, baseline: { path: baselinePath, comparison } },
      { reviewedGood: true }
    );
    assertEqual(regressedReview.ok, false, "regressed current report rejected for baseline update");
    assertEqual(blockedBy(regressedReview, "baseline-regression"), true, "baseline-regression blocker");

    const gateReport = {
      mode: "execution",
      controls: {},
      platform,
      baseline: { path: baselinePath, comparison },
      records: currentReport.records
    };
    const gateProfile = {
      id: "perf-gate",
      gate: {
        id: "perf-gate",
        blocking: [{ scenario: "fresh-install", state: "fresh" }]
      }
    };
    const gate = evaluateGate(gateReport, gateProfile);
    assertEqual(gate.verdict, "DO_NOT_SHIP", "performance regression gate verdict");
    assertEqual(gate.baseline?.regressionCount, comparison.regressionCount, "gate baseline regression count");
    assertEqual(gate.baseline?.regressedGroups?.[0]?.scenario, "fresh-install", "gate baseline group scenario");
    const hasRegressionCard = gate.cards.some((card) => card.kind === "performance-regression");
    assertEqual(hasRegressionCard, true, "performance regression gate card");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Wraps synthetic records in a minimal execution-mode report.
 *
 * @param {{ runId: string, platform: object, target: string, records: object[] }} parts
 *   Values copied into the report as-is.
 * @returns {object} Report with a fixed schema version ("kova.report.v1"), a
 *   fixed generation timestamp and mode "execution".
 */
function syntheticPerformanceReport({ runId, platform, target, records }) {
  // Properties are added in the same order the report lists them when serialized.
  const report = {
    schemaVersion: "kova.report.v1",
    generatedAt: "2026-04-29T00:00:00.000Z"
  };
  report.runId = runId;
  report.mode = "execution";
  report.target = target;
  report.platform = platform;
  report.records = records;
  return report;
}

/**
 * Builds one passing `fresh-install` record for a repeat run.
 *
 * @param {number} index Repeat index; also used as the suffix of the
 *   environment name (`kova-fresh-install-r<index>`).
 * @param {object} measurements Stored on the record unchanged.
 * @returns {object} Record with status "PASS", state "fresh", an empty phase
 *   list, and a repeat descriptor whose total is always 3.
 */
function syntheticPerformanceRecord(index, measurements) {
  const scenarioId = "fresh-install";
  const state = { id: "fresh", title: "Fresh" };
  const repeat = { index, total: 3 };
  const envName = `kova-fresh-install-r${index}`;

  return {
    scenario: scenarioId,
    surface: scenarioId,
    title: "Fresh Install",
    status: "PASS",
    target: "local-build:/tmp/openclaw",
    state,
    repeat,
    envName,
    measurements,
    phases: []
  };
}

/**
 * Builds a synthetic health measurement describing a gateway that became
 * ready and is running.
 *
 * @param {{ listeningReadyAtMs?: number|null, healthReadyAtMs?: number|null }} [timings]
 *   Readiness timestamps copied into the `readiness` section; each defaults
 *   to null.
 * @returns {object} Measurement with schema version "kova.health.v1", a
 *   "ready"/"pass" readiness section, empty summaries for the startup,
 *   post-ready and unknown sample scopes, a final summary marked running and
 *   healthy, and no slowest sample.
 */
function syntheticHealthMeasurement({ listeningReadyAtMs = null, healthReadyAtMs = null } = {}) {
  const readiness = {
    phaseId: "start",
    listeningReadyAtMs,
    healthReadyAtMs,
    classification: "ready",
    severity: "pass",
    reason: "synthetic readiness",
    thresholdMs: 30000,
    deadlineMs: 90000,
    attempts: 1
  };
  const startupSamples = emptySyntheticHealthSummary("startup-sample");
  const postReadySamples = emptySyntheticHealthSummary("post-ready");
  const unknownSamples = emptySyntheticHealthSummary("unknown");
  // The final summary starts from an empty one and adds the running/healthy flags.
  const finalSummary = {
    ...emptySyntheticHealthSummary("final"),
    gatewayState: "running",
    ok: true,
    healthOk: true
  };

  return {
    schemaVersion: "kova.health.v1",
    readiness,
    startupSamples,
    postReadySamples,
    unknownSamples,
    final: finalSummary,
    slowestSample: null
  };
}

/**
 * Builds a health-sample summary that contains no samples.
 *
 * @param {string} scope Label stored on the summary.
 * @returns {object} Summary with all counters at 0 and every latency
 *   statistic, as well as the slowest phase id, set to null.
 */
function emptySyntheticHealthSummary(scope) {
  const summary = { scope };
  for (const counter of ["count", "okCount", "failureCount"]) {
    summary[counter] = 0;
  }
  // With no samples there is nothing to report for these fields.
  for (const unset of ["minMs", "p50Ms", "p95Ms", "maxMs", "slowestPhaseId"]) {
    summary[unset] = null;
  }
  return summary;
}

/**
 * Self-check: a gated release matrix run that is not executed must be
 * reported as BLOCKED.
 *
 * Runs the `matrix run ... --gate` CLI command (no `--execute` flag is
 * passed) with reports written to `tmp`, then verifies that:
 *  - the command exits non-zero,
 *  - the JSON receipt on stdout carries a BLOCKED, not-ok gate,
 *  - the report file named by the receipt contains a "not-executed" card,
 *  - the structured report summary includes a fixer prompt,
 *  - the retained gate artifacts named by the receipt exist and record the
 *    BLOCKED verdict.
 *
 * The retained artifact directory named by the receipt is always removed
 * before returning, including when one of the verifications above fails, so
 * a failing self-check does not leave that directory behind.
 *
 * @param {string} tmp Directory passed to the command as `--report-dir`.
 * @returns {Promise<{ id: string, status: string, command: string, durationMs: number, message?: string }>}
 *   A PASS row when every verification holds, otherwise a FAIL row carrying
 *   the first error's message. `durationMs` is the command's reported
 *   duration.
 */
async function gateDryRunCheck(tmp) {
  const id = "gate-dry-run-blocked";
  const command = `node bin/kova.mjs matrix run --profile release --target runtime:stable --include scenario:release-runtime-startup --gate --report-dir ${quoteShell(tmp)} --json`;
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });

  let retainedDir = null;
  let failed = false;
  let message;

  try {
    if (result.status === 0) {
      throw new Error("gate dry-run should exit non-zero");
    }
    const data = JSON.parse(result.stdout);

    // Remember the directory as soon as the receipt names it, so it can be
    // cleaned up even if a later verification throws.
    const reportedDir = data?.retainedGateArtifacts?.outputDir;
    if (typeof reportedDir === "string" && reportedDir.length > 0) {
      retainedDir = reportedDir;
    }

    assertEqual(data.schemaVersion, "kova.matrix.run.receipt.v1", "gate receipt schema");
    assertEqual(data.gate?.verdict, "BLOCKED", "gate dry-run verdict");
    assertEqual(data.gate?.ok, false, "gate dry-run ok");
    const report = JSON.parse(await readFile(data.jsonPath, "utf8"));
    assertEqual(report.gate?.cards?.some((card) => card.kind === "not-executed"), true, "gate not-executed card");
    const summary = renderReportSummary(report, { structured: true });
    assertString(summary.failureBrief?.fixerPrompt, "failure brief fixer prompt");
    assertString(data.retainedGateArtifacts?.outputDir, "retained gate artifact dir");
    assertString(data.retainedGateArtifacts?.pasteSummaryPath, "retained paste summary path");
    const retainedIndexPath = join(data.retainedGateArtifacts.outputDir, "retained-artifacts.json");
    const retained = JSON.parse(await readFile(retainedIndexPath, "utf8"));
    assertEqual(retained.verdict, "BLOCKED", "retained artifact verdict");
  } catch (error) {
    failed = true;
    message = error.message;
  }

  if (retainedDir !== null) {
    try {
      await rm(retainedDir, { recursive: true, force: true });
    } catch (error) {
      // Keep the first failure; a cleanup error only surfaces when nothing
      // else went wrong.
      if (!failed) {
        failed = true;
        message = error.message;
      }
    }
  }

  if (failed) {
    return { id, status: "FAIL", command, durationMs: result.durationMs, message };
  }
  return { id, status: "PASS", command, durationMs: result.durationMs };
}

/**
 * Self-check for the guard that stops scenario commands from touching
 * environments other than the Kova-owned one.
 *
 * With "kova-safe-test" as the environment under test and "Team Env" as the
 * declared source environment, the check expects:
 *  - starting the Kova environment and cloning "Team Env" into it are allowed,
 *  - destroy, upgrade, `@` and clone-into commands aimed at "Violet" are each
 *    refused,
 *  - cloning from an undeclared source ("Other") is refused.
 * A command counts as refused only when the guard throws an error whose
 * message matches "refusing to mutate non-Kova".
 *
 * @returns {{ id: string, status: string, command: string, durationMs: number, message?: string }}
 *   A PASS row when all expectations hold, otherwise a FAIL row with the
 *   message of the first error thrown.
 */
function safetyGuardCheck() {
  const id = "durable-env-mutation-guard";
  const command = "evaluate synthetic command guard cases";
  const kovaEnv = "kova-safe-test";

  // True only for the guard's own refusal; a clean return or any other error
  // counts as "not refused".
  const isRefused = (candidate) => {
    try {
      assertSafeScenarioCommand(candidate, { sourceEnv: "Team Env" }, kovaEnv);
    } catch (error) {
      return /refusing to mutate non-Kova/.test(error.message);
    }
    return false;
  };

  try {
    assertSafeScenarioCommand("ocm start kova-safe-test --runtime stable --json", {}, kovaEnv);
    assertSafeScenarioCommand("ocm env clone 'Team Env' kova-safe-test --json", { sourceEnv: "Team Env" }, kovaEnv);

    const mustBeRefused = [
      "ocm env destroy Violet --yes",
      "ocm upgrade Violet --channel beta --json",
      "ocm @Violet -- status",
      "ocm env clone 'Team Env' Violet --json"
    ];
    const refusedCount = mustBeRefused.filter((candidate) => isRefused(candidate)).length;
    assertEqual(refusedCount, mustBeRefused.length, "durable env mutation cases blocked");

    const wrongSourceRefused = isRefused("ocm env clone Other kova-safe-test --json");
    assertEqual(wrongSourceRefused, true, "unexpected source env clone blocked");
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
  return { id, status: "PASS", command, durationMs: 0 };
}

/**
 * Self-check: a local-build run removes its runtime and retries a failed removal.
 *
 * Writes a mock `ocm` shell script into `<tmp>/mock-bin` and puts that directory first on
 * PATH. The mock appends every invocation to a log file and, using a counter file, fails
 * the first `runtime remove` call ("runtime busy shutting down") and succeeds on the
 * second. The check then runs `kova run --target local-build:… --execute` and verifies:
 *   - `report.targetCleanup.status` is "removed",
 *   - `report.targetCleanup.result.attempts` has exactly two entries,
 *   - the mock log contains `runtime remove kova-local-<digits> --json`.
 *
 * Fixture setup runs inside the `try`, so a filesystem or spawn failure is reported as a
 * FAIL result rather than rejecting the returned promise.
 *
 * @param {string} tmp Scratch directory that receives the mock binary, repo dir, report dir and log files.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `durationMs` is 0 when the command never ran.
 */
async function localBuildRuntimeCleanupCheck(tmp) {
  const id = "local-build-runtime-cleanup";
  const binDir = join(tmp, "mock-bin");
  const repoDir = join(tmp, "mock-openclaw repo");
  const reportDir = join(tmp, "local-build-cleanup-report");
  const ocmLog = join(tmp, "mock-ocm.log");
  const removeCount = join(tmp, "mock-runtime-remove-count");
  const ocmPath = join(binDir, "ocm");
  const command = `node bin/kova.mjs run --target local-build:${quoteShell(repoDir)} --scenario fresh-install --execute --report-dir ${quoteShell(reportDir)} --json`;
  // Stays undefined until the command has run, which lets the catch block distinguish a
  // setup failure (no duration available) from a failed assertion.
  let result;

  try {
    await mkdir(binDir, { recursive: true });
    await mkdir(repoDir, { recursive: true });
    await writeFile(ocmPath, `#!/bin/sh
printf '%s\\n' "$*" >> "$KOVA_MOCK_OCM_LOG"
case "$1:$2" in
  runtime:build-local) echo '{"ok":true}'; exit 0 ;;
  runtime:remove)
    count=0
    if [ -f "$KOVA_MOCK_REMOVE_COUNT" ]; then count=$(cat "$KOVA_MOCK_REMOVE_COUNT"); fi
    count=$((count + 1))
    printf '%s' "$count" > "$KOVA_MOCK_REMOVE_COUNT"
    if [ "$count" -lt 2 ]; then echo 'runtime busy shutting down' >&2; exit 1; fi
    echo '{"removed":true}'
    exit 0
    ;;
  service:status) echo '{"running":false,"desiredRunning":false,"childPid":null,"gatewayPort":null,"gatewayState":"stopped"}'; exit 0 ;;
  env:exec) exit 0 ;;
  env:destroy) echo '{"destroyed":true}'; exit 0 ;;
esac
case "$1" in
  start) echo '{"ok":true}'; exit 0 ;;
  logs) exit 0 ;;
  @*) echo 'ok'; exit 0 ;;
  --version) echo 'mock-ocm'; exit 0 ;;
esac
echo "unhandled mock ocm command: $*" >&2
exit 2
`, "utf8");
    await chmod(ocmPath, 0o755);

    result = await runCommand(command, {
      timeoutMs: 30000,
      maxOutputChars: 1000000,
      env: {
        PATH: `${binDir}:${process.env.PATH}`,
        KOVA_MOCK_OCM_LOG: ocmLog,
        KOVA_MOCK_REMOVE_COUNT: removeCount
      }
    });
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }

    // stdout is a JSON receipt whose `jsonPath` points at the full report.
    const receipt = JSON.parse(result.stdout);
    const report = JSON.parse(await readFile(receipt.jsonPath, "utf8"));
    const log = await readFile(ocmLog, "utf8");
    assertEqual(report.targetCleanup?.status, "removed", "local-build target cleanup status");
    assertEqual(report.targetCleanup?.result?.attempts?.length, 2, "local-build target cleanup retry attempts");
    if (!/runtime remove kova-local-\d+ --json/.test(log)) {
      throw new Error(`runtime remove was not called; log:\n${log}`);
    }
    return {
      id,
      status: "PASS",
      command,
      durationMs: result.durationMs
    };
  } catch (error) {
    return {
      id,
      status: "FAIL",
      command,
      durationMs: result ? result.durationMs : 0,
      message: error.message
    };
  }
}

/**
 * Self-check: cleanup after a failed local build treats a missing runtime/env as
 * "already-absent".
 *
 * Writes a mock `ocm` script whose `runtime build-local` fails with "dependency install
 * failed" and whose `runtime remove` and `env destroy` both fail with a "does not exist"
 * message. It then runs `kova run --target local-build:… --execute`, followed by
 * `kova report summarize` on the produced report, and verifies:
 *   - the report counts exactly one BLOCKED scenario,
 *   - the record's `cleanup` and the report's `targetCleanup.status` are "already-absent",
 *   - the summary's first scenario carries the failure reason "dependency install failed",
 *   - the mock log contains `runtime remove kova-local-<digits> --json`.
 *
 * Fixture setup runs inside the `try`, so a filesystem or spawn failure is reported as a
 * FAIL result rather than rejecting the returned promise.
 *
 * @param {string} tmp Scratch directory that receives the mock binary, repo dir, report dir and log file.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `durationMs` is that of the `kova run` command, or 0 when it never ran.
 */
async function localBuildRuntimeAlreadyAbsentCleanupCheck(tmp) {
  const id = "local-build-runtime-already-absent-cleanup";
  const binDir = join(tmp, "mock-bin-absent-runtime");
  const repoDir = join(tmp, "mock-openclaw failed build");
  const reportDir = join(tmp, "local-build-absent-cleanup-report");
  const ocmLog = join(tmp, "mock-ocm-absent.log");
  const ocmPath = join(binDir, "ocm");
  const command = `node bin/kova.mjs run --target local-build:${quoteShell(repoDir)} --scenario fresh-install --execute --report-dir ${quoteShell(reportDir)} --json`;
  // Stays undefined until the command has run, which lets the catch block distinguish a
  // setup failure (no duration available) from a failed assertion.
  let result;

  try {
    await mkdir(binDir, { recursive: true });
    await mkdir(repoDir, { recursive: true });
    await writeFile(ocmPath, `#!/bin/sh
printf '%s\\n' "$*" >> "$KOVA_MOCK_OCM_LOG"
case "$1:$2" in
  runtime:build-local) echo 'dependency install failed' >&2; exit 1 ;;
  runtime:remove) echo 'ocm: runtime "kova-local-mock" does not exist' >&2; exit 1 ;;
  service:status) echo '{"running":false,"desiredRunning":false,"childPid":null,"gatewayPort":null,"gatewayState":"stopped"}'; exit 0 ;;
  env:destroy) echo 'ocm: environment "kova-mock" does not exist' >&2; exit 1 ;;
esac
case "$1" in
  --version) echo 'mock-ocm'; exit 0 ;;
esac
echo "unhandled mock ocm command: $*" >&2
exit 2
`, "utf8");
    await chmod(ocmPath, 0o755);

    result = await runCommand(command, {
      timeoutMs: 30000,
      maxOutputChars: 1000000,
      env: {
        PATH: `${binDir}:${process.env.PATH}`,
        KOVA_MOCK_OCM_LOG: ocmLog
      }
    });
    // The run itself must exit 0 even though the scenario inside it is expected to be BLOCKED.
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const receipt = JSON.parse(result.stdout);
    const report = JSON.parse(await readFile(receipt.jsonPath, "utf8"));

    const summaryResult = await runCommand(`node bin/kova.mjs report summarize ${quoteShell(receipt.jsonPath)} --json`, {
      timeoutMs: 30000,
      maxOutputChars: 1000000
    });
    if (summaryResult.status !== 0) {
      throw new Error(summaryResult.stderr.trim() || summaryResult.stdout.trim() || `summary exit ${summaryResult.status}`);
    }
    const summary = JSON.parse(summaryResult.stdout);
    const log = await readFile(ocmLog, "utf8");

    assertEqual(report.summary?.statuses?.BLOCKED, 1, "failed local-build scenario status");
    assertEqual(report.records?.[0]?.cleanup, "already-absent", "already absent env cleanup status");
    assertEqual(report.targetCleanup?.status, "already-absent", "already absent local-build target cleanup status");
    assertEqual(summary.scenarios?.[0]?.failureReason, "dependency install failed", "summary failure reason");
    if (!/runtime remove kova-local-\d+ --json/.test(log)) {
      throw new Error(`runtime remove was not called after failed build; log:\n${log}`);
    }
    return {
      id,
      status: "PASS",
      command,
      durationMs: result.durationMs
    };
  } catch (error) {
    return {
      id,
      status: "FAIL",
      command,
      durationMs: result ? result.durationMs : 0,
      message: error.message
    };
  }
}

/**
 * Self-check for the CPU profile summarizer.
 *
 * Summarizes the bundled `sample.cpuprofile` fixture with a limit of 3 and expects one
 * parsed profile, no parse errors, and `collectBundledPluginMetadata` as the top function
 * with 7 ms of self time.
 *
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `message` is present only on failure.
 */
async function cpuProfileParserCheck() {
  const fixture = "fixtures/diagnostics/sample.cpuprofile";
  // Builds the result object; `extra` only carries the failure message.
  const verdict = (status, extra) => ({
    id: "cpu-profile-parser",
    status,
    command: "parse fixtures/diagnostics/sample.cpuprofile",
    durationMs: 0,
    ...extra
  });

  try {
    const parsed = await summarizeCpuProfiles([fixture], { limit: 3 });
    assertEqual(parsed.profileCount, 1, "CPU profile count");
    assertEqual(parsed.parseErrorCount, 0, "CPU profile parse errors");
    const hottest = parsed.topFunctions[0];
    assertEqual(hottest?.functionName, "collectBundledPluginMetadata", "top CPU function");
    assertEqual(hottest?.selfMs, 7, "top CPU self ms");
    return verdict("PASS");
  } catch (error) {
    return verdict("FAIL", { message: error.message });
  }
}

/**
 * Self-check for the heap profile summarizer.
 *
 * Summarizes the bundled `sample.heapprofile` fixture with a limit of 3 and expects one
 * parsed profile, no parse errors, and `loadBundledPluginMetadata` as the top function
 * with a self size of 7 MB.
 *
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `message` is present only on failure.
 */
async function heapProfileParserCheck() {
  const fixture = "fixtures/diagnostics/sample.heapprofile";
  // Builds the result object; `extra` only carries the failure message.
  const verdict = (status, extra) => ({
    id: "heap-profile-parser",
    status,
    command: "parse fixtures/diagnostics/sample.heapprofile",
    durationMs: 0,
    ...extra
  });

  try {
    const parsed = await summarizeHeapProfiles([fixture], { limit: 3 });
    assertEqual(parsed.profileCount, 1, "heap profile count");
    assertEqual(parsed.parseErrorCount, 0, "heap profile parse errors");
    const largest = parsed.topFunctions[0];
    assertEqual(largest?.functionName, "loadBundledPluginMetadata", "top heap function");
    assertEqual(largest?.selfSizeMb, 7, "top heap size mb");
    return verdict("PASS");
  } catch (error) {
    return verdict("FAIL", { message: error.message });
  }
}

/**
 * Self-check for the provider evidence parsers and turn attribution.
 *
 * Covers three things in order:
 *   1. `parseProviderRequestLog` on the mock JSONL fixture (request count, total provider
 *      duration, first-byte latency),
 *   2. `parseTimelineProviderRequestLog` on a single synthetic `provider.request`
 *      diagnostics event (count, duration, route taken from `operation`),
 *   3. `computeProviderTurnAttribution` for a six-second synthetic agent command against
 *      the fixture evidence (pre-provider, provider-final and post-provider latencies),
 *      followed by the token usage reported by the fixture.
 *
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `message` is present only on failure.
 */
async function providerEvidenceParserCheck() {
  // Builds the result object; `extra` only carries the failure message.
  const verdict = (status, extra) => ({
    id: "provider-evidence-parser",
    status,
    command: "parse fixtures/provider/mock-requests.jsonl",
    durationMs: 0,
    ...extra
  });

  try {
    const fixtureText = await readFile("fixtures/provider/mock-requests.jsonl", "utf8");
    const evidence = parseProviderRequestLog(fixtureText);
    assertEqual(evidence.requestCount, 2, "provider request count");
    assertEqual(evidence.providerDurationMs, 6700, "provider duration includes first through last response");
    assertEqual(evidence.firstByteLatencyMs, 15, "first byte latency");

    // A one-line timeline log: a single serialized diagnostics event.
    const timelineLine = JSON.stringify({
      schemaVersion: "openclaw.diagnostics.v1",
      type: "provider.request",
      timestamp: "2026-04-30T10:00:01.250Z",
      name: "provider.request",
      provider: "openai",
      operation: "responses.create",
      model: "gpt-5.5",
      durationMs: 350,
      ok: true
    });
    const timelineEvidence = parseTimelineProviderRequestLog(timelineLine);
    assertEqual(timelineEvidence.requestCount, 1, "timeline provider request count");
    assertEqual(timelineEvidence.providerDurationMs, 350, "timeline provider duration");
    assertEqual(timelineEvidence.requests[0]?.route, "responses.create", "timeline provider route");

    const commandWindow = {
      command: "ocm @kova -- agent --local --agent main --session-id kova --message hi --json",
      startedAt: "2026-04-30T10:00:01.000Z",
      startedAtEpochMs: 1777543201000,
      finishedAt: "2026-04-30T10:00:07.000Z",
      finishedAtEpochMs: 1777543207000
    };
    const availableEvidence = { ...evidence, available: true };
    const attribution = computeProviderTurnAttribution(commandWindow, availableEvidence);
    assertEqual(attribution.preProviderMs, 5000, "pre-provider latency");
    assertEqual(attribution.providerFinalMs, 800, "provider final latency");
    assertEqual(attribution.postProviderMs, 200, "post-provider latency");
    assertEqual(evidence.usage?.available, true, "provider usage availability");
    assertEqual(evidence.usage?.totalTokens, 12, "provider usage total tokens");

    return verdict("PASS");
  } catch (error) {
    return verdict("FAIL", { message: error.message });
  }
}

/**
 * Self-check: an executed run with live API-key auth never leaks the key.
 *
 * Creates a Kova home whose `credentials/providers.json` declares OpenAI with the
 * `api-key` method and whose `credentials/live.env` (mode 0600) holds a synthetic secret,
 * installs the `fakeOcmScript()` mock as `ocm`, and runs
 * `kova run --auth live --execute`. It then verifies that:
 *   - the JSON report text does not contain the secret,
 *   - report and record auth metadata describe live / api-key / openclaw-onboard auth,
 *     flagged as environment dependent, with `secretValues` equal to "redacted",
 *   - the OpenClaw config written under the fake OpenClaw home references the key by env
 *     var id (`OPENAI_API_KEY`) and does not contain the secret,
 *   - the captured stdout of the ` -- status` command contains "[REDACTED]" and not the secret.
 *
 * Fixture setup runs inside the `try`, so a filesystem or spawn failure is reported as a
 * FAIL result rather than rejecting the returned promise.
 *
 * @param {string} tmp Scratch directory that receives all fixture directories and files.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `durationMs` is 0 when the command never ran.
 */
async function liveApiKeyExecutionCheck(tmp) {
  const id = "live-api-key-execution";
  const home = join(tmp, "live-api-key-home");
  const reportDir = join(tmp, "live-api-key-report");
  const openclawHome = join(tmp, "live-api-key-openclaw-home");
  const binDir = join(tmp, "live-api-key-bin");
  const ocmLog = join(tmp, "live-api-key-ocm.log");
  const secret = "kova-live-secret-selfcheck";
  // Environment is passed as shell-style assignments prefixed to the command line.
  const command = [
    `KOVA_HOME=${quoteShell(home)}`,
    `PATH=${quoteShell(`${binDir}:${process.env.PATH}`)}`,
    `KOVA_FAKE_OPENCLAW_HOME=${quoteShell(openclawHome)}`,
    `KOVA_MOCK_OCM_LOG=${quoteShell(ocmLog)}`,
    `node bin/kova.mjs run --target runtime:stable --scenario fresh-install --auth live --execute --report-dir ${quoteShell(reportDir)} --json`
  ].join(" ");
  // Stays undefined until the command has run, which lets the catch block distinguish a
  // setup failure (no duration available) from a failed assertion.
  let result;

  try {
    await mkdir(join(home, "credentials"), { recursive: true });
    await mkdir(binDir, { recursive: true });
    await writeFile(join(home, "credentials", "providers.json"), `${JSON.stringify({
      schemaVersion: "kova.credentials.providers.v1",
      defaultProvider: "openai",
      providers: {
        openai: {
          id: "openai",
          method: "api-key",
          envVars: ["OPENAI_API_KEY"],
          externalCli: null,
          fallbackPolicy: "mock",
          configuredAt: new Date().toISOString()
        }
      }
    }, null, 2)}\n`, "utf8");
    await writeFile(join(home, "credentials", "live.env"), `OPENAI_API_KEY=${secret}\n`, { encoding: "utf8", mode: 0o600 });
    await writeFile(join(binDir, "ocm"), fakeOcmScript(), "utf8");
    await chmod(join(binDir, "ocm"), 0o755);

    result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000, redactValues: [secret] });
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const receipt = JSON.parse(result.stdout);

    // Scan the raw report text before parsing so a leak anywhere in the file is caught.
    const reportText = await readFile(receipt.jsonPath, "utf8");
    if (reportText.includes(secret)) {
      throw new Error("live API key leaked into JSON report");
    }
    const report = JSON.parse(reportText);
    const record = report.records?.[0];
    assertEqual(report.auth?.requestedMode, "live", "report requested live auth");
    assertEqual(report.auth?.live?.environmentDependent, true, "top-level live env-dependent flag");
    assertEqual(record?.auth?.mode, "live", "record live auth mode");
    assertEqual(record?.auth?.source, "api-key", "record live auth source");
    assertEqual(record?.auth?.setupKind, "openclaw-onboard", "record live setup kind");
    assertEqual(record?.auth?.environmentDependent, true, "record live env-dependent flag");
    assertEqual(record?.auth?.secretValues, "redacted", "record secret values redacted");
    assertEqual(record?.providerEvidence?.environmentDependent, true, "provider evidence live env-dependent flag");

    const config = JSON.parse(await readFile(join(openclawHome, ".openclaw", "openclaw.json"), "utf8"));
    assertEqual(config.models?.providers?.openai?.apiKey?.id, "OPENAI_API_KEY", "OpenClaw live config env ref");
    const serializedConfig = JSON.stringify(config);
    if (serializedConfig.includes(secret)) {
      throw new Error("live API key leaked into OpenClaw config");
    }

    // The mock echoes "live command key=$OPENAI_API_KEY" for this command, so its recorded
    // stdout must show the redaction marker instead of the secret.
    const statusResult = record.phases
      ?.flatMap((phase) => phase.results ?? [])
      ?.find((item) => item.command.includes(" -- status"));
    if (!statusResult || statusResult.stdout.includes(secret) || !statusResult.stdout.includes("[REDACTED]")) {
      throw new Error("live command env was not redacted in command output");
    }
    return {
      id,
      status: "PASS",
      command,
      durationMs: result.durationMs
    };
  } catch (error) {
    return {
      id,
      status: "FAIL",
      command,
      durationMs: result ? result.durationMs : 0,
      message: error.message
    };
  }
}

/**
 * Self-check: a run without `--execute`, using live auth through the `codex` external CLI.
 *
 * Creates a fake HOME containing `.codex/auth.json`, a stub `codex` executable first on
 * PATH, and a Kova home whose `providers.json` declares OpenAI with the `external-cli`
 * method and an empty `live.env`. It runs `kova run --auth live` and verifies that:
 *   - the report records live auth via the verified `external-cli` method,
 *   - the record names `codex` as the external CLI with setup kind `fixture-config-patch`,
 *   - one planned phase command invokes `configure-openclaw-live-auth.mjs` with
 *     `--auth-method external-cli` and `--external-cli codex` (optionally shell-quoted).
 *
 * Fixture setup runs inside the `try`, so a filesystem or spawn failure is reported as a
 * FAIL result rather than rejecting the returned promise.
 *
 * @param {string} tmp Scratch directory that receives all fixture directories and files.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `durationMs` is 0 when the command never ran.
 */
async function liveExternalCliDryRunCheck(tmp) {
  const id = "live-external-cli-dry-run";
  const home = join(tmp, "live-external-cli-home");
  const kovaHome = join(tmp, "live-external-cli-kova-home");
  const fakeBin = join(tmp, "live-external-cli-bin");
  const reportDir = join(tmp, "live-external-cli-report");
  // Environment is passed as shell-style assignments prefixed to the command line.
  const command = [
    `HOME=${quoteShell(home)}`,
    `PATH=${quoteShell(`${fakeBin}:${process.env.PATH}`)}`,
    `KOVA_HOME=${quoteShell(kovaHome)}`,
    `node bin/kova.mjs run --target runtime:stable --scenario fresh-install --auth live --report-dir ${quoteShell(reportDir)} --json`
  ].join(" ");
  // Stays undefined until the command has run, which lets the catch block distinguish a
  // setup failure (no duration available) from a failed assertion.
  let result;

  try {
    await mkdir(join(home, ".codex"), { recursive: true });
    await mkdir(join(kovaHome, "credentials"), { recursive: true });
    await mkdir(fakeBin, { recursive: true });
    await writeFile(join(home, ".codex", "auth.json"), "{\"tokens\":{\"access_token\":\"redacted\"}}\n", "utf8");
    await writeFile(join(fakeBin, "codex"), "#!/bin/sh\necho codex-selfcheck\n", "utf8");
    await chmod(join(fakeBin, "codex"), 0o755);
    await writeFile(join(kovaHome, "credentials", "providers.json"), `${JSON.stringify({
      schemaVersion: "kova.credentials.providers.v1",
      defaultProvider: "openai",
      providers: {
        openai: {
          id: "openai",
          method: "external-cli",
          envVars: [],
          externalCli: "codex",
          fallbackPolicy: "mock",
          configuredAt: new Date().toISOString()
        }
      }
    }, null, 2)}\n`, "utf8");
    await writeFile(join(kovaHome, "credentials", "live.env"), "", { encoding: "utf8", mode: 0o600 });

    result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const receipt = JSON.parse(result.stdout);
    const report = JSON.parse(await readFile(receipt.jsonPath, "utf8"));
    const record = report.records?.[0];
    assertEqual(report.auth?.requestedMode, "live", "external cli requested live auth");
    assertEqual(report.auth?.live?.method, "external-cli", "external cli live method");
    assertEqual(report.auth?.live?.verification?.verified, true, "external cli verification");
    assertEqual(record?.auth?.mode, "live", "external cli record live mode");
    assertEqual(record?.auth?.source, "external-cli", "external cli record source");
    assertEqual(record?.auth?.externalCli, "codex", "external cli record name");
    assertEqual(record?.auth?.setupKind, "fixture-config-patch", "codex cli fixture setup kind");

    // Look through the planned phase commands (strings) for the auth setup step.
    const authSetupCommand = record.phases
      ?.flatMap((phase) => phase.commands ?? [])
      ?.find((item) => item.includes("configure-openclaw-live-auth.mjs")) ?? "";
    if (!/'?--auth-method'?\s+'?external-cli'?/.test(authSetupCommand) || !/'?--external-cli'?\s+'?codex'?/.test(authSetupCommand)) {
      throw new Error(`external-cli auth setup command missing expected args: ${authSetupCommand}`);
    }
    return {
      id,
      status: "PASS",
      command,
      durationMs: result.durationMs
    };
  } catch (error) {
    return {
      id,
      status: "FAIL",
      command,
      durationMs: result ? result.durationMs : 0,
      message: error.message
    };
  }
}

/**
 * Self-check: live auth falls back from `env-only` to the external CLI.
 *
 * Creates a fake HOME containing `.codex/auth.json`, a stub `codex` executable first on
 * PATH, and a Kova home whose `providers.json` declares OpenAI with the `env-only` method
 * (env var `OPENAI_API_KEY`) and fallback policy `external-cli`; `live.env` is written
 * empty. It runs `kova run --auth live` (without `--execute`) and verifies that both the
 * report and the record describe `external-cli` auth that fell back from `env-only`, with
 * `codex` as the CLI.
 *
 * NOTE(review): the command line does not clear `OPENAI_API_KEY`, so this presumably
 * relies on the variable being absent from the inherited environment — confirm.
 *
 * Fixture setup runs inside the `try`, so a filesystem or spawn failure is reported as a
 * FAIL result rather than rejecting the returned promise.
 *
 * @param {string} tmp Scratch directory that receives all fixture directories and files.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `durationMs` is 0 when the command never ran.
 */
async function liveExternalCliFallbackCheck(tmp) {
  const id = "live-external-cli-fallback";
  const home = join(tmp, "live-external-cli-fallback-home");
  const kovaHome = join(tmp, "live-external-cli-fallback-kova-home");
  const fakeBin = join(tmp, "live-external-cli-fallback-bin");
  const reportDir = join(tmp, "live-external-cli-fallback-report");
  // Environment is passed as shell-style assignments prefixed to the command line.
  const command = [
    `HOME=${quoteShell(home)}`,
    `PATH=${quoteShell(`${fakeBin}:${process.env.PATH}`)}`,
    `KOVA_HOME=${quoteShell(kovaHome)}`,
    `node bin/kova.mjs run --target runtime:stable --scenario fresh-install --auth live --report-dir ${quoteShell(reportDir)} --json`
  ].join(" ");
  // Stays undefined until the command has run, which lets the catch block distinguish a
  // setup failure (no duration available) from a failed assertion.
  let result;

  try {
    await mkdir(join(home, ".codex"), { recursive: true });
    await mkdir(join(kovaHome, "credentials"), { recursive: true });
    await mkdir(fakeBin, { recursive: true });
    await writeFile(join(home, ".codex", "auth.json"), "{\"tokens\":{\"access_token\":\"redacted\"}}\n", "utf8");
    await writeFile(join(fakeBin, "codex"), "#!/bin/sh\necho codex-selfcheck\n", "utf8");
    await chmod(join(fakeBin, "codex"), 0o755);
    await writeFile(join(kovaHome, "credentials", "providers.json"), `${JSON.stringify({
      schemaVersion: "kova.credentials.providers.v1",
      defaultProvider: "openai",
      providers: {
        openai: {
          id: "openai",
          method: "env-only",
          envVars: ["OPENAI_API_KEY"],
          externalCli: null,
          fallbackPolicy: "external-cli",
          configuredAt: new Date().toISOString()
        }
      }
    }, null, 2)}\n`, "utf8");
    await writeFile(join(kovaHome, "credentials", "live.env"), "", { encoding: "utf8", mode: 0o600 });

    result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const receipt = JSON.parse(result.stdout);
    const report = JSON.parse(await readFile(receipt.jsonPath, "utf8"));
    const record = report.records?.[0];
    assertEqual(report.auth?.live?.method, "external-cli", "fallback live method");
    assertEqual(report.auth?.live?.fallbackFrom, "env-only", "fallback source method");
    assertEqual(report.auth?.live?.fallbackPolicy, "external-cli", "fallback policy");
    assertEqual(record?.auth?.source, "external-cli", "record fallback source");
    assertEqual(record?.auth?.fallbackFrom, "env-only", "record fallback from");
    assertEqual(record?.auth?.externalCli, "codex", "record fallback CLI");
    return {
      id,
      status: "PASS",
      command,
      durationMs: result.durationMs
    };
  } catch (error) {
    return {
      id,
      status: "FAIL",
      command,
      durationMs: result ? result.durationMs : 0,
      message: error.message
    };
  }
}

/**
 * Self-check: a run without `--execute`, using live Anthropic auth through the `claude`
 * external CLI.
 *
 * Creates a fake HOME containing `.claude/.credentials.json`, a stub `claude` executable
 * first on PATH, and a Kova home whose `providers.json` declares Anthropic with the
 * `external-cli` method and an empty `live.env`. It runs `kova run --auth live` and
 * verifies that:
 *   - the report records the `external-cli` method with `claude` as the CLI,
 *   - the record is live, for provider `anthropic`, with setup kind `openclaw-onboard`,
 *   - one planned phase command contains "onboard" together with `--auth-choice` and
 *     `anthropic-cli`.
 *
 * Fixture setup runs inside the `try`, so a filesystem or spawn failure is reported as a
 * FAIL result rather than rejecting the returned promise.
 *
 * @param {string} tmp Scratch directory that receives all fixture directories and files.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Check result; `durationMs` is 0 when the command never ran.
 */
async function liveAnthropicExternalCliDryRunCheck(tmp) {
  const id = "live-anthropic-external-cli-dry-run";
  const home = join(tmp, "live-anthropic-cli-home");
  const kovaHome = join(tmp, "live-anthropic-cli-kova-home");
  const fakeBin = join(tmp, "live-anthropic-cli-bin");
  const reportDir = join(tmp, "live-anthropic-cli-report");
  // Environment is passed as shell-style assignments prefixed to the command line.
  const command = [
    `HOME=${quoteShell(home)}`,
    `PATH=${quoteShell(`${fakeBin}:${process.env.PATH}`)}`,
    `KOVA_HOME=${quoteShell(kovaHome)}`,
    `node bin/kova.mjs run --target runtime:stable --scenario fresh-install --auth live --report-dir ${quoteShell(reportDir)} --json`
  ].join(" ");
  // Stays undefined until the command has run, which lets the catch block distinguish a
  // setup failure (no duration available) from a failed assertion.
  let result;

  try {
    await mkdir(join(home, ".claude"), { recursive: true });
    await mkdir(join(kovaHome, "credentials"), { recursive: true });
    await mkdir(fakeBin, { recursive: true });
    await writeFile(join(home, ".claude", ".credentials.json"), "{\"claudeAiOauth\":{\"accessToken\":\"redacted\"}}\n", "utf8");
    await writeFile(join(fakeBin, "claude"), "#!/bin/sh\necho claude-selfcheck\n", "utf8");
    await chmod(join(fakeBin, "claude"), 0o755);
    await writeFile(join(kovaHome, "credentials", "providers.json"), `${JSON.stringify({
      schemaVersion: "kova.credentials.providers.v1",
      defaultProvider: "anthropic",
      providers: {
        anthropic: {
          id: "anthropic",
          method: "external-cli",
          envVars: [],
          externalCli: "claude",
          fallbackPolicy: "mock",
          configuredAt: new Date().toISOString()
        }
      }
    }, null, 2)}\n`, "utf8");
    await writeFile(join(kovaHome, "credentials", "live.env"), "", { encoding: "utf8", mode: 0o600 });

    result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const receipt = JSON.parse(result.stdout);
    const report = JSON.parse(await readFile(receipt.jsonPath, "utf8"));
    const record = report.records?.[0];
    assertEqual(report.auth?.live?.method, "external-cli", "anthropic external cli live method");
    assertEqual(report.auth?.live?.externalCli, "claude", "anthropic external cli name");
    assertEqual(record?.auth?.mode, "live", "anthropic cli record live mode");
    assertEqual(record?.auth?.providerId, "anthropic", "anthropic cli provider");
    assertEqual(record?.auth?.setupKind, "openclaw-onboard", "anthropic cli onboard setup");

    // Look through the planned phase commands (strings) for the onboard step.
    const authSetupCommand = record.phases
      ?.flatMap((phase) => phase.commands ?? [])
      ?.find((item) => item.includes("onboard")) ?? "";
    if (!authSetupCommand.includes("--auth-choice") || !authSetupCommand.includes("anthropic-cli")) {
      throw new Error(`anthropic external-cli auth setup command missing OpenClaw onboard path: ${authSetupCommand}`);
    }
    return {
      id,
      status: "PASS",
      command,
      durationMs: result.durationMs
    };
  } catch (error) {
    return {
      id,
      status: "FAIL",
      command,
      durationMs: result ? result.durationMs : 0,
      message: error.message
    };
  }
}

/**
 * Returns the source of a POSIX `sh` script that stands in for the `ocm` CLI.
 *
 * The script appends its argument list to the file named by `$KOVA_MOCK_OCM_LOG`, then
 * dispatches first on the two-word form (`service status`, `env exec`, `env destroy`) and
 * then on the first word (`start`, `logs`, `@<env>`, `--version`). `@<env> … onboard`
 * writes a canned `openclaw.json` under `$KOVA_FAKE_OPENCLAW_HOME/.openclaw`, chosen by
 * the `--auth-choice` value; any other `@<env>` command prints
 * `live command key=$OPENAI_API_KEY`. Anything unhandled exits with status 2.
 *
 * @returns {string} Script text, ending in a newline.
 */
function fakeOcmScript() {
  // Shebang plus invocation logging.
  const prologue = `#!/bin/sh
printf '%s\\n' "$*" >> "$KOVA_MOCK_OCM_LOG"
`;

  // Dispatch on "<command>:<subcommand>".
  const subcommandDispatch = `case "$1:$2" in
  service:status) echo '{"running":false,"desiredRunning":false,"childPid":null,"gatewayPort":null,"gatewayState":"stopped"}'; exit 0 ;;
  env:exec)
    env_name="$3"
    shift 4
    OPENCLAW_HOME="$KOVA_FAKE_OPENCLAW_HOME" "$@"
    exit $?
    ;;
  env:destroy) echo '{"destroyed":true}'; exit 0 ;;
esac
`;

  // Dispatch on the first word alone, including the "@<env>" passthrough form.
  const commandDispatch = `case "$1" in
  start) echo '{"ok":true}'; exit 0 ;;
  logs) exit 0 ;;
  @*)
    env_name="$1"
    shift
    if [ "$1" = "--" ]; then shift; fi
    if [ "$1" = "onboard" ]; then
      mkdir -p "$KOVA_FAKE_OPENCLAW_HOME/.openclaw"
      case " $* " in
        *" --auth-choice openai-api-key "*)
          cat > "$KOVA_FAKE_OPENCLAW_HOME/.openclaw/openclaw.json" <<'JSON'
{"models":{"mode":"merge","providers":{"openai":{"apiKey":{"source":"env","provider":"default","id":"OPENAI_API_KEY"},"models":[{"id":"gpt-5.5","name":"gpt-5.5","api":"openai-responses"}]}}},"agents":{"defaults":{"model":{"primary":"openai/gpt-5.5"}}}}
JSON
          ;;
        *" --auth-choice apiKey "*)
          cat > "$KOVA_FAKE_OPENCLAW_HOME/.openclaw/openclaw.json" <<'JSON'
{"models":{"mode":"merge","providers":{"anthropic":{"apiKey":{"source":"env","provider":"default","id":"ANTHROPIC_API_KEY"},"models":[{"id":"claude-sonnet-4-5","name":"claude-sonnet-4-5"}]}}},"agents":{"defaults":{"model":{"primary":"anthropic/claude-sonnet-4-5"}}}}
JSON
          ;;
        *" --auth-choice anthropic-cli "*)
          cat > "$KOVA_FAKE_OPENCLAW_HOME/.openclaw/openclaw.json" <<'JSON'
{"agents":{"defaults":{"model":{"primary":"claude-cli/claude-sonnet-4-5"},"agentRuntime":{"id":"claude-cli","fallback":"none"}}}}
JSON
          ;;
      esac
      echo '{"ok":true}'
      exit 0
    fi
    echo "live command key=$OPENAI_API_KEY"
    exit 0
    ;;
  --version) echo 'mock-ocm'; exit 0 ;;
esac
`;

  // Anything that reached this point was not recognised.
  const unhandled = `echo "unhandled mock ocm command: $*" >&2
exit 2
`;

  return [prologue, subcommandDispatch, commandDispatch, unhandled].join("");
}

/**
 * Self-check for agent turn phase breakdowns and their use in record evaluation.
 *
 * Builds five synthetic turns with `syntheticTurn` (normal, pre-provider stall, provider
 * stall, cleanup stall, missing timeline) and asserts the bucket values on each turn's
 * `breakdown`. It then wraps the normal and cleanup-stall turns in synthetic records,
 * runs `evaluateRecord` on them (which fills in `record.measurements` and may change
 * `record.status` in place), and checks the derived measurements, the rendered Markdown
 * report, and the slow-cleanup diagnosis.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   Check result; `status` is "PASS" or "FAIL" and `message` is present only on failure.
 */
function agentTurnBreakdownCheck() {
  try {
    // Normal turn: 200ms before the first provider request, 400ms of provider time,
    // 400ms after the last provider response.
    const normal = syntheticTurn({
      startedAtEpochMs: 1000,
      firstProviderRequestAtEpochMs: 1200,
      firstByteLatencyMs: 15,
      firstChunkLatencyMs: 18,
      lastProviderResponseAtEpochMs: 1600,
      finishedAtEpochMs: 2000,
      timelineSummary: {
        available: true,
        spanTotals: {
          "agent.prepare": { count: 1, totalDurationMs: 90, maxDurationMs: 90 },
          "models.catalog.gateway": { count: 1, totalDurationMs: 70, maxDurationMs: 70 },
          "channel.plugin.load": { count: 1, totalDurationMs: 25, maxDurationMs: 25 }
        },
        keySpans: {}
      }
    });
    assertEqual(normal.breakdown.buckets.preProviderOpenClawMs, 200, "normal pre-provider bucket");
    assertEqual(normal.breakdown.buckets.providerMs, 400, "normal provider bucket");
    assertEqual(normal.breakdown.buckets.postProviderMs, 400, "normal post-provider bucket");
    // The three spans above total 185ms; presumably the 15ms expected here is the part of
    // the 200ms pre-provider window they do not cover.
    assertEqual(normal.breakdown.buckets.unknownMs, 15, "normal unattributed pre-provider bucket");
    assertEqual(normal.breakdown.provider.firstByteLatencyMs, 15, "normal first byte latency");
    assertEqual(normal.breakdown.sourceSpans.categories.modelCatalog.totalDurationMs, 70, "model catalog source span");

    // Pre-provider stall with no timeline at all: the whole 61s gap is expected as unknown.
    const preProviderStall = syntheticTurn({
      startedAtEpochMs: 1000,
      firstProviderRequestAtEpochMs: 62000,
      lastProviderResponseAtEpochMs: 62800,
      finishedAtEpochMs: 63000,
      timelineSummary: null
    });
    assertEqual(preProviderStall.breakdown.evidenceQuality, "outside-in-only", "pre-provider missing timeline quality");
    assertEqual(preProviderStall.breakdown.buckets.preProviderOpenClawMs, 61000, "pre-provider stall bucket");
    assertEqual(preProviderStall.breakdown.buckets.unknownMs, 61000, "pre-provider stall unknown");

    // Provider stall: 20s between first provider request and last provider response.
    const providerStall = syntheticTurn({
      startedAtEpochMs: 1000,
      firstProviderRequestAtEpochMs: 1500,
      lastProviderResponseAtEpochMs: 21500,
      finishedAtEpochMs: 22000,
      timelineSummary: null
    });
    assertEqual(providerStall.breakdown.buckets.providerMs, 20000, "provider stall bucket");
    assertEqual(providerStall.breakdown.buckets.unknownMs, 500, "provider stall unknown pre-provider");

    // Cleanup stall: a single 74s `agent.cleanup` span after the provider has responded.
    const cleanupStall = syntheticTurn({
      startedAtEpochMs: 1000,
      firstProviderRequestAtEpochMs: 1500,
      lastProviderResponseAtEpochMs: 1800,
      finishedAtEpochMs: 77000,
      timelineSummary: {
        available: true,
        spanTotals: {
          "agent.cleanup": { count: 1, totalDurationMs: 74000, maxDurationMs: 74000 }
        },
        keySpans: {}
      }
    });
    assertEqual(cleanupStall.breakdown.buckets.cleanupMs, 74000, "cleanup stall bucket");
    assertEqual(cleanupStall.breakdown.sourceSpans.categories.agentCleanup.totalDurationMs, 74000, "cleanup source span");

    // A timeline summary that is present but flagged unavailable is expected to yield the
    // same evidence quality as a null summary.
    const missingTimeline = syntheticTurn({
      startedAtEpochMs: 1000,
      firstProviderRequestAtEpochMs: 1500,
      lastProviderResponseAtEpochMs: 1800,
      finishedAtEpochMs: 1900,
      timelineSummary: { available: false, spanTotals: {}, keySpans: {} }
    });
    assertEqual(missingTimeline.breakdown.evidenceQuality, "outside-in-only", "missing timeline fallback quality");
    assertEqual(missingTimeline.breakdown.buckets.unknownMs, 500, "missing timeline unknown");

    // Synthetic record wrapping the normal turn; `evaluateRecord` below adds `measurements` to it.
    const record = {
      scenario: "agent-cold-warm-message",
      title: "Agent cold/warm message",
      status: "PASS",
      cleanup: "done",
      phases: [{
        id: "cold-agent-turn",
        title: "Cold agent turn",
        intent: "Synthetic self-check",
        commands: [normal.result.command],
        evidence: [],
        results: [{
          ...normal.result,
          status: 0,
          timedOut: false,
          stdout: "{\"finalAssistantVisibleText\":\"KOVA_AGENT_OK\"}",
          stderr: ""
        }],
        metrics: {
          logs: zeroLogMetrics(),
          health: { ok: true },
          timeline: {
            available: true,
            eventCount: 3,
            parseErrorCount: 0,
            spanTotals: {
              "agent.prepare": { count: 1, totalDurationMs: 90, maxDurationMs: 90 },
              "models.catalog.gateway": { count: 1, totalDurationMs: 70, maxDurationMs: 70 }
            },
            keySpans: {}
          }
        }
      }],
      providerEvidence: {
        available: true,
        requestCount: 1,
        requests: [normal.request]
      },
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics()
      }
    };
    evaluateRecord(record, {
      id: "agent-cold-warm-message",
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: {}
    }, { surface: { thresholds: {} }, targetPlan: { kind: "local-build" } });
    assertEqual(record.measurements.agentTurnStats?.count, 1, "agent turn stats count");
    assertEqual(record.measurements.agentTurnP95Ms, 1000, "agent turn p95");
    assertEqual(record.measurements.agentPreProviderP95Ms, 200, "agent pre-provider p95");
    // The evaluated record must also render into the Markdown report with its breakdown.
    const rendered = renderMarkdownReport({
      generatedAt: "2026-05-01T00:00:00.000Z",
      runId: "self-check-agent-turn-breakdown",
      mode: "self-check",
      target: "runtime:stable",
      platform: { os: "test", release: "test", arch: "test", node: "test" },
      records: [record],
      summary: { statuses: { PASS: 1 } }
    });
    assertEqual(rendered.includes("breakdown:"), true, "markdown includes agent turn breakdown");
    assertEqual(rendered.includes("models.catalog.* 70ms"), true, "markdown includes source span evidence");
    assertEqual(rendered.includes("Agent turn stats:"), true, "markdown includes agent turn stats");
    assertEqual(
      summarizeAgentTurnBreakdownForMarkdown(normal.breakdown).includes("unknown 15ms"),
      true,
      "breakdown markdown helper includes unknown bucket"
    );

    // Second record wraps the cleanup-stall turn. It starts as PASS and is expected to be
    // flipped to FAIL by `evaluateRecord` because of the 5000ms `agentCleanupMs` threshold.
    const cleanupRecord = {
      scenario: "agent-cold-warm-message",
      title: "Agent cleanup stall",
      status: "PASS",
      cleanup: "done",
      phases: [{
        id: "cleanup-agent-turn",
        title: "Cleanup agent turn",
        intent: "Synthetic cleanup stall",
        commands: [cleanupStall.result.command],
        evidence: [],
        results: [{
          ...cleanupStall.result,
          status: 0,
          timedOut: false,
          stdout: "{\"finalAssistantVisibleText\":\"KOVA_AGENT_OK\"}",
          stderr: ""
        }],
        metrics: {
          logs: zeroLogMetrics(),
          health: { ok: true },
          timeline: {
            available: true,
            eventCount: 1,
            parseErrorCount: 0,
            spanTotals: {
              "agent.cleanup": { count: 1, totalDurationMs: 74000, maxDurationMs: 74000 }
            },
            keySpans: {}
          }
        }
      }],
      providerEvidence: {
        available: true,
        requestCount: 1,
        requests: [cleanupStall.request]
      },
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics()
      }
    };
    evaluateRecord(cleanupRecord, {
      id: "agent-cold-warm-message",
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: { agentCleanupMs: 5000 }
    }, { surface: { thresholds: {} }, targetPlan: { kind: "local-build" } });
    assertEqual(cleanupRecord.status, "FAIL", "cleanup stall should fail");
    assertEqual(cleanupRecord.measurements.agentCleanupMaxMs, 74000, "agent cleanup max measurement");
    assertEqual(cleanupRecord.measurements.agentCleanupDiagnosis.kind, "slow-agent-cleanup", "agent cleanup diagnosis");
    assertEqual(
      cleanupRecord.measurements.agentFailureFixerSummary.items.some((item) => item.kind === "slow-agent-cleanup"),
      true,
      "slow cleanup fixer evidence"
    );

    return {
      id: "agent-turn-breakdown",
      status: "PASS",
      command: "evaluate synthetic agent turn phase breakdowns",
      durationMs: 0
    };
  } catch (error) {
    // Any failed assertion or unexpected exception above becomes a FAIL result.
    return {
      id: "agent-turn-breakdown",
      status: "FAIL",
      command: "evaluate synthetic agent turn phase breakdowns",
      durationMs: 0,
      message: error.message
    };
  }
}

/**
 * Self-check: evaluate a synthetic Gateway session cold/warm record and verify
 * that the measurements are derived from the active turn window reported in
 * each command's stdout payload rather than from the raw command duration.
 *
 * The check also renders the evaluated record to markdown and looks for the
 * Gateway session detail strings, then evaluates a second record whose payload
 * reports a "shell" transport and expects that one to be marked FAIL.
 *
 * Never throws: any error (including a failed assertion) is caught and
 * reported through the returned object.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A check result with status "PASS", or "FAIL" plus the error message.
 */
function gatewaySessionTurnEvaluationCheck() {
  try {
    // Fixed epoch (ms); every timestamp in the fixture is an offset from it.
    const base = 1777536000000;
    // Stdout payload of the cold turn: creates the session, active window is
    // base+1000 .. base+2500 (1500 ms) inside a 5000 ms command.
    const coldPayload = {
      ok: true,
      surface: "gateway-session-send-turn",
      method: "sessions.send",
      createSession: true,
      minAssistantCount: 1,
      sessionKey: "kova-gateway-session-send",
      runId: "cold-run",
      gatewayTransport: { kind: "direct-gateway-rpc", fallbackReason: null },
      activeStartedAtEpochMs: base + 1000,
      activeFinishedAtEpochMs: base + 2500,
      activeTurnMs: 1500,
      sessionCreateDurationMs: 100,
      sendStartedAtEpochMs: base + 1000,
      sendFinishedAtEpochMs: base + 1040,
      sendDurationMs: 40,
      assistantFirstSeenAtEpochMs: base + 2200,
      assistantMatchedAtEpochMs: base + 2500,
      timeToFirstAssistantMs: 1200,
      timeToMatchedAssistantMs: 1500,
      historyPollCount: 3,
      historyErrorCount: 0,
      assistantMessageCount: 1,
      finalAssistantVisibleText: "KOVA_AGENT_OK",
      expectedTextPresent: true
    };
    // Stdout payload of the warm turn: reuses the session, active window is
    // base+11000 .. base+11800 (800 ms) inside a 4000 ms command.
    const warmPayload = {
      ok: true,
      surface: "gateway-session-send-turn",
      method: "sessions.send",
      createSession: false,
      minAssistantCount: 2,
      sessionKey: "kova-gateway-session-send",
      runId: "warm-run",
      gatewayTransport: { kind: "direct-gateway-rpc", fallbackReason: null },
      activeStartedAtEpochMs: base + 11000,
      activeFinishedAtEpochMs: base + 11800,
      activeTurnMs: 800,
      sessionCreateDurationMs: null,
      sendStartedAtEpochMs: base + 11000,
      sendFinishedAtEpochMs: base + 11050,
      sendDurationMs: 50,
      assistantFirstSeenAtEpochMs: base + 11600,
      assistantMatchedAtEpochMs: base + 11800,
      timeToFirstAssistantMs: 600,
      timeToMatchedAssistantMs: 800,
      historyPollCount: 2,
      historyErrorCount: 0,
      assistantMessageCount: 2,
      finalAssistantVisibleText: "KOVA_AGENT_OK",
      expectedTextPresent: true
    };
    // Synthetic record handed to evaluateRecord; it is read back afterwards
    // through record.status and record.measurements.
    const record = {
      scenario: "gateway-session-send-turn",
      surface: "gateway-session-send-turn",
      title: "Gateway session cold/warm",
      status: "PASS",
      cleanup: "done",
      auth: { mode: "mock" },
      phases: [
        {
          id: "cold-gateway-session-turn",
          title: "Cold Gateway Session Turn",
          intent: "Synthetic cold Gateway session turn",
          commands: ["node support/run-gateway-session-send-turn.mjs --create-session true"],
          evidence: [],
          results: [{
            command: "node support/run-gateway-session-send-turn.mjs --create-session true",
            status: 0,
            timedOut: false,
            startedAt: new Date(base).toISOString(),
            startedAtEpochMs: base,
            finishedAt: new Date(base + 5000).toISOString(),
            finishedAtEpochMs: base + 5000,
            durationMs: 5000,
            stdout: JSON.stringify(coldPayload),
            stderr: ""
          }],
          metrics: { logs: zeroLogMetrics(), health: { ok: true } }
        },
        {
          id: "warm-gateway-session-turn",
          title: "Warm Gateway Session Turn",
          intent: "Synthetic warm Gateway session turn",
          commands: ["node support/run-gateway-session-send-turn.mjs --create-session false"],
          evidence: [],
          results: [{
            command: "node support/run-gateway-session-send-turn.mjs --create-session false",
            status: 0,
            timedOut: false,
            startedAt: new Date(base + 10000).toISOString(),
            startedAtEpochMs: base + 10000,
            finishedAt: new Date(base + 14000).toISOString(),
            finishedAtEpochMs: base + 14000,
            durationMs: 4000,
            stdout: JSON.stringify(warmPayload),
            stderr: ""
          }],
          metrics: { logs: zeroLogMetrics(), health: { ok: true } }
        }
      ],
      // One provider request per turn: cold is received 200 ms after the cold
      // active start and lasts 600 ms; warm is received 250 ms after the warm
      // active start and lasts 350 ms.
      providerEvidence: {
        available: true,
        requestCount: 2,
        requests: [
          {
            requestId: "cold-provider",
            receivedAt: new Date(base + 1200).toISOString(),
            receivedAtEpochMs: base + 1200,
            respondedAt: new Date(base + 1800).toISOString(),
            respondedAtEpochMs: base + 1800,
            firstByteLatencyMs: 25,
            firstChunkLatencyMs: 30,
            route: "/v1/responses",
            model: "gpt-5.5",
            status: 200
          },
          {
            requestId: "warm-provider",
            receivedAt: new Date(base + 11250).toISOString(),
            receivedAtEpochMs: base + 11250,
            respondedAt: new Date(base + 11600).toISOString(),
            respondedAtEpochMs: base + 11600,
            firstByteLatencyMs: 20,
            firstChunkLatencyMs: 22,
            route: "/v1/responses",
            model: "gpt-5.5",
            status: 200
          }
        ]
      },
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics(),
        timeline: {
          available: true,
          eventCount: 5,
          parseErrorCount: 0,
          // The scan at base+700 precedes the cold active window start
          // (base+1000). The totals asserted below (count 2, 44 ms) match only
          // the scans at base+1150 (33 ms) and base+11100 (11 ms).
          events: [
            { type: "span.end", name: "plugins.metadata.scan", timestamp: new Date(base + 700).toISOString(), durationMs: 99 },
            { type: "span.end", name: "plugins.metadata.scan", timestamp: new Date(base + 1150).toISOString(), durationMs: 33 },
            { type: "eventLoop.sample", name: "eventLoop.sample", timestamp: new Date(base + 1250).toISOString(), maxMs: 9 },
            { type: "span.end", name: "plugins.metadata.scan", timestamp: new Date(base + 11100).toISOString(), durationMs: 11 },
            { type: "eventLoop.sample", name: "eventLoop.sample", timestamp: new Date(base + 11200).toISOString(), maxMs: 7 }
          ],
          spanTotals: {},
          keySpans: {}
        }
      }
    };

    // Both active turn durations (1500 ms cold, 800 ms warm) sit under these
    // thresholds, so the record is expected to stay PASS.
    evaluateRecord(record, {
      id: "gateway-session-send-turn",
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: { agentTurnMs: 2000, coldAgentTurnMs: 2000, warmAgentTurnMs: 1000 }
    }, { surface: { thresholds: {} }, targetPlan: { kind: "runtime" } });

    assertEqual(record.status, "PASS", "gateway session active-window scenario status");
    assertEqual(record.measurements.coldAgentTurnMs, 1500, "cold gateway session active turn duration");
    assertEqual(record.measurements.warmAgentTurnMs, 800, "warm gateway session active turn duration");
    assertEqual(record.measurements.agentTurnMs, 1500, "agent turn max uses active turn duration");
    assertEqual(record.measurements.agentTurns[0].rawCommandDurationMs, 5000, "raw support command duration preserved");
    assertEqual(record.measurements.coldPreProviderMs, 200, "cold pre-provider uses active window");
    assertEqual(record.measurements.coldProviderFinalMs, 600, "cold provider duration");
    assertEqual(record.measurements.agentMetadataScanCount, 2, "active-window metadata scans");
    assertEqual(record.measurements.agentMetadataScanTotalMs, 44, "active-window metadata scan total");
    assertEqual(record.measurements.agentEventLoopMaxMs, 9, "active-window event-loop max");
    // 3 cold + 2 warm history polls.
    assertEqual(record.measurements.agentSessionPollCount, 5, "session polling total");
    assertEqual(record.measurements.agentTurns[1].gatewaySession.createSession, false, "warm turn reuses session");
    assertEqual(record.measurements.agentTurns[0].gatewaySession.gatewayTransportKind, "direct-gateway-rpc", "Gateway session direct Gateway transport");

    // Render the evaluated record and look for the Gateway session fragments.
    const rendered = renderMarkdownReport({
      generatedAt: "2026-05-01T00:00:00.000Z",
      runId: "self-check-gateway-session-turn",
      mode: "self-check",
      target: "runtime:stable",
      platform: { os: "test", release: "test", arch: "test", node: "test" },
      records: [record],
      summary: { statuses: { PASS: 1 } }
    });
    assertEqual(rendered.includes("gateway session:"), true, "markdown includes gateway session detail");
    assertEqual(rendered.includes("transport direct-gateway-rpc"), true, "markdown includes direct Gateway transport");
    assertEqual(rendered.includes("active window:"), true, "markdown includes active turn diagnostics");

    // Negative case: identical cold payload except that the transport reports
    // a shell fallback; evaluation is expected to reject it.
    const fallbackPayload = {
      ...coldPayload,
      gatewayTransport: { kind: "shell", fallbackReason: "gateway-token-unavailable" }
    };
    const fallbackRecord = {
      scenario: "gateway-session-send-turn",
      surface: "gateway-session-send-turn",
      title: "Gateway session shell fallback",
      status: "PASS",
      phases: [{
        id: "cold-gateway-session-turn",
        title: "Cold Gateway Session Turn",
        intent: "Synthetic shell fallback",
        commands: ["node support/run-gateway-session-send-turn.mjs --create-session true"],
        evidence: [],
        results: [{
          command: "node support/run-gateway-session-send-turn.mjs --create-session true",
          status: 0,
          timedOut: false,
          startedAt: new Date(base).toISOString(),
          startedAtEpochMs: base,
          finishedAt: new Date(base + 5000).toISOString(),
          finishedAtEpochMs: base + 5000,
          durationMs: 5000,
          stdout: JSON.stringify(fallbackPayload),
          stderr: ""
        }],
        metrics: { logs: zeroLogMetrics(), health: { ok: true } }
      }],
      providerEvidence: {
        available: true,
        requestCount: 1,
        // Reuses the cold provider request object from the first record.
        requests: [record.providerEvidence.requests[0]]
      },
      finalMetrics: { service: { gatewayState: "running" }, logs: zeroLogMetrics() }
    };
    evaluateRecord(fallbackRecord, {
      id: "gateway-session-send-turn",
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: {}
    }, { surface: { thresholds: {} }, targetPlan: { kind: "runtime" } });
    assertEqual(fallbackRecord.status, "FAIL", "gateway session shell fallback rejected");
    assertEqual(
      fallbackRecord.violations.some((violation) => violation.metric === "gatewayTransport.kind"),
      true,
      "gateway session shell fallback violation"
    );

    return {
      id: "gateway-session-turn-evaluation",
      status: "PASS",
      command: "evaluate synthetic Gateway session cold/warm active-turn attribution",
      durationMs: 0
    };
  } catch (error) {
    // Any thrown error is converted into a FAIL result carrying its message.
    return {
      id: "gateway-session-turn-evaluation",
      status: "FAIL",
      command: "evaluate synthetic Gateway session cold/warm active-turn attribution",
      durationMs: 0,
      message: error.message
    };
  }
}

/**
 * Self-check: Gateway session pre-provider timeline attribution.
 *
 * Steps, in order:
 *   1. Parse a synthetic JSONL timeline and check the retained attribution
 *      events and derived span intervals.
 *   2. Build the cold-turn attribution directly and check attributed vs.
 *      unattributed time, span summaries and artifact paths.
 *   3. Build the attribution with an unavailable timeline and check that the
 *      whole pre-provider time is reported as unattributed.
 *   4. Evaluate a full synthetic record and check the record-level metrics.
 *   5. Render markdown and check for the attribution table fragments.
 *
 * Never throws: any error (including a failed assertion) is caught and
 * reported through the returned object.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A check result with status "PASS", or "FAIL" plus the error message.
 */
function gatewaySessionPreProviderAttributionCheck() {
  try {
    // Fixed epoch (ms); every timestamp in the fixture is an offset from it.
    const base = 1777536000000;
    // 17 JSONL lines: 10 around the cold turn (base+1010 .. base+1250) and
    // 7 around the warm turn (base+11025 .. base+11250). Several spans overlap
    // on purpose (e.g. cold-load 1010-1070 vs cold-finalize 1060-1160), and
    // the cold-workspace error span ends at 1230, after the provider request
    // at 1200.
    const timelineText = [
      timelineEvent({ type: "span.start", name: "gateway.chat_send.load_session", timestamp: base + 1010, spanId: "cold-load" }),
      timelineEvent({ type: "span.end", name: "gateway.chat_send.load_session", timestamp: base + 1070, spanId: "cold-load", durationMs: 60 }),
      timelineEvent({ type: "span.start", name: "auto_reply.finalize_context", timestamp: base + 1060, spanId: "cold-finalize" }),
      timelineEvent({ type: "span.end", name: "auto_reply.finalize_context", timestamp: base + 1160, spanId: "cold-finalize", durationMs: 100 }),
      timelineEvent({ type: "span.start", name: "reply.ensure_workspace", timestamp: base + 1180, spanId: "cold-workspace" }),
      timelineEvent({ type: "span.error", name: "reply.ensure_workspace", timestamp: base + 1230, spanId: "cold-workspace", durationMs: 50, errorName: "SyntheticError" }),
      timelineEvent({ type: "span.end", name: "plugins.metadata.scan", timestamp: base + 1150, spanId: "cold-scan", durationMs: 33, phase: "startup" }),
      timelineEvent({ type: "span.end", name: "plugins.metadata.scan", timestamp: base + 1175, spanId: "cold-scan-gap", durationMs: 10, phase: "agent-turn" }),
      timelineEvent({ type: "provider.request", name: "provider.request", timestamp: base + 1200, receivedAtEpochMs: base + 1200, respondedAtEpochMs: base + 1800, durationMs: 600 }),
      timelineEvent({ type: "eventLoop.sample", name: "eventLoop.sample", timestamp: base + 1250, maxMs: 9 }),
      timelineEvent({ type: "span.start", name: "gateway.chat_send.dispatch_inbound", timestamp: base + 11025, spanId: "warm-dispatch" }),
      timelineEvent({ type: "span.end", name: "gateway.chat_send.dispatch_inbound", timestamp: base + 11125, spanId: "warm-dispatch", durationMs: 100 }),
      timelineEvent({ type: "span.start", name: "reply.load_runtime_plugins", timestamp: base + 11120, spanId: "warm-plugins" }),
      timelineEvent({ type: "span.end", name: "reply.load_runtime_plugins", timestamp: base + 11220, spanId: "warm-plugins", durationMs: 100 }),
      timelineEvent({ type: "span.end", name: "plugins.metadata.scan", timestamp: base + 11100, spanId: "warm-scan", durationMs: 11, phase: "agent-turn" }),
      timelineEvent({ type: "provider.request", name: "provider.request", timestamp: base + 11250, receivedAtEpochMs: base + 11250, respondedAtEpochMs: base + 11600, durationMs: 350 }),
      timelineEvent({ type: "eventLoop.sample", name: "eventLoop.sample", timestamp: base + 11200, maxMs: 7 })
    ].join("\n");
    const parsed = parseTimelineText(timelineText);
    assertEqual(parsed.turnAttributionEvents.length, 17, "turn attribution events retained");
    // Eight distinct span ids appear in the fixture: cold-load, cold-finalize,
    // cold-workspace, cold-scan, cold-scan-gap, warm-dispatch, warm-plugins,
    // warm-scan.
    const parsedIntervals = attributedSpanIntervals(parsed.turnAttributionEvents);
    assertEqual(parsedIntervals.length, 8, "span parser includes error terminal and metadata scans");
    assertEqual(parsedIntervals.some((span) => span.type === "span.error" && span.name === "reply.ensure_workspace"), true, "span error included");

    // Cold turn: active window base+1000 .. base+2500, first provider request
    // at base+1200, i.e. a 200 ms pre-provider window.
    const coldAttribution = buildGatewaySessionPreProviderAttribution({
      label: "cold",
      phaseId: "cold-gateway-session-turn",
      activeStartedAtEpochMs: base + 1000,
      activeFinishedAtEpochMs: base + 2500,
      attribution: {
        firstProviderRequestAtEpochMs: base + 1200,
        preProviderMs: 200,
        providerFinalMs: 600,
        firstByteLatencyMs: 25,
        firstChunkLatencyMs: 30
      },
      timelineSummary: {
        available: true,
        turnAttributionEvents: parsed.turnAttributionEvents,
        artifacts: ["/tmp/kova/openclaw/timeline.jsonl"]
      }
    });
    assertEqual(coldAttribution.available, true, "cold attribution available");
    // NOTE(review): 180 ms is consistent with merging the overlapping cold
    // spans and clipping them to the 200 ms pre-provider window; confirm
    // against buildGatewaySessionPreProviderAttribution. 180 + 20 = 200.
    assertEqual(coldAttribution.knownAttributedMs, 180, "overlap-safe cold known attribution includes active-turn metadata scan");
    assertEqual(coldAttribution.unattributedMs, 20, "cold unattributed remainder");
    const coldScanSummary = coldAttribution.spanSummaries.find((span) => span.name === "plugins.metadata.scan");
    assertEqual(coldScanSummary?.count, 2, "gateway session attribution includes active-turn metadata scans");
    assertEqual(coldScanSummary?.phases?.some((phase) => phase.phase === "startup"), true, "startup phase scan inside active window is counted");
    assertEqual(coldScanSummary?.phases?.some((phase) => phase.phase === "agent-turn"), true, "agent-turn phase scan inside active window is counted");
    assertEqual(coldAttribution.spanSummaries.find((span) => span.name === "reply.ensure_workspace")?.errorCount, 1, "error span summary");
    assertEqual(coldAttribution.provider.totalDurationMs, 600, "provider duration stays separate");
    assertEqual(coldAttribution.timelineArtifacts[0], "/tmp/kova/openclaw/timeline.jsonl", "timeline artifact path");

    // Same turn without a timeline: nothing can be attributed, so the full
    // 200 ms pre-provider time is expected to remain unattributed.
    const missingAttribution = buildGatewaySessionPreProviderAttribution({
      label: "cold",
      phaseId: "cold-gateway-session-turn",
      activeStartedAtEpochMs: base + 1000,
      activeFinishedAtEpochMs: base + 2500,
      attribution: { firstProviderRequestAtEpochMs: base + 1200, preProviderMs: 200 },
      timelineSummary: { available: false, artifacts: [] }
    });
    assertEqual(missingAttribution.available, false, "missing timeline unavailable");
    assertEqual(missingAttribution.unattributedMs, 200, "missing timeline preserves full remainder");

    // End-to-end: run the same timeline through evaluateRecord via a full
    // synthetic cold/warm record and read the metrics back off the record.
    const record = syntheticGatewaySessionRecord({ base, timeline: parsed });
    evaluateRecord(record, {
      id: "gateway-session-send-turn",
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: { agentTurnMs: 2000, coldAgentTurnMs: 2000, warmAgentTurnMs: 1000 }
    }, { surface: { thresholds: {} }, targetPlan: { kind: "runtime" } });
    assertEqual(record.measurements.coldPreProviderAttributedMs, 180, "record cold attributed metric");
    // Warm pre-provider window is base+11000 .. base+11250 (250 ms):
    // 195 attributed + 55 unattributed.
    assertEqual(record.measurements.warmPreProviderAttributedMs, 195, "record warm attributed metric");
    assertEqual(record.measurements.warmPreProviderUnattributedMs, 55, "record warm unattributed metric");
    assertEqual(record.measurements.gatewaySessionPreProviderAttribution.timelineArtifacts[0], "/tmp/kova/openclaw/timeline.jsonl", "record timeline artifact");

    // Render the evaluated record and look for the attribution fragments.
    const rendered = renderMarkdownReport({
      generatedAt: "2026-05-01T00:00:00.000Z",
      runId: "self-check-gateway-session-pre-provider",
      mode: "self-check",
      target: "runtime:stable",
      platform: { os: "test", release: "test", arch: "test", node: "test" },
      records: [record],
      summary: { statuses: { PASS: 1 } }
    });
    assertEqual(rendered.includes("Gateway session pre-provider attribution:"), true, "markdown includes gateway session attribution table");
    assertEqual(rendered.includes("Spans are selected by active turn timestamp window"), true, "markdown describes timestamp-window attribution");
    assertEqual(rendered.includes("`agent-turn`"), true, "markdown includes metadata scan phase as descriptive context");
    assertEqual(rendered.includes("`reply.ensure_workspace`"), true, "markdown includes span table");

    return {
      id: "gateway-session-pre-provider-attribution",
      status: "PASS",
      command: "evaluate synthetic Gateway session pre-provider timeline attribution",
      durationMs: 0
    };
  } catch (error) {
    // Any thrown error is converted into a FAIL result carrying its message.
    return {
      id: "gateway-session-pre-provider-attribution",
      status: "FAIL",
      command: "evaluate synthetic Gateway session pre-provider timeline attribution",
      durationMs: 0,
      message: error.message
    };
  }
}

/**
 * Self-check: agent CLI pre-provider timeline attribution.
 *
 * Parses a synthetic JSONL timeline, builds the cold-turn attribution directly
 * (with and without an available timeline), then evaluates a full synthetic
 * agent CLI record and checks both the record-level metrics and the rendered
 * markdown.
 *
 * Never throws: any error (including a failed assertion) is caught and
 * reported through the returned object.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A check result with status "PASS", or "FAIL" plus the error message.
 */
function agentCliPreProviderAttributionCheck() {
  try {
    // Fixed epoch (ms); every timestamp in the fixture is an offset from it.
    const base = 1777536000000;
    // 16 JSONL lines: 10 for the cold turn, wrapped by an "agent.turn" parent
    // span (base+1000 .. base+1900), and 6 for the warm turn.
    const timelineText = [
      timelineEvent({ type: "span.start", name: "agent.turn", timestamp: base + 1000, spanId: "cold-turn" }),
      timelineEvent({ type: "span.start", name: "agent.prepare", timestamp: base + 1020, spanId: "cold-prepare" }),
      timelineEvent({ type: "span.end", name: "agent.prepare", timestamp: base + 1120, spanId: "cold-prepare", durationMs: 100 }),
      timelineEvent({ type: "span.start", name: "models.catalog.gateway", timestamp: base + 1080, spanId: "cold-models" }),
      timelineEvent({ type: "span.end", name: "models.catalog.gateway", timestamp: base + 1180, spanId: "cold-models", durationMs: 100 }),
      timelineEvent({ type: "span.start", name: "channel.plugin.load", timestamp: base + 1150, spanId: "cold-channel" }),
      timelineEvent({ type: "span.error", name: "channel.plugin.load", timestamp: base + 1170, spanId: "cold-channel", durationMs: 20, errorName: "SyntheticError" }),
      timelineEvent({ type: "span.end", name: "plugins.metadata.scan", timestamp: base + 1190, spanId: "cold-scan", durationMs: 30 }),
      timelineEvent({ type: "provider.request", name: "provider.request", timestamp: base + 1200, receivedAtEpochMs: base + 1200, respondedAtEpochMs: base + 1700, durationMs: 500 }),
      timelineEvent({ type: "span.end", name: "agent.turn", timestamp: base + 1900, spanId: "cold-turn", durationMs: 900 }),
      timelineEvent({ type: "span.start", name: "runtimeDeps.stage", timestamp: base + 11020, spanId: "warm-runtime" }),
      timelineEvent({ type: "span.end", name: "runtimeDeps.stage", timestamp: base + 11070, spanId: "warm-runtime", durationMs: 50 }),
      timelineEvent({ type: "span.start", name: "channel.capabilities", timestamp: base + 11080, spanId: "warm-channel" }),
      timelineEvent({ type: "span.end", name: "channel.capabilities", timestamp: base + 11110, spanId: "warm-channel", durationMs: 30 }),
      timelineEvent({ type: "provider.request", name: "provider.request", timestamp: base + 11200, receivedAtEpochMs: base + 11200, respondedAtEpochMs: base + 11500, durationMs: 300 }),
      timelineEvent({ type: "eventLoop.sample", name: "eventLoop.sample", timestamp: base + 11250, maxMs: 6 })
    ].join("\n");
    const parsed = parseTimelineText(timelineText);
    assertEqual(parsed.turnAttributionEvents.length, 16, "agent CLI turn attribution events retained");

    // Cold turn: active window base+1000 .. base+1900, first provider request
    // at base+1200, i.e. a 200 ms pre-provider window.
    const coldAttribution = buildAgentCliPreProviderAttribution({
      label: "cold",
      phaseId: "cold-agent-turn",
      activeStartedAtEpochMs: base + 1000,
      activeFinishedAtEpochMs: base + 1900,
      attribution: {
        firstProviderRequestAtEpochMs: base + 1200,
        preProviderMs: 200,
        providerFinalMs: 500
      },
      timelineSummary: {
        available: true,
        turnAttributionEvents: parsed.turnAttributionEvents,
        artifacts: ["/tmp/kova/openclaw/timeline.jsonl"]
      }
    });
    assertEqual(coldAttribution.available, true, "agent CLI cold attribution available");
    // NOTE(review): 170 ms is consistent with merging the overlapping child
    // spans (base+1020 .. base+1190) while leaving out the agent.turn parent;
    // confirm against buildAgentCliPreProviderAttribution. 170 + 30 = 200.
    assertEqual(coldAttribution.knownAttributedMs, 170, "agent CLI overlap-safe cold known attribution");
    assertEqual(coldAttribution.unattributedMs, 30, "agent CLI cold unattributed remainder");
    assertEqual(coldAttribution.spanSummaries.some((span) => span.name === "agent.turn"), false, "agent.turn parent span is not counted as pre-provider work");
    assertEqual(coldAttribution.spanSummaries.find((span) => span.name === "channel.plugin.load")?.errorCount, 1, "agent CLI error span summary");

    // Same turn without a timeline: the full 200 ms pre-provider time is
    // expected to remain unattributed.
    const missingAttribution = buildAgentCliPreProviderAttribution({
      label: "cold",
      phaseId: "cold-agent-turn",
      activeStartedAtEpochMs: base + 1000,
      activeFinishedAtEpochMs: base + 1900,
      attribution: { firstProviderRequestAtEpochMs: base + 1200, preProviderMs: 200 },
      timelineSummary: { available: false, artifacts: [] }
    });
    assertEqual(missingAttribution.available, false, "agent CLI missing timeline unavailable");
    assertEqual(missingAttribution.unattributedMs, 200, "agent CLI missing timeline preserves full remainder");

    // End-to-end: run the same timeline through evaluateRecord via a full
    // synthetic agent CLI record and read the metrics back off the record.
    const record = syntheticAgentCliRecord({ base, timeline: parsed });
    evaluateRecord(record, {
      id: "agent-cold-warm-message",
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: { agentTurnMs: 2000, coldAgentTurnMs: 2000, warmAgentTurnMs: 1000 }
    }, { surface: { thresholds: {} }, targetPlan: { kind: "runtime" } });
    assertEqual(record.measurements.agentCliPreProviderAttribution.count, 2, "record agent CLI attribution count");
    assertEqual(record.measurements.gatewaySessionPreProviderAttribution.count, 0, "record gateway session attribution stays empty for CLI turns");
    assertEqual(record.measurements.coldPreProviderAttributedMs, 170, "record agent CLI cold attributed metric");
    // Warm pre-provider window is base+11000 .. base+11200 (200 ms): the two
    // warm spans cover 50 + 30 = 80 ms, leaving 120 ms.
    assertEqual(record.measurements.warmPreProviderAttributedMs, 80, "record agent CLI warm attributed metric");
    assertEqual(record.measurements.warmPreProviderUnattributedMs, 120, "record agent CLI warm unattributed metric");
    assertEqual(record.measurements.agentTurns[0].agentCliPreProviderAttribution.timelineArtifacts[0], "/tmp/kova/openclaw/timeline.jsonl", "record agent CLI timeline artifact");

    // Render the evaluated record and look for the attribution fragments.
    const rendered = renderMarkdownReport({
      generatedAt: "2026-05-01T00:00:00.000Z",
      runId: "self-check-agent-cli-pre-provider",
      mode: "self-check",
      target: "runtime:stable",
      platform: { os: "test", release: "test", arch: "test", node: "test" },
      records: [record],
      summary: { statuses: { PASS: 1 } }
    });
    assertEqual(rendered.includes("Agent CLI pre-provider attribution:"), true, "markdown includes agent CLI attribution table");
    assertEqual(rendered.includes("`channel.plugin.load`"), true, "markdown includes agent CLI span table");

    return {
      id: "agent-cli-pre-provider-attribution",
      status: "PASS",
      command: "evaluate synthetic agent CLI pre-provider timeline attribution",
      durationMs: 0
    };
  } catch (error) {
    // Any thrown error is converted into a FAIL result carrying its message.
    return {
      id: "agent-cli-pre-provider-attribution",
      status: "FAIL",
      command: "evaluate synthetic agent CLI pre-provider timeline attribution",
      durationMs: 0,
      message: error.message
    };
  }
}

/**
 * Serialize one synthetic diagnostics event as a single JSON line.
 *
 * A default `schemaVersion` is placed first and can be overridden by the
 * event's own fields. A numeric `timestamp` is treated as epoch milliseconds
 * and converted to an ISO-8601 string; any other value is passed through
 * unchanged.
 *
 * @param {object} event - Event fields to serialize.
 * @returns {string} The JSON text for the event.
 */
function timelineEvent(event) {
  const { timestamp: rawTimestamp } = event;
  const line = { schemaVersion: "openclaw.diagnostics.v1", ...event };
  // Assigning after the spread keeps the key at the position the event gave it.
  line.timestamp = typeof rawTimestamp === "number"
    ? new Date(rawTimestamp).toISOString()
    : rawTimestamp;
  return JSON.stringify(line);
}

/**
 * Build a synthetic two-phase (cold, then warm) Gateway session record.
 *
 * Each phase's stdout carries a JSON turn payload with its active window; the
 * record also carries one provider request per turn and the supplied timeline
 * (with a fixed artifact path) under `finalMetrics.timeline`.
 *
 * @param {object} options
 * @param {number} options.base - Epoch milliseconds all offsets are added to.
 * @param {object} options.timeline - Timeline summary spread into the record.
 * @returns {object} The synthetic record.
 */
function syntheticGatewaySessionRecord({ base, timeline }) {
  const surfaceId = "gateway-session-send-turn";
  const supportScript = "node support/run-gateway-session-send-turn.mjs";

  // Key order matters here: the payloads are serialized into phase stdout.
  const coldTurnPayload = {
    ok: true,
    surface: surfaceId,
    method: "sessions.send",
    createSession: true,
    minAssistantCount: 1,
    sessionKey: "kova-gateway-session-send",
    runId: "cold-run",
    activeStartedAtEpochMs: base + 1000,
    activeFinishedAtEpochMs: base + 2500,
    activeTurnMs: 1500,
    sendStartedAtEpochMs: base + 1000,
    sendFinishedAtEpochMs: base + 1040,
    sendDurationMs: 40,
    assistantFirstSeenAtEpochMs: base + 2200,
    assistantMatchedAtEpochMs: base + 2500,
    timeToFirstAssistantMs: 1200,
    timeToMatchedAssistantMs: 1500,
    historyPollCount: 3,
    historyErrorCount: 0,
    assistantMessageCount: 1,
    finalAssistantVisibleText: "KOVA_AGENT_OK",
    expectedTextPresent: true
  };
  // The warm turn reuses the session, so only the differing fields are overridden.
  const warmTurnPayload = {
    ...coldTurnPayload,
    createSession: false,
    minAssistantCount: 2,
    runId: "warm-run",
    activeStartedAtEpochMs: base + 11000,
    activeFinishedAtEpochMs: base + 11800,
    activeTurnMs: 800,
    sendStartedAtEpochMs: base + 11000,
    sendFinishedAtEpochMs: base + 11050,
    sendDurationMs: 50,
    assistantFirstSeenAtEpochMs: base + 11600,
    assistantMatchedAtEpochMs: base + 11800,
    timeToFirstAssistantMs: 600,
    timeToMatchedAssistantMs: 800,
    historyPollCount: 2,
    assistantMessageCount: 2
  };

  const coldPhase = syntheticGatewayTurnPhase({
    id: "cold-gateway-session-turn",
    command: `${supportScript} --create-session true`,
    startedAtEpochMs: base,
    finishedAtEpochMs: base + 5000,
    payload: coldTurnPayload
  });
  const warmPhase = syntheticGatewayTurnPhase({
    id: "warm-gateway-session-turn",
    command: `${supportScript} --create-session false`,
    startedAtEpochMs: base + 10000,
    finishedAtEpochMs: base + 14000,
    payload: warmTurnPayload
  });

  // Shared shape of a successful provider request entry.
  const providerRequest = (requestId, receivedAtEpochMs, respondedAtEpochMs, firstByteLatencyMs, firstChunkLatencyMs) => ({
    requestId,
    receivedAt: new Date(receivedAtEpochMs).toISOString(),
    receivedAtEpochMs,
    respondedAt: new Date(respondedAtEpochMs).toISOString(),
    respondedAtEpochMs,
    firstByteLatencyMs,
    firstChunkLatencyMs,
    route: "/v1/responses",
    model: "gpt-5.5",
    status: 200
  });
  const providerRequests = [
    providerRequest("cold-provider", base + 1200, base + 1800, 25, 30),
    providerRequest("warm-provider", base + 11250, base + 11600, 20, 22)
  ];

  const finalMetrics = {
    service: { gatewayState: "running" },
    logs: zeroLogMetrics(),
    timeline: { ...timeline, artifacts: ["/tmp/kova/openclaw/timeline.jsonl"] }
  };

  return {
    scenario: surfaceId,
    surface: surfaceId,
    title: "Gateway session cold/warm",
    status: "PASS",
    cleanup: "done",
    auth: { mode: "mock" },
    phases: [coldPhase, warmPhase],
    providerEvidence: {
      available: true,
      requestCount: 2,
      requests: providerRequests
    },
    finalMetrics
  };
}

/**
 * Build a synthetic two-phase (cold, then warm) agent CLI record.
 *
 * The record carries one provider request per turn and the supplied timeline
 * (with a fixed artifact path) under `finalMetrics.timeline`.
 *
 * @param {object} options
 * @param {number} options.base - Epoch milliseconds all offsets are added to.
 * @param {object} options.timeline - Timeline summary spread into the record.
 * @returns {object} The synthetic record.
 */
function syntheticAgentCliRecord({ base, timeline }) {
  const scenarioId = "agent-cold-warm-message";

  const coldPhase = syntheticAgentCliTurnPhase({
    id: "cold-agent-turn",
    startedAtEpochMs: base + 1000,
    finishedAtEpochMs: base + 1900
  });
  const warmPhase = syntheticAgentCliTurnPhase({
    id: "warm-agent-turn",
    startedAtEpochMs: base + 11000,
    finishedAtEpochMs: base + 11600
  });

  // Shared shape of a successful provider request entry.
  const providerRequest = (requestId, receivedAtEpochMs, respondedAtEpochMs, firstByteLatencyMs, firstChunkLatencyMs) => ({
    requestId,
    receivedAt: new Date(receivedAtEpochMs).toISOString(),
    receivedAtEpochMs,
    respondedAt: new Date(respondedAtEpochMs).toISOString(),
    respondedAtEpochMs,
    firstByteLatencyMs,
    firstChunkLatencyMs,
    route: "/v1/responses",
    model: "gpt-5.5",
    status: 200
  });
  const providerRequests = [
    providerRequest("cold-provider", base + 1200, base + 1700, 20, 25),
    providerRequest("warm-provider", base + 11200, base + 11500, 18, 20)
  ];

  const finalMetrics = {
    service: { gatewayState: "running" },
    logs: zeroLogMetrics(),
    timeline: { ...timeline, artifacts: ["/tmp/kova/openclaw/timeline.jsonl"] }
  };

  return {
    scenario: scenarioId,
    surface: scenarioId,
    title: "Agent CLI cold/warm",
    status: "PASS",
    cleanup: "done",
    auth: { mode: "mock" },
    phases: [coldPhase, warmPhase],
    providerEvidence: {
      available: true,
      requestCount: 2,
      requests: providerRequests
    },
    finalMetrics
  };
}

/**
 * Build one synthetic agent CLI turn phase with a single successful result.
 *
 * The result's stdout is a JSON object whose `finalAssistantVisibleText` is
 * "KOVA_AGENT_OK"; its duration is the difference of the two timestamps.
 *
 * @param {object} options
 * @param {string} options.id - Phase id, also used as the phase title.
 * @param {number} options.startedAtEpochMs - Command start, epoch milliseconds.
 * @param {number} options.finishedAtEpochMs - Command finish, epoch milliseconds.
 * @returns {object} The synthetic phase.
 */
function syntheticAgentCliTurnPhase({ id, startedAtEpochMs, finishedAtEpochMs }) {
  const cliCommand = "ocm @kova -- agent --local --agent main --session-id kova-agent-cold-warm --message hi --json";
  const commandResult = {
    command: cliCommand,
    status: 0,
    timedOut: false,
    startedAt: new Date(startedAtEpochMs).toISOString(),
    startedAtEpochMs,
    finishedAt: new Date(finishedAtEpochMs).toISOString(),
    finishedAtEpochMs,
    durationMs: finishedAtEpochMs - startedAtEpochMs,
    stdout: JSON.stringify({ finalAssistantVisibleText: "KOVA_AGENT_OK" }),
    stderr: ""
  };
  const phaseMetrics = { logs: zeroLogMetrics(), health: { ok: true } };

  return {
    id,
    title: id,
    intent: "Synthetic agent CLI turn",
    commands: [cliCommand],
    evidence: [],
    results: [commandResult],
    metrics: phaseMetrics
  };
}

/**
 * Build one synthetic Gateway session turn phase with a single successful
 * result whose stdout is the JSON-serialized `payload`.
 *
 * @param {object} options
 * @param {string} options.id - Phase id, also used as the phase title.
 * @param {string} options.command - Command line recorded for the phase.
 * @param {number} options.startedAtEpochMs - Command start, epoch milliseconds.
 * @param {number} options.finishedAtEpochMs - Command finish, epoch milliseconds.
 * @param {object} options.payload - Turn payload serialized into stdout.
 * @returns {object} The synthetic phase.
 */
function syntheticGatewayTurnPhase({ id, command, startedAtEpochMs, finishedAtEpochMs, payload }) {
  const commandResult = {
    command,
    status: 0,
    timedOut: false,
    startedAt: new Date(startedAtEpochMs).toISOString(),
    startedAtEpochMs,
    finishedAt: new Date(finishedAtEpochMs).toISOString(),
    finishedAtEpochMs,
    durationMs: finishedAtEpochMs - startedAtEpochMs,
    stdout: JSON.stringify(payload),
    stderr: ""
  };
  const phaseMetrics = { logs: zeroLogMetrics(), health: { ok: true } };

  return {
    id,
    title: id,
    intent: "Synthetic Gateway session turn",
    commands: [command],
    evidence: [],
    results: [commandResult],
    metrics: phaseMetrics
  };
}

/**
 * Build a synthetic agent turn: a command result, a single provider request,
 * the provider attribution computed from the two, and the turn breakdown.
 *
 * @param {object} options
 * @param {number} options.startedAtEpochMs - Command start, epoch milliseconds.
 * @param {number} options.firstProviderRequestAtEpochMs - When the provider request was received.
 * @param {number|null} [options.firstByteLatencyMs=null] - First-byte latency recorded on the request.
 * @param {number|null} [options.firstChunkLatencyMs=null] - First-chunk latency recorded on the request.
 * @param {number} options.lastProviderResponseAtEpochMs - When the provider responded.
 * @param {number} options.finishedAtEpochMs - Command finish, epoch milliseconds.
 * @param {object} [options.timelineSummary] - Passed through to the breakdown builder.
 * @returns {{result: object, request: object, attribution: *, breakdown: *}}
 */
function syntheticTurn({
  startedAtEpochMs,
  firstProviderRequestAtEpochMs,
  firstByteLatencyMs = null,
  firstChunkLatencyMs = null,
  lastProviderResponseAtEpochMs,
  finishedAtEpochMs,
  timelineSummary
}) {
  const isoAt = (epochMs) => new Date(epochMs).toISOString();
  const snapshotAt = (epochMs) => ({ capturedAt: isoAt(epochMs), processCount: 2 });

  // Process snapshots are stamped 10 ms outside the command on either side.
  const commandResult = {
    command: "ocm @kova -- agent --local --agent main --session-id kova --message hi --json",
    startedAt: isoAt(startedAtEpochMs),
    startedAtEpochMs,
    finishedAt: isoAt(finishedAtEpochMs),
    finishedAtEpochMs,
    durationMs: finishedAtEpochMs - startedAtEpochMs,
    processSnapshots: {
      before: snapshotAt(startedAtEpochMs - 10),
      after: snapshotAt(finishedAtEpochMs + 10),
      leaks: { leakCount: 0, leaksByRole: {}, leakedProcesses: [] }
    }
  };

  const providerRequest = {
    requestId: "self-check-provider",
    receivedAt: isoAt(firstProviderRequestAtEpochMs),
    receivedAtEpochMs: firstProviderRequestAtEpochMs,
    firstByteLatencyMs,
    firstChunkLatencyMs,
    respondedAt: isoAt(lastProviderResponseAtEpochMs),
    respondedAtEpochMs: lastProviderResponseAtEpochMs,
    route: "/v1/responses",
    model: "gpt-5.5",
    stream: true,
    status: 200,
    statusClass: "2xx"
  };

  const providerEvidence = { available: true, requests: [providerRequest] };
  const turnAttribution = computeProviderTurnAttribution(commandResult, providerEvidence);
  const turnBreakdown = buildAgentTurnBreakdown({
    result: commandResult,
    attribution: turnAttribution,
    timelineSummary
  });

  return {
    result: commandResult,
    request: providerRequest,
    attribution: turnAttribution,
    breakdown: turnBreakdown
  };
}

/**
 * Self-check for the mock OpenAI server's `error-then-recover` mode.
 *
 * A single shell pipeline starts `support/mock-openai-server.mjs` in the background,
 * waits for its port file, sends two non-streaming `/v1/responses` requests, and then
 * kills the server. The check passes when the first response is 503, the second is
 * 200, and the server's request log (parsed by `parseProviderRequestLog`) records
 * both requests with the expected modes and error class.
 *
 * The pipeline exits with the HTTP client's status, not the status of the trailing
 * `kill … || true`. Without that, a client failure would exit 0 and only show up as
 * an opaque JSON parse error instead of the client's stderr.
 *
 * @param {string} tmp - Scratch directory; artifacts go in `<tmp>/mock-provider-behavior`.
 * @returns {Promise<object>} Check outcome: `id`, `status` ("PASS" or "FAIL"),
 *   `command`, `durationMs`, plus `message` when the check failed.
 */
async function mockProviderBehaviorCheck(tmp) {
  const dir = join(tmp, "mock-provider-behavior");
  await mkdir(dir, { recursive: true });
  const command = [
    `node support/mock-openai-server.mjs --port-file ${quoteShell(join(dir, "port"))} --request-log ${quoteShell(join(dir, "requests.jsonl"))} --mode error-then-recover --error-status 503 >${quoteShell(join(dir, "server.log"))} 2>&1 & echo $! >${quoteShell(join(dir, "pid"))}`,
    // Poll for up to ~5 s until the server has written a non-empty port file.
    `for i in $(seq 1 50); do test -s ${quoteShell(join(dir, "port"))} && break; sleep 0.1; done`,
    `port=$(cat ${quoteShell(join(dir, "port"))})`,
    "node -e 'const port=process.argv[1]; const body=JSON.stringify({model:\"gpt-5.5\",stream:false}); const send=()=>fetch(`http://127.0.0.1:${port}/v1/responses`,{method:\"POST\",headers:{\"content-type\":\"application/json\"},body}).then(async r=>({status:r.status,text:await r.text()})); const first=await send(); const second=await send(); console.log(JSON.stringify({first:first.status,second:second.status}));' \"$port\"",
    // Remember the client's exit status so the cleanup below cannot mask a failure.
    "rc=$?",
    `kill "$(cat ${quoteShell(join(dir, "pid"))})" 2>/dev/null || true`,
    "exit $rc"
  ].join("; ");
  const result = await runCommand(command, { timeoutMs: 10000 });
  try {
    if (result.status !== 0) {
      throw new Error(`mock provider behavior command failed: ${result.stderr || result.stdout}`);
    }
    // Only the last stdout line is the client's JSON report.
    const response = JSON.parse(result.stdout.trim().split(/\r?\n/).at(-1));
    assertEqual(response.first, 503, "first transient provider status");
    assertEqual(response.second, 200, "second recovered provider status");
    const evidence = parseProviderRequestLog(await readFile(join(dir, "requests.jsonl"), "utf8"));
    assertEqual(evidence.requestCount, 2, "behavior request count");
    assertEqual(evidence.requests[0]?.mode, "error-then-recover", "first request behavior");
    assertEqual(evidence.requests[0]?.errorClass, "provider-error", "first request error class");
    assertEqual(evidence.requests[1]?.mode, "normal", "second request behavior");
    return {
      id: "mock-provider-behavior",
      status: "PASS",
      command,
      durationMs: result.durationMs
    };
  } catch (error) {
    return {
      id: "mock-provider-behavior",
      status: "FAIL",
      command,
      durationMs: result.durationMs,
      message: error.message
    };
  }
}

/**
 * Self-check for `support/run-concurrent-agent-turns.mjs`.
 *
 * Writes a fake `ocm` executable (a Node script printing one JSON line with
 * `finalAssistantVisibleText: 'KOVA_AGENT_OK'`), puts its directory at the front of
 * PATH, runs the concurrent runner for two turns, and validates the JSON summary
 * the runner prints on stdout.
 *
 * @param {string} tmp - Scratch directory that receives the fake binary directory.
 * @returns {Promise<object>} Check outcome: `id`, `status` ("PASS" or "FAIL"),
 *   `command`, `durationMs`, plus `message` when the check failed.
 */
async function concurrentAgentRunnerCheck(tmp) {
  const binDir = join(tmp, "concurrent-agent-runner-bin");
  const ocmPath = join(binDir, "ocm");
  const ocmScript = [
    "#!/usr/bin/env node",
    "process.stdout.write(JSON.stringify({ finalAssistantVisibleText: 'KOVA_AGENT_OK' }) + '\\n');"
  ].join("\n");

  await mkdir(binDir, { recursive: true });
  await writeFile(ocmPath, ocmScript, "utf8");
  await chmod(ocmPath, 0o755);

  const command = `PATH=${quoteShell(binDir)}:$PATH node support/run-concurrent-agent-turns.mjs --env kova-self-check --count 2 --session-prefix kova-self-check-concurrent --message hi --expected-text KOVA_AGENT_OK --timeout 5`;
  const run = await runCommand(command, { timeoutMs: 10000 });
  const outcome = {
    id: "concurrent-agent-runner",
    status: "PASS",
    command,
    durationMs: run.durationMs
  };

  try {
    if (run.status !== 0) {
      throw new Error(`concurrent agent runner failed: ${run.stderr || run.stdout}`);
    }
    const summary = JSON.parse(run.stdout);
    assertEqual(summary.schemaVersion, "kova.concurrentAgentTurns.v1", "concurrent runner schema");
    assertEqual(summary.ok, true, "concurrent runner ok");
    assertEqual(summary.count, 2, "concurrent runner count");
    assertEqual(summary.successCount, 2, "concurrent runner success count");
    const everyTurnHadText = summary.turns.every((turn) => turn.expectedTextPresent === true);
    assertEqual(everyTurnHadText, true, "all concurrent turns included expected text");
  } catch (error) {
    // Any failed assertion or parse error becomes a FAIL outcome carrying its message.
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check for `support/run-official-plugin-install.mjs`.
 *
 * Installs a fake `ocm` on PATH that answers the plugin install/list/registry,
 * status, and log commands, then runs the install runner twice:
 *   1. a normal run, which must exit 0 and report `@openclaw/discord`;
 *   2. a run with `KOVA_FAKE_OCM_SECURITY_BLOCK=1`, where the fake install exits 1
 *      with a dangerous-code warning; the runner must exit non-zero and report the
 *      security block together with diagnostic-log failure evidence.
 *
 * @param {string} tmp - Scratch directory for the fake binary and artifact directories.
 * @returns {Promise<object>} Check outcome: `id`, `status` ("PASS" or "FAIL"),
 *   `command` (the success-path command), `durationMs` (both runs summed), plus
 *   `message` when the check failed.
 */
async function officialPluginInstallRunnerCheck(tmp) {
  const binDir = join(tmp, "official-plugin-runner-bin");
  const ocmPath = join(binDir, "ocm");
  const artifactDir = join(tmp, "official-plugin-runner-artifacts");
  const ocmScript = [
    "#!/usr/bin/env node",
    "const text = process.argv.slice(2).join(' ');",
    "if (text.includes('@kova-self-check -- plugins install @openclaw/discord')) {",
    "  if (process.env.KOVA_FAKE_OCM_SECURITY_BLOCK === '1') {",
    "    process.stderr.write('WARNING: Plugin \"discord\" contains dangerous code patterns: credential harvesting\\n');",
    "    process.exit(1);",
    "  }",
    "  process.stdout.write('installed @openclaw/discord\\n');",
    "  process.exit(0);",
    "}",
    "if (text.includes('@kova-self-check -- plugins list')) {",
    "  process.stdout.write('discord @openclaw/discord\\n');",
    "  process.exit(0);",
    "}",
    "if (text.includes('@kova-self-check -- plugins registry --refresh --json')) {",
    "  process.stdout.write(JSON.stringify({ plugins: [{ id: 'discord' }] }) + '\\n');",
    "  process.exit(0);",
    "}",
    "if (text.includes('@kova-self-check -- status')) {",
    "  process.stdout.write('status ok\\n');",
    "  process.exit(0);",
    "}",
    "if (text.includes('logs kova-self-check --tail 400 --raw')) {",
    "  process.stdout.write('[plugins] diagnostic log line\\n');",
    "  process.exit(0);",
    "}",
    "process.stderr.write('unexpected fake ocm command: ' + text + '\\n');",
    "process.exit(2);"
  ].join("\n");

  await mkdir(binDir, { recursive: true });
  await writeFile(ocmPath, ocmScript, "utf8");
  await chmod(ocmPath, 0o755);

  // Both runs share the same invocation; only the extra env prefix and artifact dir differ.
  const runnerCommand = (envPrefix, dir) =>
    `PATH=${quoteShell(binDir)}:$PATH ${envPrefix}node support/run-official-plugin-install.mjs --env kova-self-check --state states/official-plugins.json --artifact-dir ${quoteShell(dir)} --timeout-ms 5000`;
  const runOptions = () => ({ timeoutMs: 10000, maxOutputChars: 1000000 });

  const successCommand = runnerCommand("", artifactDir);
  const success = await runCommand(successCommand, runOptions());
  const blockedCommand = runnerCommand("KOVA_FAKE_OCM_SECURITY_BLOCK=1 ", join(tmp, "official-plugin-blocked-artifacts"));
  const blocked = await runCommand(blockedCommand, runOptions());

  const outcome = {
    id: "official-plugin-install-runner",
    status: "PASS",
    command: successCommand,
    durationMs: success.durationMs + blocked.durationMs
  };

  try {
    if (success.status !== 0) {
      throw new Error(`official plugin runner success path failed: ${success.stderr || success.stdout}`);
    }
    const successSummary = JSON.parse(success.stdout);
    assertEqual(successSummary.schemaVersion, "kova.officialPluginInstall.v1", "official plugin runner schema");
    assertEqual(successSummary.ok, true, "official plugin runner ok");
    assertEqual(successSummary.pluginCount >= 1, true, "official plugin runner plugin count");
    assertEqual(successSummary.pluginResults?.[0]?.package, "@openclaw/discord", "official plugin package");

    if (blocked.status === 0) {
      throw new Error("official plugin runner security-block path should fail");
    }
    const blockedSummary = JSON.parse(blocked.stdout);
    assertEqual(blockedSummary.securityBlocked, true, "official plugin runner security blocked");
    assertEqual(blockedSummary.securityBlockCount, 1, "official plugin runner security block count");
    assertEqual(blockedSummary.failureEvidence?.length, 1, "official plugin runner failure evidence");
    const hasDiagnosticLogs = blockedSummary.failureEvidence?.[0]?.diagnostics?.some((step) => step.id === "diagnostic-logs:discord");
    assertEqual(hasDiagnosticLogs, true, "official plugin runner diagnostic logs");
  } catch (error) {
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check: runs `evaluateRecord` over a synthetic `agent-provider-recovery`
 * record and verifies the resulting measurements.
 *
 * The record has one successful agent turn whose provider evidence contains a 503
 * request in `error-then-recover` mode followed by a 200 request in `normal` mode.
 * The check expects the record to stay PASS, recovery and containment to be
 * reported as ok, a `provider-error` latency diagnosis, and fixer items for both
 * `provider-error` and `provider-recovered`.
 *
 * @returns {object} Check outcome: `id`, `status` ("PASS" or "FAIL"), `command`,
 *   `durationMs` (always 0), plus `message` when the check failed.
 */
function providerFailureEvaluationCheck() {
  const outcome = {
    id: "provider-failure-evaluation",
    status: "PASS",
    command: "evaluate synthetic provider failure containment",
    durationMs: 0
  };

  try {
    const agentTurnResult = {
      command: "ocm @kova -- agent --local --agent main --session-id kova-agent-provider-recovery --message hi --json",
      status: 0,
      timedOut: false,
      startedAt: "2026-04-30T10:00:01.000Z",
      startedAtEpochMs: 1777543201000,
      finishedAt: "2026-04-30T10:00:02.000Z",
      finishedAtEpochMs: 1777543202000,
      durationMs: 1000,
      stdout: "{\"finalAssistantVisibleText\":\"KOVA_AGENT_OK\"}",
      stderr: "",
      processSnapshots: {
        leaks: {
          schemaVersion: "kova.processLeakSummary.v1",
          leakCount: 0,
          leakedProcesses: [],
          leaksByRole: {}
        }
      }
    };

    // First provider request: the transient 503.
    const failedRequest = {
      requestId: "provider-error",
      mode: "error-then-recover",
      outcome: "completed",
      errorClass: "provider-error",
      receivedAt: "2026-04-30T10:00:01.500Z",
      receivedAtEpochMs: 1777543201500,
      respondedAt: "2026-04-30T10:00:01.520Z",
      respondedAtEpochMs: 1777543201520,
      firstByteLatencyMs: 10,
      firstChunkLatencyMs: 10,
      route: "/v1/responses",
      model: "gpt-5.5",
      stream: true,
      status: 503,
      statusClass: "5xx"
    };

    // Second provider request: the successful retry.
    const recoveredRequest = {
      requestId: "provider-recover",
      mode: "normal",
      outcome: "completed",
      errorClass: null,
      receivedAt: "2026-04-30T10:00:01.600Z",
      receivedAtEpochMs: 1777543201600,
      respondedAt: "2026-04-30T10:00:01.700Z",
      respondedAtEpochMs: 1777543201700,
      firstByteLatencyMs: 20,
      firstChunkLatencyMs: 20,
      route: "/v1/responses",
      model: "gpt-5.5",
      stream: true,
      status: 200,
      statusClass: "2xx"
    };

    const record = {
      scenario: "agent-provider-recovery",
      status: "PASS",
      auth: { mode: "mock", source: "mock", providerId: "openai" },
      phases: [
        {
          id: "transient-provider-failure-turn",
          results: [agentTurnResult],
          metrics: { logs: zeroLogMetrics(), health: { ok: true } }
        }
      ],
      providerEvidence: {
        available: true,
        requestCount: 2,
        requests: [failedRequest, recoveredRequest]
      },
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics()
      }
    };
    const scenario = {
      id: "agent-provider-recovery",
      mockProvider: { mode: "error-then-recover" },
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: {
        providerFinalMs: 10000,
        providerFailureHealthFailures: 0
      }
    };
    const context = { surface: { thresholds: {} }, targetPlan: { kind: "npm" } };

    evaluateRecord(record, scenario, context);

    assertEqual(record.status, "PASS", "provider recovery scenario status");
    const { measurements } = record;
    assertEqual(measurements.agentProviderSimulation.mode, "error-then-recover", "provider simulation mode");
    assertEqual(measurements.agentProviderSimulation.recoveryOk, true, "provider recovery ok");
    assertEqual(measurements.agentProviderSimulation.containmentOk, true, "provider containment ok");
    assertEqual(measurements.agentFailureContainment.processLeaksOk, true, "agent process leaks ok");
    assertEqual(measurements.agentTurns[0].responseOk, true, "recovery response ok");
    assertEqual(measurements.agentLatencyDiagnosis.kind, "provider-error", "provider failure diagnosis");
    const fixerKinds = new Set(measurements.agentFailureFixerSummary.items.map((item) => item.kind));
    assertEqual(fixerKinds.has("provider-error"), true, "provider error fixer evidence");
    assertEqual(fixerKinds.has("provider-recovered"), true, "provider recovered fixer evidence");
  } catch (error) {
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check: runs `evaluateRecord` over a synthetic `agent-provider-concurrent`
 * record and verifies the concurrency measurements.
 *
 * The record has one concurrent-runner result and three provider requests in
 * `concurrent-pressure` mode, received 100 ms apart and each answered one second
 * after it was received. The check expects a PASS record with three requests,
 * a maximum provider concurrency of three, and an ok response on the first turn.
 *
 * @returns {object} Check outcome: `id`, `status` ("PASS" or "FAIL"), `command`,
 *   `durationMs` (always 0), plus `message` when the check failed.
 */
function providerConcurrentEvaluationCheck() {
  const outcome = {
    id: "provider-concurrent-evaluation",
    status: "PASS",
    command: "evaluate synthetic concurrent provider pressure",
    durationMs: 0
  };

  try {
    const runnerResult = {
      command: "node support/run-concurrent-agent-turns.mjs --env kova-self-check --count 3 --message hi --expected-text KOVA_AGENT_OK",
      status: 0,
      timedOut: false,
      startedAt: "2026-04-30T10:00:01.000Z",
      startedAtEpochMs: 1777543201000,
      finishedAt: "2026-04-30T10:00:05.000Z",
      finishedAtEpochMs: 1777543205000,
      durationMs: 4000,
      stdout: "{\"finalAssistantVisibleText\":\"KOVA_AGENT_OK\",\"successCount\":3}",
      stderr: "",
      processSnapshots: {
        leaks: {
          schemaVersion: "kova.processLeakSummary.v1",
          leakCount: 0,
          leakedProcesses: [],
          leaksByRole: {}
        }
      }
    };

    // Three provider requests, staggered by 100 ms.
    const requests = [];
    for (let index = 1; index <= 3; index += 1) {
      requests.push({
        requestId: `concurrent-provider-${index}`,
        mode: "concurrent-pressure",
        outcome: "completed",
        errorClass: null,
        receivedAt: `2026-04-30T10:00:02.${index}00Z`,
        receivedAtEpochMs: 1777543202000 + (index * 100),
        respondedAt: `2026-04-30T10:00:03.${index}00Z`,
        respondedAtEpochMs: 1777543203000 + (index * 100),
        firstByteLatencyMs: 1000,
        firstChunkLatencyMs: 1000,
        route: "/v1/responses",
        model: "gpt-5.5",
        stream: true,
        status: 200,
        statusClass: "2xx"
      });
    }

    const record = {
      scenario: "agent-provider-concurrent",
      status: "PASS",
      auth: { mode: "mock", source: "mock", providerId: "openai" },
      phases: [
        {
          id: "concurrent-provider-turns",
          results: [runnerResult],
          metrics: { logs: zeroLogMetrics(), health: { ok: true } }
        }
      ],
      providerEvidence: { available: true, requestCount: 3, requests },
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics()
      }
    };
    const scenario = {
      id: "agent-provider-concurrent",
      mockProvider: { mode: "concurrent-pressure", delayMs: 1500, concurrency: 3 },
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: {
        providerRequestCountMin: 3,
        providerConcurrencyMin: 2,
        providerFailureHealthFailures: 0,
        agentProcessLeaks: 0
      }
    };
    const context = { surface: { thresholds: {} }, targetPlan: { kind: "npm" } };

    evaluateRecord(record, scenario, context);

    assertEqual(record.status, "PASS", "provider concurrent scenario status");
    const { measurements } = record;
    assertEqual(measurements.agentProviderSimulation.mode, "concurrent-pressure", "provider concurrent mode");
    assertEqual(measurements.agentProviderSimulation.concurrentObserved, true, "provider concurrent observed");
    assertEqual(measurements.agentProviderSimulation.providerRequestCount, 3, "provider concurrent request count");
    assertEqual(measurements.agentProviderSimulation.providerMaxConcurrency, 3, "provider max concurrency");
    assertEqual(measurements.agentTurns[0].requestCount, 3, "concurrent turn provider request count");
    assertEqual(measurements.agentTurns[0].responseOk, true, "concurrent response ok");
  } catch (error) {
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check: runs `evaluateRecord` over a synthetic `agent-auth-missing` record.
 *
 * The record has an expected-failure agent turn (wrapped by
 * `support/expect-command-fails.mjs`, stderr "missing OpenAI credentials"), a
 * follow-up status phase, and no provider evidence. The check expects a PASS
 * record with one agent turn whose expected failure was observed, an
 * `auth-failure` diagnosis, a healthy gateway, and an `auth-failure` fixer item.
 *
 * @returns {object} Check outcome: `id`, `status` ("PASS" or "FAIL"), `command`,
 *   `durationMs` (always 0), plus `message` when the check failed.
 */
function agentAuthFailureEvaluationCheck() {
  const outcome = {
    id: "agent-auth-failure-evaluation",
    status: "PASS",
    command: "evaluate synthetic missing-auth agent failure containment",
    durationMs: 0
  };

  try {
    // The wrapper exits 0 because the wrapped agent command failed as expected.
    const failedTurnPhase = {
      id: "missing-auth-agent-turn",
      expectedAgentFailure: true,
      results: [{
        command: "node support/expect-command-fails.mjs -- ocm @kova-self-check -- agent --local --agent main --session-id kova-agent-auth-missing --message hi --json",
        status: 0,
        timedOut: false,
        startedAt: "2026-04-30T10:00:01.000Z",
        startedAtEpochMs: 1777543201000,
        finishedAt: "2026-04-30T10:00:02.000Z",
        finishedAtEpochMs: 1777543202000,
        durationMs: 1000,
        stdout: "",
        stderr: "missing OpenAI credentials",
        processSnapshots: {
          leaks: {
            schemaVersion: "kova.processLeakSummary.v1",
            leakCount: 0,
            leakedProcesses: [],
            leaksByRole: {}
          }
        }
      }],
      metrics: { logs: zeroLogMetrics(), health: { ok: true } }
    };
    const healthPhase = {
      id: "post-auth-failure-health",
      results: [{
        command: "ocm @kova-self-check -- status",
        status: 0,
        timedOut: false,
        durationMs: 100,
        stdout: "status ok",
        stderr: ""
      }],
      metrics: { logs: zeroLogMetrics(), health: { ok: true } }
    };

    const record = {
      scenario: "agent-auth-missing",
      status: "PASS",
      auth: { mode: "missing", source: "override:missing", providerId: null },
      phases: [failedTurnPhase, healthPhase],
      providerEvidence: {
        available: false,
        requestCount: 0,
        requests: [],
        errors: [],
        error: "provider request log not found"
      },
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics()
      }
    };
    const scenario = {
      id: "agent-auth-missing",
      auth: { mode: "missing" },
      agent: { expectedFailure: true },
      thresholds: {
        agentContainmentHealthFailures: 0,
        agentProcessLeaks: 0
      }
    };
    const context = { surface: { thresholds: {} }, targetPlan: { kind: "npm" } };

    evaluateRecord(record, scenario, context);

    assertEqual(record.status, "PASS", "agent auth failure scenario status");
    const { measurements } = record;
    assertEqual(measurements.agentTurnCount, 1, "auth failure agent turn count");
    assertEqual(measurements.agentTurns[0].expectedFailureObserved, true, "auth failure observed");
    assertEqual(measurements.agentLatencyDiagnosis.kind, "auth-failure", "auth failure diagnosis");
    assertEqual(measurements.agentFailureContainment.gatewayHealthy, true, "auth failure gateway healthy");
    const hasAuthFailureItem = measurements.agentFailureFixerSummary.items.some((item) => item.kind === "auth-failure");
    assertEqual(hasAuthFailureItem, true, "auth failure fixer evidence");
  } catch (error) {
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check for `support/run-soak-loop.mjs`.
 *
 * Writes a fake `ocm` whose `service status` reports a running gateway on the port
 * from `KOVA_FAKE_PORT`, starts a throwaway HTTP server on 127.0.0.1:39291 that
 * answers "ok", runs the soak loop for 50 ms against it, then kills the server
 * while keeping the soak loop's exit status as the pipeline status.
 *
 * @param {string} tmp - Scratch directory that receives the fake binary directory.
 * @returns {Promise<object>} Check outcome: `id`, `status` ("PASS" or "FAIL"),
 *   `command`, `durationMs`, plus `message` when the check failed.
 */
async function soakLoopRunnerCheck(tmp) {
  const port = 39291;
  const binDir = join(tmp, "soak-loop-runner-bin");
  const ocmPath = join(binDir, "ocm");
  const ocmScript = [
    "#!/usr/bin/env node",
    "const args = process.argv.slice(2);",
    "if (args[0] === 'service' && args[1] === 'status') {",
    "  process.stdout.write(JSON.stringify({ gatewayState: 'running', running: true, gatewayPort: Number(process.env.KOVA_FAKE_PORT) }) + '\\n');",
    "  process.exit(0);",
    "}",
    "process.stdout.write('ok\\n');"
  ].join("\n");

  await mkdir(binDir, { recursive: true });
  await writeFile(ocmPath, ocmScript, "utf8");
  await chmod(ocmPath, 0o755);

  const startServer = `node -e "require('node:http').createServer((req,res)=>{res.end('ok')}).listen(${port},'127.0.0.1')" >/dev/null 2>&1 & server_pid=$!`;
  const runSoakLoop = `PATH=${quoteShell(binDir)}:$PATH KOVA_FAKE_PORT=${port} node support/run-soak-loop.mjs --env kova-self-check --duration-ms 50 --interval-ms 0 --timeout-ms 5000`;
  // Capture the soak loop's status before cleanup so `kill` cannot overwrite it.
  const command = [startServer, runSoakLoop, "rc=$?", "kill $server_pid 2>/dev/null || true", "exit $rc"].join("; ");

  const run = await runCommand(command, { timeoutMs: 10000, maxOutputChars: 1000000 });
  const outcome = {
    id: "soak-loop-runner",
    status: "PASS",
    command,
    durationMs: run.durationMs
  };

  try {
    if (run.status !== 0) {
      throw new Error(`soak loop runner failed: ${run.stderr || run.stdout}`);
    }
    const summary = JSON.parse(run.stdout);
    assertEqual(summary.schemaVersion, "kova.soakLoop.v1", "soak loop schema");
    assertEqual(summary.iterations >= 1, true, "soak loop iterations");
    assertEqual(summary.commandSummary.failureCount, 0, "soak loop command failures");
    assertEqual(summary.healthSummary.failureCount, 0, "soak loop health failures");
    assertEqual(summary.commandSummary.byId.status.count >= 1, true, "soak loop status command count");
  } catch (error) {
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check: runs `evaluateRecord` over a synthetic soak record whose RSS growth
 * exceeds the configured thresholds.
 *
 * The soak loop summary itself is clean (no command or health failures), but the
 * resource trend reports 420 MB total and 390 MB gateway RSS growth against 300 MB
 * limits. The check therefore expects the record to become FAIL, the soak
 * measurements to be copied through, and an `rssGrowthMb` violation to be recorded.
 *
 * @returns {object} Check outcome: `id`, `status` ("PASS" or "FAIL"), `command`,
 *   `durationMs` (always 0), plus `message` when the check failed.
 */
function soakTrendEvaluationCheck() {
  const outcome = {
    id: "soak-trend-evaluation",
    status: "PASS",
    command: "evaluate synthetic soak trend regression",
    durationMs: 0
  };

  try {
    const loopSummary = {
      schemaVersion: "kova.soakLoop.v1",
      durationMs: 65000,
      iterations: 3,
      commandSummary: {
        count: 9,
        okCount: 9,
        failureCount: 0,
        p95Ms: 900,
        maxMs: 1200
      },
      healthSummary: {
        count: 3,
        okCount: 3,
        failureCount: 0,
        p95Ms: 45,
        maxMs: 60
      }
    };
    // Growth figures deliberately above the 300 MB thresholds passed below.
    const resourceSamples = {
      sampleCount: 3,
      peakTotalRssMb: 1000,
      maxTotalCpuPercent: 80,
      peakGatewayRssMb: 900,
      peakCommandTreeRssMb: 100,
      byRole: {},
      topRolesByRss: [],
      topRolesByCpu: [],
      topByRss: [],
      topByCpu: [],
      trend: {
        schemaVersion: "kova.resourceTrend.v1",
        available: true,
        totalRssGrowthMb: 420,
        gatewayRssGrowthMb: 390
      }
    };
    const loopResult = {
      command: "node support/run-soak-loop.mjs --env kova-self-check --duration-ms 60000",
      status: 0,
      timedOut: false,
      durationMs: 65000,
      stdout: JSON.stringify(loopSummary),
      stderr: "",
      resourceSamples
    };
    const record = {
      scenario: "soak",
      status: "PASS",
      phases: [{
        id: "loop",
        results: [loopResult],
        metrics: { service: { gatewayState: "running" }, logs: zeroLogMetrics() }
      }],
      finalMetrics: { service: { gatewayState: "running" }, logs: zeroLogMetrics() }
    };
    const scenario = {
      id: "soak",
      thresholds: {
        soakMinDurationMs: 60000,
        soakCommandP95Ms: 10000,
        soakHealthP95Ms: 1000,
        soakCommandFailures: 0,
        soakHealthFailures: 0,
        rssGrowthMb: 300,
        gatewayRssGrowthMb: 300
      }
    };
    const context = { surface: { thresholds: {} }, targetPlan: { kind: "npm" } };

    evaluateRecord(record, scenario, context);

    assertEqual(record.status, "FAIL", "soak trend record status");
    const { measurements } = record;
    assertEqual(measurements.soakIterations, 3, "soak iterations");
    assertEqual(measurements.soakCommandP95Ms, 900, "soak command p95");
    assertEqual(measurements.rssGrowthMb, 420, "soak total RSS growth");
    assertEqual(measurements.gatewayRssGrowthMb, 390, "soak gateway RSS growth");
    const hasRssViolation = record.violations.some((violation) => violation.metric === "rssGrowthMb");
    assertEqual(hasRssViolation, true, "soak RSS growth violation");
  } catch (error) {
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check: runs `evaluateRecord` over synthetic MCP bridge smoke evidence, first
 * for a clean run and then for a run whose bridge process did not exit.
 *
 * The clean record must stay PASS and expose the initialize, tools/list, and
 * shutdown timings, the tool count, and zero process leaks as measurements. The
 * second record reuses the evaluated one with status, violations, and measurements
 * reset and `processExited: false` in the smoke payload. It must become FAIL with
 * an `mcpProcessLeaks` violation.
 *
 * @returns {object} Check outcome: `id`, `status` ("PASS" or "FAIL"), `command`,
 *   `durationMs` (always 0), plus `message` when the check failed.
 */
function mcpBridgeEvidenceEvaluationCheck() {
  const outcome = {
    id: "mcp-bridge-evidence-evaluation",
    status: "PASS",
    command: "evaluate synthetic MCP bridge evidence",
    durationMs: 0
  };

  try {
    const smoke = {
      schemaVersion: "kova.mcpBridgeSmoke.v1",
      durationMs: 1800,
      initializeMs: 120,
      toolsListMs: 90,
      shutdownMs: 45,
      toolCount: 8,
      toolNames: ["conversations_list", "messages_read"],
      processExited: true,
      exitStatus: 0,
      exitSignal: null,
      errors: []
    };
    // Both records use the same phase shape; only the smoke payload on stdout differs.
    const bridgePhase = (payload) => ({
      id: "mcp-bridge",
      results: [{
        command: "node support/mcp-bridge-smoke.mjs --env kova-self-check --artifact-dir /tmp/kova",
        status: 0,
        timedOut: false,
        durationMs: 1800,
        stdout: JSON.stringify(payload),
        stderr: ""
      }],
      metrics: { service: { gatewayState: "running" }, logs: zeroLogMetrics() }
    });
    const npmContext = () => ({ surface: { thresholds: {} }, targetPlan: { kind: "npm" } });

    const record = {
      scenario: "mcp-runtime-start-stop",
      status: "PASS",
      phases: [bridgePhase(smoke)],
      finalMetrics: { service: { gatewayState: "running" }, logs: zeroLogMetrics() }
    };
    evaluateRecord(record, {
      id: "mcp-runtime-start-stop",
      thresholds: {
        mcpInitializeMs: 10000,
        mcpToolsListMs: 10000,
        mcpShutdownMs: 5000,
        mcpToolCountMin: 1,
        mcpProcessLeaks: 0,
        pluginLoadFailures: 0
      }
    }, npmContext());

    assertEqual(record.status, "PASS", "MCP bridge record status");
    const { measurements } = record;
    assertEqual(measurements.mcpInitializeMs, 120, "MCP initialize ms");
    assertEqual(measurements.mcpToolsListMs, 90, "MCP tools/list ms");
    assertEqual(measurements.mcpShutdownMs, 45, "MCP shutdown ms");
    assertEqual(measurements.mcpToolCount, 8, "MCP tool count");
    assertEqual(measurements.mcpProcessLeaks, 0, "MCP process leak count");

    // Second pass: same record, evaluation state reset, bridge process never exited.
    const leaked = {
      ...record,
      status: "PASS",
      violations: [],
      measurements: undefined,
      phases: [bridgePhase({ ...smoke, processExited: false })]
    };
    evaluateRecord(leaked, {
      id: "mcp-runtime-start-stop",
      thresholds: { mcpProcessLeaks: 0 }
    }, npmContext());
    assertEqual(leaked.status, "FAIL", "MCP leaked process status");
    const hasLeakViolation = leaked.violations.some((violation) => violation.metric === "mcpProcessLeaks");
    assertEqual(hasLeakViolation, true, "MCP process leak violation");
  } catch (error) {
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check: runs `evaluateRecord` over synthetic browser automation smoke
 * evidence, first for a clean run and then for a run whose browser failed to stop.
 *
 * The clean record must stay PASS and expose the start, open, and snapshot timings,
 * the tab count, and zero process leaks as measurements. The second record reuses
 * the evaluated one with status, violations, and measurements reset, and a smoke
 * payload carrying `browserStopped: false` and a stop error. It must become FAIL
 * with a `browserProcessLeaks` violation.
 *
 * @returns {object} Check outcome: `id`, `status` ("PASS" or "FAIL"), `command`,
 *   `durationMs` (always 0), plus `message` when the check failed.
 */
function browserAutomationEvidenceEvaluationCheck() {
  const outcome = {
    id: "browser-automation-evidence-evaluation",
    status: "PASS",
    command: "evaluate synthetic browser automation evidence",
    durationMs: 0
  };

  try {
    const smoke = {
      schemaVersion: "kova.browserAutomationSmoke.v1",
      durationMs: 4200,
      browserDoctorMs: 120,
      browserStartMs: 1800,
      browserTabsMs: 90,
      browserOpenMs: 300,
      browserSnapshotMs: 250,
      browserStopMs: 180,
      browserTabCount: 2,
      browserSnapshotOk: true,
      browserStopped: true,
      errors: []
    };
    // Both records use the same phase shape; only the smoke payload on stdout differs.
    const smokePhase = (payload) => ({
      id: "browser-smoke",
      results: [{
        command: "node support/browser-automation-smoke.mjs --env kova-self-check --artifact-dir /tmp/kova",
        status: 0,
        timedOut: false,
        durationMs: 4200,
        stdout: JSON.stringify(payload),
        stderr: ""
      }],
      metrics: { service: { gatewayState: "running" }, logs: zeroLogMetrics() }
    });
    const npmContext = () => ({ surface: { thresholds: {} }, targetPlan: { kind: "npm" } });

    const record = {
      scenario: "browser-automation-smoke",
      status: "PASS",
      phases: [smokePhase(smoke)],
      finalMetrics: { service: { gatewayState: "running" }, logs: zeroLogMetrics() }
    };
    evaluateRecord(record, {
      id: "browser-automation-smoke",
      thresholds: {
        browserDoctorMs: 15000,
        browserStartMs: 30000,
        browserTabsMs: 10000,
        browserOpenMs: 15000,
        browserSnapshotMs: 15000,
        browserStopMs: 10000,
        browserTabCountMin: 1,
        browserProcessLeaks: 0
      }
    }, npmContext());

    assertEqual(record.status, "PASS", "browser automation record status");
    const { measurements } = record;
    assertEqual(measurements.browserStartMs, 1800, "browser start ms");
    assertEqual(measurements.browserOpenMs, 300, "browser open ms");
    assertEqual(measurements.browserSnapshotMs, 250, "browser snapshot ms");
    assertEqual(measurements.browserTabCount, 2, "browser tab count");
    assertEqual(measurements.browserProcessLeaks, 0, "browser process leak count");

    // Second pass: same record, evaluation state reset, browser left running.
    const failed = {
      ...record,
      status: "PASS",
      violations: [],
      measurements: undefined,
      phases: [smokePhase({ ...smoke, browserStopped: false, errors: ["browser stop failed"] })]
    };
    evaluateRecord(failed, {
      id: "browser-automation-smoke",
      thresholds: { browserProcessLeaks: 0 }
    }, npmContext());
    assertEqual(failed.status, "FAIL", "browser failed stop status");
    const hasLeakViolation = failed.violations.some((violation) => violation.metric === "browserProcessLeaks");
    assertEqual(hasLeakViolation, true, "browser process leak violation");
  } catch (error) {
    return { ...outcome, status: "FAIL", message: error.message };
  }
  return outcome;
}

/**
 * Self-check for media-understanding timeout evidence evaluation.
 *
 * Runs a synthetic record through `evaluateRecord` with a smoke payload that
 * reports an observed media timeout and asserts the resulting status and
 * measurements. It then evaluates a degraded copy (timeout not observed,
 * gateway status not working, zero provider requests) and asserts that the
 * record fails with the expected violations.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A PASS result when every assertion holds; otherwise a FAIL result whose
 *   `message` is the thrown error's message.
 */
function mediaUnderstandingEvidenceEvaluationCheck() {
  const checkId = "media-understanding-evidence-evaluation";
  const checkCommand = "evaluate synthetic media understanding timeout evidence";
  const scenarioId = "media-understanding-timeout";
  // Factories return fresh objects on every call, so nothing built here is shared between uses.
  const runningMetrics = () => ({ service: { gatewayState: "running" }, logs: zeroLogMetrics() });
  const evaluationContext = () => ({ surface: { thresholds: {} }, targetPlan: { kind: "npm" } });
  const timeoutPhase = (payload) => ({
    id: "media-timeout",
    results: [{
      command: "node support/media-understanding-timeout.mjs --env kova-self-check --artifact-dir /tmp/kova",
      status: 0,
      timedOut: false,
      durationMs: 1600,
      stdout: JSON.stringify(payload),
      stderr: ""
    }],
    metrics: runningMetrics()
  });

  try {
    const healthyPayload = {
      schemaVersion: "kova.mediaUnderstandingTimeout.v1",
      ok: true,
      durationMs: 1600,
      mediaDescribeMs: 1250,
      mediaTimeoutObserved: true,
      mediaCommandTimedOut: false,
      mediaCommandStatus: 1,
      mediaStatusAfterTimeoutMs: 180,
      gatewayStatusWorks: true,
      errors: []
    };
    const record = {
      scenario: scenarioId,
      status: "PASS",
      providerEvidence: { requestCount: 1 },
      phases: [timeoutPhase(healthyPayload)],
      finalMetrics: runningMetrics()
    };
    evaluateRecord(record, {
      id: scenarioId,
      thresholds: {
        mediaDescribeMs: 10000,
        mediaTimeoutObserved: 1,
        mediaStatusAfterTimeoutMs: 10000,
        providerRequestCountMin: 1
      }
    }, evaluationContext());

    assertEqual(record.status, "PASS", "media understanding record status");
    const expectedMeasurements = [
      ["mediaDescribeMs", 1250, "media describe ms"],
      ["mediaTimeoutObserved", true, "media timeout observed"],
      ["mediaCommandTimedOut", false, "media command did not hit outer timeout"],
      ["mediaStatusAfterTimeoutMs", 180, "post-media status ms"],
      ["mediaGatewayStatusWorks", true, "gateway status after media timeout"]
    ];
    for (const [metric, expected, label] of expectedMeasurements) {
      assertEqual(record.measurements[metric], expected, label);
    }

    // Copy of the evaluated record, reset to a clean slate and given a degraded smoke payload.
    const degraded = {
      ...record,
      status: "PASS",
      providerEvidence: { requestCount: 0 },
      violations: [],
      measurements: undefined,
      phases: [timeoutPhase({
        ...healthyPayload,
        ok: false,
        mediaTimeoutObserved: false,
        gatewayStatusWorks: false,
        errors: ["media timeout not observed"]
      })]
    };
    evaluateRecord(degraded, {
      id: scenarioId,
      thresholds: {
        mediaTimeoutObserved: 1,
        providerRequestCountMin: 1
      }
    }, evaluationContext());

    const reportsViolation = (metric) => degraded.violations.some((entry) => entry.metric === metric);
    assertEqual(degraded.status, "FAIL", "media failure status");
    assertEqual(reportsViolation("mediaTimeoutObserved"), true, "media timeout observed violation");
    assertEqual(reportsViolation("providerRequestCountMin"), true, "media provider request count violation");

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for agent network-offline evidence evaluation.
 *
 * Evaluates a synthetic record whose smoke payload reports an observed network
 * failure with a still-working gateway and asserts the resulting status and
 * measurements. It then evaluates a degraded copy (failure not observed,
 * gateway status not working) and asserts the record fails with the
 * `networkFailureObserved` and `networkGatewayStatusWorks` violations.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A PASS result when every assertion holds; otherwise a FAIL result whose
 *   `message` is the thrown error's message.
 */
function networkOfflineEvidenceEvaluationCheck() {
  const checkId = "network-offline-evidence-evaluation";
  const checkCommand = "evaluate synthetic network offline evidence";
  const scenarioId = "agent-network-offline";
  // Factories return fresh objects on every call, so nothing built here is shared between uses.
  const runningMetrics = () => ({ service: { gatewayState: "running" }, logs: zeroLogMetrics() });
  const evaluationContext = () => ({ surface: { thresholds: {} }, targetPlan: { kind: "npm" } });
  const offlineTurnPhase = (payload) => ({
    id: "network-offline-turn",
    results: [{
      command: "node support/agent-network-offline.mjs --env kova-self-check --artifact-dir /tmp/kova",
      status: 0,
      timedOut: false,
      durationMs: 1800,
      stdout: JSON.stringify(payload),
      stderr: ""
    }],
    metrics: runningMetrics()
  });

  try {
    const healthyPayload = {
      schemaVersion: "kova.agentNetworkOffline.v1",
      ok: true,
      durationMs: 1800,
      networkTurnMs: 1400,
      networkFailureObserved: true,
      networkCommandTimedOut: false,
      networkCommandStatus: 1,
      networkStatusAfterFailureMs: 190,
      gatewayStatusWorks: true,
      errors: []
    };
    const record = {
      scenario: scenarioId,
      status: "PASS",
      phases: [offlineTurnPhase(healthyPayload)],
      finalMetrics: runningMetrics()
    };
    evaluateRecord(record, {
      id: scenarioId,
      thresholds: {
        networkFailureObserved: 1,
        networkStatusAfterFailureMs: 10000
      }
    }, evaluationContext());

    assertEqual(record.status, "PASS", "network offline record status");
    const expectedMeasurements = [
      ["networkTurnMs", 1400, "network turn ms"],
      ["networkFailureObserved", true, "network failure observed"],
      ["networkCommandTimedOut", false, "network command did not hit outer timeout"],
      ["networkStatusAfterFailureMs", 190, "post-network status ms"],
      ["networkGatewayStatusWorks", true, "gateway status after network failure"]
    ];
    for (const [metric, expected, label] of expectedMeasurements) {
      assertEqual(record.measurements[metric], expected, label);
    }

    // Copy of the evaluated record, reset to a clean slate and given a degraded smoke payload.
    const degraded = {
      ...record,
      status: "PASS",
      violations: [],
      measurements: undefined,
      phases: [offlineTurnPhase({
        ...healthyPayload,
        ok: false,
        networkFailureObserved: false,
        gatewayStatusWorks: false,
        errors: ["network failure not observed"]
      })]
    };
    evaluateRecord(degraded, {
      id: scenarioId,
      thresholds: {
        networkFailureObserved: 1
      }
    }, evaluationContext());

    const reportsViolation = (metric) => degraded.violations.some((entry) => entry.metric === metric);
    assertEqual(degraded.status, "FAIL", "network failure status");
    assertEqual(reportsViolation("networkFailureObserved"), true, "network failure observed violation");
    assertEqual(reportsViolation("networkGatewayStatusWorks"), true, "network gateway status violation");

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for cold/warm agent turn attribution.
 *
 * Builds a synthetic two-phase record (a 62 s cold turn and a 2 s warm turn)
 * together with one provider request per turn, evaluates it, and asserts the
 * derived turn durations, pre-provider latencies, latency diagnosis and
 * per-turn evidence. The record is expected to FAIL evaluation. Finally it
 * asserts that the paste summary mentions the cold/warm delta.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A PASS result when every assertion holds; otherwise a FAIL result whose
 *   `message` is the thrown error's message.
 */
function agentColdWarmEvaluationCheck() {
  const checkId = "agent-cold-warm-evaluation";
  const checkCommand = "evaluate synthetic cold/warm agent provider attribution";
  const scenarioId = "agent-cold-warm-message";
  // The cold and the warm turn use the same command line and session id.
  const turnCommand = "ocm @kova -- agent --local --agent main --session-id kova-agent-cold-warm --message hi --json";
  const agentTurnPhase = (id, timing) => ({
    id,
    results: [{
      command: turnCommand,
      status: 0,
      timedOut: false,
      ...timing,
      stdout: "{\"finalAssistantVisibleText\":\"KOVA_AGENT_OK\"}",
      stderr: ""
    }],
    metrics: { logs: zeroLogMetrics(), health: { ok: true } }
  });
  const providerRequest = (requestId, timing, firstLatencyMs) => ({
    requestId,
    ...timing,
    firstByteLatencyMs: firstLatencyMs,
    firstChunkLatencyMs: firstLatencyMs,
    route: "/v1/responses",
    model: "gpt-5.5",
    stream: true,
    status: 200,
    statusClass: "2xx"
  });

  try {
    const record = {
      scenario: scenarioId,
      status: "PASS",
      auth: { mode: "mock", source: "mock", providerId: "openai" },
      phases: [
        agentTurnPhase("cold-agent-turn", {
          startedAt: "2026-04-30T10:00:01.000Z",
          startedAtEpochMs: 1777543201000,
          finishedAt: "2026-04-30T10:01:03.000Z",
          finishedAtEpochMs: 1777543263000,
          durationMs: 62000
        }),
        agentTurnPhase("warm-agent-turn", {
          startedAt: "2026-04-30T10:01:10.000Z",
          startedAtEpochMs: 1777543270000,
          finishedAt: "2026-04-30T10:01:12.000Z",
          finishedAtEpochMs: 1777543272000,
          durationMs: 2000
        })
      ],
      providerEvidence: {
        available: true,
        requestCount: 2,
        requests: [
          providerRequest("cold-provider", {
            receivedAt: "2026-04-30T10:01:02.000Z",
            receivedAtEpochMs: 1777543262000,
            respondedAt: "2026-04-30T10:01:02.800Z",
            respondedAtEpochMs: 1777543262800
          }, 50),
          providerRequest("warm-provider", {
            receivedAt: "2026-04-30T10:01:10.500Z",
            receivedAtEpochMs: 1777543270500,
            respondedAt: "2026-04-30T10:01:11.300Z",
            respondedAtEpochMs: 1777543271300
          }, 40)
        ]
      },
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics()
      }
    };

    evaluateRecord(record, {
      id: scenarioId,
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: {
        preProviderMs: 10000,
        coldWarmDeltaMs: 30000,
        providerFinalMs: 3000,
        preProviderDominanceRatio: 0.8
      }
    }, { surface: { thresholds: {} }, targetPlan: { kind: "npm" } });

    assertEqual(record.status, "FAIL", "cold pre-provider stall should fail");
    const expectedMeasurements = [
      ["agentTurnCount", 2, "agent turn count"],
      ["coldAgentTurnMs", 62000, "cold turn duration"],
      ["warmAgentTurnMs", 2000, "warm turn duration"],
      ["agentColdWarmDeltaMs", 60000, "cold warm delta"],
      ["coldPreProviderMs", 61000, "cold pre-provider latency"],
      ["warmPreProviderMs", 500, "warm pre-provider latency"],
      ["coldProviderFinalMs", 800, "cold provider final"]
    ];
    for (const [metric, expected, label] of expectedMeasurements) {
      assertEqual(record.measurements[metric], expected, label);
    }
    assertEqual(record.measurements.agentLatencyDiagnosis.kind, "cold-pre-provider-stall", "latency diagnosis kind");
    assertEqual(record.measurements.agentTurns[0].responseOk, true, "cold response ok");
    assertEqual(record.measurements.agentTurns[1].providerRoutes[0].value, "/v1/responses", "warm provider route evidence");

    const pasteSummary = renderPasteSummary({
      runId: "self-check-cold-warm",
      target: "runtime:stable",
      mode: "self-check",
      platform: { os: "test", release: "test", arch: "test" },
      records: [record]
    });
    assertEqual(
      pasteSummary.includes("cold-warm delta 60000ms"),
      true,
      "paste summary includes cold/warm evidence"
    );

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for source-build versus release-runtime report comparison.
 *
 * Covers three comparisons built from synthetic reports:
 *  1. release (no timeline) vs. source build (with timeline), asserted to pass
 *     with one pair and one informational note;
 *  2. release vs. source build without a timeline, asserted to fail with one
 *     blocker that shows up in the rendered summary;
 *  3. a failing source report vs. a fixed one, asserted to pass and to report
 *     one status improvement and one resolved finding.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A PASS result when every assertion holds; otherwise a FAIL result whose
 *   `message` is the thrown error's message.
 */
function sourceReleaseCompareCheck() {
  const checkId = "source-release-compare";
  const checkCommand = "evaluate synthetic source-build versus release-runtime comparison";
  // Source-build reports differ only in run id, timeline flag and timings.
  const localBuildReport = (runId, timelineAvailable, preProviderMs, slowestSpanMs) =>
    syntheticCompareReport({
      runId,
      target: "local-build:/tmp/openclaw",
      timelineAvailable,
      preProviderMs,
      slowestSpanMs
    });

  try {
    const releaseReport = syntheticCompareReport({
      runId: "release-run",
      target: "npm:2026.4.27",
      timelineAvailable: false,
      preProviderMs: 62000,
      slowestSpanMs: null
    });
    const sourceReport = localBuildReport("source-run", true, 4000, 3200);

    const comparison = compareReports(releaseReport, sourceReport);
    assertEqual(comparison.ok, true, "source/release comparison with source timeline should pass");
    assertEqual(comparison.sourceRelease?.pairCount, 1, "source/release pair count");
    assertEqual(comparison.sourceRelease?.infoCount, 1, "release missing timeline should be informational");
    const firstPair = comparison.sourceRelease?.pairs?.[0];
    assertEqual(firstPair?.source?.timelineAvailable, true, "source timeline available");
    assertEqual(firstPair?.release?.timelineAvailable, false, "release timeline missing");

    const sourceWithoutTimeline = localBuildReport("source-no-timeline", false, 4000, null);
    const missingTimelineComparison = compareReports(releaseReport, sourceWithoutTimeline);
    assertEqual(missingTimelineComparison.ok, false, "source missing timeline should fail comparison");
    assertEqual(missingTimelineComparison.sourceRelease?.blockingCount, 1, "source missing timeline blocking count");
    const blockerSummary = renderCompareSummary(missingTimelineComparison);
    assertEqual(
      blockerSummary.includes("source-build report did not include OpenClaw timeline diagnostics"),
      true,
      "compare summary includes source timeline blocker"
    );

    // Turn an otherwise passing synthetic report into a failing baseline.
    const failingReport = localBuildReport("gateway-rss-failing", true, 4000, 3200);
    failingReport.summary = { statuses: { FAIL: 1 } };
    Object.assign(failingReport.records[0], {
      status: "FAIL",
      violations: [{
        metric: "resourcePeakGatewayRssMb",
        message: "gateway peak RSS 701.8 MB exceeded threshold 700 MB"
      }]
    });
    const fixedReport = localBuildReport("gateway-rss-fixed", true, 3800, 3000);

    const fixedComparison = compareReports(failingReport, fixedReport);
    assertEqual(fixedComparison.ok, true, "resolved failure comparison should pass");
    assertEqual(fixedComparison.statusChanges.improvements.length, 1, "status improvement count");
    assertEqual(fixedComparison.findingChanges.resolved.length, 1, "resolved finding count");
    const resolvedSummary = renderCompareSummary(fixedComparison);
    assertEqual(
      resolvedSummary.includes("RESOLVED FAIL agent-cold-warm-message/mock-openai-provider"),
      true,
      "compare summary includes resolved finding"
    );

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Builds a single-record synthetic execution report for comparison checks.
 *
 * The record always describes the "agent-cold-warm-message" scenario on the
 * "agent-cli-local-turn" surface with a PASS status. Turn durations are the
 * given pre-provider latency plus a fixed 800 ms provider phase.
 *
 * @param {object} options
 * @param {string} options.runId - Run identifier copied onto the report.
 * @param {string} options.target - Target label copied onto the report.
 * @param {boolean} options.timelineAvailable - Whether timeline diagnostics are
 *   reported; when truthy the record carries 20 timeline events and names
 *   "agent.prepare" as the slowest span, otherwise 0 events and no span name.
 * @param {number} options.preProviderMs - Pre-provider latency in milliseconds.
 * @param {number|null} options.slowestSpanMs - Duration reported for the slowest span.
 * @returns {object} The synthetic report.
 */
function syntheticCompareReport({ runId, target, timelineAvailable, preProviderMs, slowestSpanMs }) {
  const turnMs = preProviderMs + 800;
  let timelineEventCount = 0;
  let slowestSpanName = null;
  if (timelineAvailable) {
    timelineEventCount = 20;
    slowestSpanName = "agent.prepare";
  }

  const measurements = {
    openclawTimelineAvailable: timelineAvailable,
    openclawTimelineEventCount: timelineEventCount,
    openclawSlowestSpanName: slowestSpanName,
    openclawSlowestSpanMs: slowestSpanMs,
    coldAgentTurnMs: turnMs,
    coldPreProviderMs: preProviderMs,
    coldProviderFinalMs: 800,
    agentTurnMs: turnMs,
    agentPreProviderMs: preProviderMs,
    agentProviderFinalMs: 800,
    runtimeDepsStagingMs: 0,
    peakRssMb: 100
  };
  const record = {
    scenario: "agent-cold-warm-message",
    surface: "agent-cli-local-turn",
    state: { id: "mock-openai-provider" },
    status: "PASS",
    measurements
  };

  return {
    runId,
    mode: "execution",
    target,
    generatedAt: "2026-05-01T00:00:00.000Z",
    platform: { os: "darwin", arch: "arm64", release: "test", node: "test" },
    summary: { statuses: { PASS: 1 } },
    records: [record]
  };
}

/**
 * Self-check for the diagnostics timeline parser.
 *
 * Reads `fixtures/diagnostics/timeline.jsonl` (resolved against the current
 * working directory), parses it with `parseTimelineText`, and asserts the
 * summarised event count, repeated spans, runtime-deps, event-loop, provider,
 * child-process and key-span figures.
 *
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Resolves to a PASS result when every assertion holds; otherwise to a FAIL
 *   result whose `message` is the thrown error's message (this includes a
 *   failure to read the fixture).
 */
async function diagnosticsTimelineCheck() {
  const checkId = "diagnostics-timeline-parser";
  const checkCommand = "parse fixtures/diagnostics/timeline.jsonl";

  try {
    const timeline = parseTimelineText(await readFile("fixtures/diagnostics/timeline.jsonl", "utf8"));

    // Each probe is lazy: its value is read immediately before its own assertion runs.
    const probes = [
      [() => timeline.available, true, "timeline available"],
      [() => timeline.eventCount, 8, "timeline event count"],
      [() => timeline.parseErrorCount, 0, "timeline parse errors"],
      [
        () => timeline.repeatedSpans.some((span) => span.name === "plugins.metadata.scan"),
        true,
        "repeated plugin metadata span"
      ],
      [() => timeline.runtimeDeps.slowest?.pluginId, "browser", "runtime deps slowest plugin"],
      [() => timeline.runtimeDeps.byPlugin[1]?.pluginId, "memory-core", "runtime deps by plugin"],
      [() => timeline.eventLoop.maxMs, 214, "event loop max"],
      [() => timeline.providers.maxDurationMs, 1220, "provider duration"],
      [() => timeline.childProcesses.failedCount, 1, "child process failures"],
      [() => timeline.keySpans["gateway.startup"].maxDurationMs, 2450, "gateway startup key span"]
    ];
    for (const [read, expected, label] of probes) {
      assertEqual(read(), expected, label);
    }

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for open-span handling in the diagnostics timeline parser.
 *
 * Reads `fixtures/diagnostics/timeline-open-span.jsonl` (resolved against the
 * current working directory), parses it with `parseTimelineText`, and asserts
 * that exactly one open `runtimeDeps.stage` span with an age of 5000 is
 * reported, both in the open-span list and in the key-span summary.
 *
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   Resolves to a PASS result when every assertion holds; otherwise to a FAIL
 *   result whose `message` is the thrown error's message (this includes a
 *   failure to read the fixture).
 */
async function diagnosticsOpenSpanCheck() {
  const checkId = "diagnostics-open-span-parser";
  const checkCommand = "parse fixtures/diagnostics/timeline-open-span.jsonl";

  try {
    const timeline = parseTimelineText(await readFile("fixtures/diagnostics/timeline-open-span.jsonl", "utf8"));

    // Each probe is lazy: its value is read immediately before its own assertion runs.
    const probes = [
      [() => timeline.available, true, "open timeline available"],
      [() => timeline.openSpanCount, 1, "open span count"],
      [() => timeline.openSpans[0]?.name, "runtimeDeps.stage", "open span name"],
      [() => timeline.openSpans[0]?.ageMs, 5000, "open span age"],
      [() => timeline.keySpans["runtimeDeps.stage"].openCount, 1, "key open span count"]
    ];
    for (const [read, expected, label] of probes) {
      assertEqual(read(), expected, label);
    }

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for how record evaluation treats diagnostic timelines.
 *
 * Evaluates three synthetic local-build records under a profile that requires
 * a timeline and a surface that expects a `runtimeDeps.stage` span:
 *  1. a record whose timeline is unavailable;
 *  2. a record whose timeline lacks the expected span;
 *  3. a record whose timeline (parsed from inline JSONL) has a
 *     `runtimeDeps.stage` span start with no matching end.
 * Each is asserted to FAIL with its specific violation metric. The third
 * record is additionally rendered as a structured report summary and as a
 * paste summary, and the open-span evidence is asserted in both.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A PASS result when every assertion holds; otherwise a FAIL result whose
 *   `message` is the thrown error's message.
 */
function diagnosticsTimelineEvaluationCheck() {
  const checkId = "diagnostics-timeline-evaluation";
  const checkCommand = "evaluate synthetic diagnostic timeline records";
  // The timeline is supplied lazily so it is built after the log metrics, in property order.
  const diagnosticRecord = (scenario, makeTimeline) => ({
    scenario,
    status: "PASS",
    phases: [],
    finalMetrics: {
      service: { gatewayState: "running" },
      logs: zeroLogMetrics(),
      timeline: makeTimeline()
    }
  });
  // Hand-written timeline summary; `spanTotals` is only present when one is given.
  const syntheticTimeline = (available, eventCount, spanTotals) => ({
    available,
    eventCount,
    parseErrorCount: 0,
    openSpanCount: 0,
    openSpans: [],
    keySpans: {},
    ...(spanTotals ? { spanTotals } : {}),
    runtimeDeps: {},
    eventLoop: {},
    providers: {},
    childProcesses: {}
  });
  const bundledDepsContext = () => ({
    targetPlan: { kind: "local-build" },
    profile: { id: "diagnostic", diagnostics: { timelineRequired: true } },
    surface: {
      id: "bundled-runtime-deps",
      diagnostics: { expectedSpans: ["runtimeDeps.stage"] },
      thresholds: {}
    }
  });
  const reportsViolation = (record, metric) => record.violations.some((entry) => entry.metric === metric);

  try {
    const missingTimelineRecord = diagnosticRecord(
      "diagnostic-missing-timeline",
      () => syntheticTimeline(false, 0)
    );
    evaluateRecord(missingTimelineRecord, { thresholds: {} }, {
      targetPlan: { kind: "local-build" },
      profile: {
        id: "diagnostic",
        diagnostics: {
          timelineRequired: true,
          timelineRequiredForTargetKinds: ["local-build"]
        }
      },
      surface: {
        id: "release-runtime-startup",
        diagnostics: { expectedSpans: ["runtimeDeps.stage"] },
        thresholds: {}
      }
    });
    assertEqual(missingTimelineRecord.status, "FAIL", "missing diagnostic timeline status");
    assertEqual(
      reportsViolation(missingTimelineRecord, "openclawTimelineAvailable"),
      true,
      "missing diagnostic timeline violation"
    );

    const missingSpanRecord = diagnosticRecord(
      "diagnostic-missing-span",
      () => syntheticTimeline(true, 1, {
        "gateway.startup": { count: 1, totalDurationMs: 100, maxDurationMs: 100 }
      })
    );
    evaluateRecord(missingSpanRecord, { thresholds: {} }, bundledDepsContext());
    assertEqual(missingSpanRecord.status, "FAIL", "missing required span status");
    assertEqual(missingSpanRecord.measurements.openclawMissingRequiredSpanCount, 1, "missing required span measurement");
    assertEqual(
      reportsViolation(missingSpanRecord, "openclawMissingRequiredSpanCount"),
      true,
      "missing required span violation"
    );

    const openSpanJsonl = [
      "{\"type\":\"span.start\",\"timestamp\":\"2026-04-29T15:30:00.000Z\",\"name\":\"runtimeDeps.stage\",\"spanId\":\"1\"}",
      "{\"type\":\"eventLoop.sample\",\"timestamp\":\"2026-04-29T15:30:06.000Z\",\"name\":\"eventLoop\",\"maxMs\":400}"
    ];
    const openSpanRecord = diagnosticRecord(
      "diagnostic-open-span",
      () => parseTimelineText(openSpanJsonl.join("\n"))
    );
    evaluateRecord(openSpanRecord, { thresholds: {} }, bundledDepsContext());
    assertEqual(openSpanRecord.status, "FAIL", "open required span status");
    assertEqual(openSpanRecord.measurements.openclawOpenRequiredSpanCount, 1, "open required span measurement");
    assertEqual(
      reportsViolation(openSpanRecord, "openclawOpenRequiredSpanCount"),
      true,
      "open required span violation"
    );

    const reportSummary = renderReportSummary({
      schemaVersion: "kova.report.v1",
      generatedAt: "2026-04-29T15:30:10.000Z",
      runId: "self-check-diagnostics",
      summary: { total: 1, statuses: { FAIL: 1 } },
      records: [openSpanRecord]
    }, { structured: true });
    assertEqual(
      reportSummary.scenarios[0]?.measurements?.diagnostics?.openRequiredSpanCount,
      1,
      "structured report open span evidence"
    );
    assertEqual(
      reportSummary.scenarios[0]?.measurements?.diagnostics?.openSpans?.[0]?.name,
      "runtimeDeps.stage",
      "structured report open span name"
    );

    const pasteSummary = renderPasteSummary({
      runId: "self-check-diagnostics",
      target: "local-build:/tmp/openclaw",
      mode: "self-check",
      records: [openSpanRecord]
    });
    assertEqual(
      pasteSummary.includes("openRequiredSpans: 1"),
      true,
      "brief evidence includes open required spans"
    );

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for the runtime-dependency log summariser.
 *
 * Feeds five synthetic log lines (two staging/install pairs and one
 * `runtime-postbuild` line) to `summarizeRuntimeDepsLogs` and asserts the stage,
 * install and postbuild counts, the maximum durations, and that the "browser"
 * plugin id is reported.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A PASS result when every assertion holds; otherwise a FAIL result whose
 *   `message` is the thrown error's message.
 */
function runtimeDepsLogParserCheck() {
  const checkId = "runtime-deps-log-parser";
  const checkCommand = "parse synthetic OpenClaw runtime dependency logs";

  try {
    const logLines = [
      "21:22:15 [plugins] browser staging bundled runtime deps (6 specs): @modelcontextprotocol/sdk@1.29.0, commander@^14.0.3",
      "21:22:19 [plugins] browser installed bundled runtime deps in 3964ms: @modelcontextprotocol/sdk@1.29.0, commander@^14.0.3",
      "21:22:19 [plugins] memory-core staging bundled runtime deps (2 specs): chokidar@^5.0.0, typebox@1.1.33",
      "21:22:20 [plugins] memory-core installed bundled runtime deps in 1529ms: chokidar@^5.0.0, typebox@1.1.33",
      "runtime-postbuild: bundled plugin runtime deps completed in 45226ms"
    ];
    const summary = summarizeRuntimeDepsLogs(logLines.join("\n"));

    const expectedFields = [
      ["stageCount", 2, "runtime deps stage count"],
      ["installCount", 2, "runtime deps install count"],
      ["installMaxMs", 3964, "runtime deps install max"],
      ["postbuildCount", 1, "runtime deps postbuild count"],
      ["postbuildMaxMs", 45226, "runtime deps postbuild max"]
    ];
    for (const [field, expected, label] of expectedFields) {
      assertEqual(summary[field], expected, label);
    }
    assertEqual(summary.pluginIds.includes("browser"), true, "runtime deps browser plugin");

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for embedded-run trace and liveness-warning log parsing.
 *
 * Summarises three synthetic log lines (an embedded-run startup trace, an
 * embedded-run prep trace and a liveness warning) with
 * `summarizeEmbeddedRunTraces` and `summarizeLivenessWarnings`, asserts the
 * counts and stage figures, then feeds the embedded summary into
 * `buildAgentTurnBreakdown` and asserts that the mapped category, the unmapped
 * `attempt-dispatch` stage and the markdown rendering all carry the evidence.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A PASS result when every assertion holds; otherwise a FAIL result whose
 *   `message` is the thrown error's message.
 */
function embeddedRunLogParserCheck() {
  const checkId = "embedded-run-log-parser";
  const checkCommand = "parse synthetic OpenClaw embedded-run and liveness logs";

  try {
    const logLines = [
      "[agent/embedded] [trace:embedded-run] startup stages: runId=53b2 sessionId=ocm-direct-live-1 phase=attempt-dispatch totalMs=11948 stages=workspace:0ms@0ms,runtime-plugins:7325ms@7325ms,hooks:0ms@7325ms,model-resolution:1035ms@8360ms,auth:2045ms@10405ms,context-engine:1ms@10406ms,attempt-dispatch:1542ms@11948ms",
      "[agent/embedded] [trace:embedded-run] prep stages: runId=53b2 sessionId=ocm-direct-live-1 phase=stream-setup totalMs=10988 stages=workspace-sandbox:3ms@3ms,skills:0ms@3ms,core-plugin-tools:4688ms@4691ms,bootstrap-context:6ms@4697ms,bundle-tools:519ms@5216ms,system-prompt:2688ms@7904ms,session-resource-loader:526ms@8430ms,agent-session:1ms@8431ms,stream-setup:2557ms@10988ms",
      "[diagnostic] liveness warning: reasons=eventLoopDelay interval=10000ms eventLoopDelayP99Ms=116.9 eventLoopDelayMaxMs=9982.4 eventLoopUtilization=0.688 cpuCoreRatio=0.701 active=1 waiting=0 queued=0"
    ];
    const logText = logLines.join("\n");
    const embeddedRuns = summarizeEmbeddedRunTraces(logText);
    const livenessWarnings = summarizeLivenessWarnings(logText);

    // Each probe is lazy: its value is read immediately before its own assertion runs.
    const parserProbes = [
      [() => embeddedRuns.eventCount, 2, "embedded trace count"],
      [() => embeddedRuns.startupCount, 1, "embedded startup count"],
      [() => embeddedRuns.prepCount, 1, "embedded prep count"],
      [() => embeddedRuns.stageTotals["runtime-plugins"]?.totalDurationMs, 7325, "runtime plugin stage duration"],
      [() => embeddedRuns.stageTotals["core-plugin-tools"]?.maxDurationMs, 4688, "core plugin tools max"],
      [() => embeddedRuns.topStages[0]?.name, "runtime-plugins", "embedded top stage"],
      [() => livenessWarnings.count, 1, "liveness warning count"],
      [() => livenessWarnings.maxEventLoopDelayMaxMs, 9982.4, "liveness event loop max"]
    ];
    for (const [read, expected, label] of parserProbes) {
      assertEqual(read(), expected, label);
    }

    const startedAtEpochMs = 1000;
    const finishedAtEpochMs = 63000;
    const durationMs = 62000;
    const turnBreakdown = buildAgentTurnBreakdown({
      result: {
        command: "node support/run-gateway-session-send-turn.mjs",
        startedAtEpochMs,
        finishedAtEpochMs,
        durationMs
      },
      attribution: {
        commandStartedAtEpochMs: startedAtEpochMs,
        commandFinishedAtEpochMs: finishedAtEpochMs,
        totalTurnMs: durationMs,
        firstProviderRequestAtEpochMs: 52000,
        lastProviderResponseAtEpochMs: 52800,
        preProviderMs: 51000,
        providerFinalMs: 800,
        postProviderMs: 10200
      },
      timelineSummary: null,
      logSummary: { embeddedRuns }
    });
    assertEqual(
      turnBreakdown.sourceLogs.categories.runtimePlugins.totalDurationMs,
      7325,
      "embedded log source category"
    );
    const keepsAttemptDispatch = turnBreakdown.sourceLogs.unmappedStages.some(
      (stage) => stage.name === "attempt-dispatch"
    );
    assertEqual(keepsAttemptDispatch, true, "unmapped embedded stages preserved");
    const breakdownMarkdown = summarizeAgentTurnBreakdownForMarkdown(turnBreakdown);
    assertEqual(
      breakdownMarkdown.includes("embedded:attempt-dispatch"),
      true,
      "breakdown markdown includes raw unmapped stage evidence"
    );

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for warm runtime-dependency reuse evaluation.
 *
 * Evaluates two records built by `runtimeDepsRecord` against a scenario that
 * allows zero warm restages:
 *  - a clean record whose warm log equals the cold log, asserted to PASS with
 *    zero warm restages;
 *  - a restaged record whose warm log additionally contains a second browser
 *    staging/install pair, asserted to FAIL with one restage of 6100 ms and a
 *    `warmRuntimeDepsRestageCount` violation that also appears in the paste
 *    summary.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   A PASS result when every assertion holds; otherwise a FAIL result whose
 *   `message` is the thrown error's message.
 */
function runtimeDepsWarmReuseEvaluationCheck() {
  const checkId = "runtime-deps-warm-reuse-evaluation";
  const checkCommand = "evaluate synthetic warm runtime dependency reuse";

  try {
    const coldLog = [
      "21:22:15 [plugins] browser staging bundled runtime deps (6 specs): @modelcontextprotocol/sdk@1.29.0",
      "21:22:19 [plugins] browser installed bundled runtime deps in 3964ms: @modelcontextprotocol/sdk@1.29.0",
      "21:22:19 [plugins] memory-core staging bundled runtime deps (2 specs): chokidar@^5.0.0",
      "21:22:20 [plugins] memory-core installed bundled runtime deps in 1529ms: chokidar@^5.0.0"
    ].join("\n");
    const scenario = {
      id: "bundled-runtime-deps",
      thresholds: {
        warmRuntimeDepsRestageCount: 0,
        warmRuntimeDepsStagingMs: 5000
      }
    };
    const surface = {
      id: "bundled-runtime-deps",
      thresholds: {}
    };
    // Both records are evaluated against the same scenario and surface objects.
    const evaluate = (record) => evaluateRecord(record, scenario, { surface, targetPlan: { kind: "npm" } });

    const cleanRecord = runtimeDepsRecord({ coldLog, warmLog: coldLog });
    evaluate(cleanRecord);
    assertEqual(cleanRecord.status, "PASS", "warm reuse clean record status");
    assertEqual(cleanRecord.measurements.coldRuntimeDepsInstallCount, 2, "cold install count");
    assertEqual(cleanRecord.measurements.warmRuntimeDepsRestageCount, 0, "warm restage count");
    assertEqual(cleanRecord.measurements.runtimeDepsWarmReuseOk, true, "warm reuse ok");

    const restagedWarmLog = [
      coldLog,
      "21:23:02 [plugins] browser staging bundled runtime deps (6 specs): @modelcontextprotocol/sdk@1.29.0",
      "21:23:08 [plugins] browser installed bundled runtime deps in 6100ms: @modelcontextprotocol/sdk@1.29.0"
    ].join("\n");
    const restagedRecord = runtimeDepsRecord({ coldLog, warmLog: restagedWarmLog });
    evaluate(restagedRecord);
    assertEqual(restagedRecord.status, "FAIL", "warm restage record status");
    assertEqual(restagedRecord.measurements.warmRuntimeDepsRestageCount, 1, "warm restage failure count");
    assertEqual(restagedRecord.measurements.warmRuntimeDepsStagingMs, 6100, "warm restage failure duration");
    const restageFlagged = restagedRecord.violations.some(
      (entry) => entry.metric === "warmRuntimeDepsRestageCount"
    );
    assertEqual(restageFlagged, true, "warm restage count violation");

    const pasteSummary = renderPasteSummary({
      runId: "self-check-runtime-deps",
      target: "runtime:stable",
      mode: "self-check",
      records: [restagedRecord]
    });
    assertEqual(
      pasteSummary.includes("warmRuntimeDepsRestageCount: 1"),
      true,
      "brief evidence includes warm runtime deps restage"
    );

    return { id: checkId, status: "PASS", command: checkCommand, durationMs: 0 };
  } catch (error) {
    return { id: checkId, status: "FAIL", command: checkCommand, durationMs: 0, message: error.message };
  }
}

/**
 * Builds the synthetic "bundled-runtime-deps" record used by the warm-reuse
 * self-check: one log-tail result per phase ("cold-start", "warm-restart"),
 * each reporting a running gateway with zeroed log metrics.
 *
 * @param {{coldLog: string, warmLog: string}} logs Raw log text placed in the
 *   stdout of the cold-start and warm-restart results respectively.
 * @returns {object} A record with status "PASS", two phases and final metrics.
 */
function runtimeDepsRecord({ coldLog, warmLog }) {
  const logTailCommand = "ocm logs kova-runtime-deps --tail 300 --raw";

  // Fresh objects on every call so phases and final metrics never share state.
  const runningGatewayMetrics = () => ({
    service: { gatewayState: "running" },
    logs: zeroLogMetrics()
  });

  const logPhase = (id, stdout) => ({
    id,
    results: [{ command: logTailCommand, status: 0, stdout, stderr: "", durationMs: 100 }],
    metrics: runningGatewayMetrics()
  });

  const phases = [
    logPhase("cold-start", coldLog),
    logPhase("warm-restart", warmLog)
  ];

  return {
    scenario: "bundled-runtime-deps",
    status: "PASS",
    phases,
    finalMetrics: runningGatewayMetrics()
  };
}

/**
 * Self-check for `kova cleanup artifacts`.
 *
 * Creates a scratch KOVA_HOME under `tmp` holding one back-dated `kova-…`
 * artifact directory and one unrelated directory, runs the cleanup command as
 * a dry run and then with `--execute`, and verifies that only the stale kova
 * directory is listed and removed.
 *
 * Every failure — a non-zero exit, unparsable JSON output, a failed assertion
 * or a filesystem error while preparing the fixture — is reported as a FAIL
 * record instead of being thrown, in line with the other checks in this file.
 *
 * @param {string} tmp Scratch directory in which the fixture home is created.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   PASS with the combined duration of both commands, or FAIL with a message.
 */
async function cleanupArtifactsCheck(tmp) {
  const id = "cleanup-artifacts";
  const passCommand = "node bin/kova.mjs cleanup artifacts --older-than-days 1 --execute --json";
  // Tracked outside the try so the catch-all FAIL record can report what ran so far.
  let lastCommand = passCommand;
  let durationMs = 0;

  // FAIL record for a command that exited non-zero; prefers stderr over stdout.
  const commandFailure = (run) => ({
    id,
    status: "FAIL",
    command: run.command,
    durationMs: run.durationMs,
    message: run.stderr.trim() || run.stdout.trim()
  });

  try {
    const home = join(tmp, "artifact-cleanup-home");
    const staleDir = join(home, "artifacts", "kova-2000-01-01t000000z");
    const keepDir = join(home, "artifacts", "not-a-kova-run");
    await mkdir(staleDir, { recursive: true });
    await mkdir(keepDir, { recursive: true });
    await writeFile(join(staleDir, "sample.txt"), "stale artifact\n", "utf8");
    // Back-date the directory after populating it; creating the file would
    // otherwise bump the directory's modification time.
    const oldDate = new Date("2000-01-01T00:00:00.000Z");
    await utimes(staleDir, oldDate, oldDate);

    const runCleanup = (flags) => runCommand(
      `KOVA_HOME=${quoteShell(home)} node bin/kova.mjs cleanup artifacts --older-than-days 1 ${flags}`,
      { timeoutMs: 30000, maxOutputChars: 1000000 }
    );

    const dryRun = await runCleanup("--json");
    if (dryRun.status !== 0) {
      return commandFailure(dryRun);
    }
    lastCommand = dryRun.command;
    durationMs += dryRun.durationMs;
    const dryRunJson = JSON.parse(dryRun.stdout);
    assertEqual(dryRunJson.schemaVersion, "kova.cleanup.artifacts.v1", "cleanup artifacts schema");
    assertEqual(dryRunJson.execute, false, "cleanup artifacts dry-run");
    assertEqual(dryRunJson.candidates.length, 1, "cleanup artifacts candidate count");
    assertEqual(dryRunJson.candidates[0].name, "kova-2000-01-01t000000z", "cleanup artifacts candidate name");

    const execute = await runCleanup("--execute --json");
    if (execute.status !== 0) {
      return commandFailure(execute);
    }
    lastCommand = execute.command;
    durationMs += execute.durationMs;
    const executeJson = JSON.parse(execute.stdout);
    assertEqual(executeJson.execute, true, "cleanup artifacts execute");
    assertEqual(executeJson.results.length, 1, "cleanup artifacts result count");

    // Only ENOENT proves removal; any other stat error leaves the outcome unknown,
    // so the directory is treated as still present.
    let staleStillExists = true;
    try {
      await stat(staleDir);
    } catch (error) {
      staleStillExists = error.code !== "ENOENT";
    }
    assertEqual(staleStillExists, false, "stale artifact directory removed");
    assertEqual((await stat(keepDir)).isDirectory(), true, "non-kova artifact directory retained");

    return {
      id,
      status: "PASS",
      command: passCommand,
      durationMs
    };
  } catch (error) {
    return {
      id,
      status: "FAIL",
      command: lastCommand,
      durationMs,
      message: error.message
    };
  }
}

/**
 * Self-check for `kova inventory plan --json`.
 *
 * Writes a fixture under `tmp`: an executable shell stub standing in for the
 * `openclaw` binary (it prints canned help for `--help`, `dashboard`,
 * `plugins` and `unknownx`, and exits 2 for anything else) plus a small repo
 * with a package.json, a plugin manifest and an extension manifest. The
 * inventory command is then run against that fixture through
 * `jsonCommandCheck`, with `cli:unknownx` marked as required-modeled, and the
 * JSON output is validated by the callback below.
 *
 * @param {string} tmp Scratch directory the fixture is written into.
 * @returns {Promise<*>} Whatever `jsonCommandCheck` returns for this check.
 */
async function inventoryPlanCheck(tmp) {
  const binDir = join(tmp, "inventory-bin");
  const repoDir = join(tmp, "inventory-openclaw");
  const pluginDir = join(repoDir, "plugins", "bundled");
  const extensionDir = join(repoDir, "extensions", "dashboard");
  const openclawBin = join(binDir, "openclaw");

  const fakeOpenclawScript = `#!/bin/sh
case "$1" in
  --help)
    cat <<'HELP'
Usage: openclaw <command>

Commands:
  Hint: commands suffixed with * have subcommands.
  dashboard  Start dashboard
  plugins *  Manage plugins
  unknownx   Experimental command
HELP
    ;;
  dashboard)
    echo "OpenClaw dashboard help"
    ;;
  plugins)
    echo "OpenClaw plugins help"
    ;;
  unknownx)
    echo "OpenClaw unknownx help"
    ;;
  *)
    echo "unexpected args: $*" >&2
    exit 2
    ;;
esac
`;

  // Pretty-printed JSON with a trailing newline, as every fixture file uses.
  const writeJsonFile = (path, value) => writeFile(path, `${JSON.stringify(value, null, 2)}\n`, "utf8");

  for (const dir of [binDir, pluginDir, extensionDir]) {
    await mkdir(dir, { recursive: true });
  }

  await writeFile(openclawBin, fakeOpenclawScript, "utf8");
  await chmod(openclawBin, 0o755);

  await writeJsonFile(join(repoDir, "package.json"), {
    name: "openclaw",
    scripts: {
      "audit:internal": "node scripts/internal-audit.mjs",
      build: "pnpm build",
      "release:check": "node scripts/release-check.mjs"
    }
  });
  await writeJsonFile(join(pluginDir, "plugin.json"), {
    name: "plugins",
    description: "Bundled plugin manifest",
    openclawPlugin: true
  });
  await writeJsonFile(join(extensionDir, "manifest.json"), {
    name: "dashboard",
    description: "Dashboard extension",
    openclawExtension: true
  });

  const command = [
    "node bin/kova.mjs inventory plan",
    "--openclaw-bin",
    quoteShell(openclawBin),
    "--openclaw-repo",
    quoteShell(repoDir),
    "--require-modeled cli:unknownx",
    "--json"
  ].join(" ");

  const validatePlan = (data) => {
    const sourceById = (id) => data.sources?.find((source) => source.id === id);
    const anyCapability = (predicate) => data.capabilities?.some(predicate);
    const hasCapabilityId = (id) => anyCapability((capability) => capability.id === id);
    const hasCapabilityKind = (kind) => anyCapability((capability) => capability.kind === kind);
    const mentionsUnknownx = (entries) => (entries ?? []).some((entry) => entry.capability === "cli:unknownx");

    assertEqual(data.schemaVersion, "kova.inventory.plan.v1", "inventory schema");
    assertEqual(sourceById("openclaw-help")?.status, "scanned", "inventory help source");
    assertEqual(sourceById("package-scripts")?.status, "scanned", "inventory package source");
    assertEqual(sourceById("manifests")?.status, "scanned", "inventory manifests source");
    assertEqual(sourceById("package-scripts")?.includedScriptCount, 1, "inventory product script filter");
    assertEqual(
      anyCapability((capability) => capability.id === "cli:dashboard" && capability.matchedSurfaceIds?.includes("dashboard")),
      true,
      "dashboard command mapped"
    );
    // The "Hint:" line in the canned help must not be mistaken for a command.
    assertEqual(hasCapabilityId("cli:Hint"), false, "help parser ignores help prose");
    assertEqual(
      anyCapability((capability) => capability.id === "cli:unknownx" && capability.matchStatus === "unmodeled"),
      true,
      "unknown command warning"
    );
    assertEqual(hasCapabilityId("script:release:check"), true, "product package scripts discovered");
    assertEqual(hasCapabilityId("script:build"), false, "internal package scripts filtered");
    assertEqual(hasCapabilityKind("plugin-manifest"), true, "plugin manifest discovered");
    assertEqual(hasCapabilityKind("extension-manifest"), true, "extension manifest discovered");
    assertEqual(mentionsUnknownx(data.coverage?.warnings), true, "unmodeled warning emitted");
    assertEqual(data.coverage?.ok, false, "required unmodeled capability blocks inventory coverage");
    assertEqual(mentionsUnknownx(data.coverage?.blockers), true, "required unmodeled blocker emitted");
  };

  return jsonCommandCheck("inventory-plan-json", command, validatePlan);
}

/**
 * Self-check: a readiness phase whose classification is already "slow-startup"
 * (healthy at 47100ms against a 30000ms threshold) must make `evaluateRecord`
 * fail the record and emit a `readiness.classification` violation.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS when every assertion holds, otherwise FAIL with the first error message.
 */
function readinessClassificationCheck() {
  const id = "readiness-classification";
  const command = "evaluate synthetic slow readiness record";
  const logCounterNames = [
    "missingDependencyErrors",
    "pluginLoadFailures",
    "metadataScanMentions",
    "configNormalizationMentions",
    "gatewayRestartMentions",
    "providerLoadMentions",
    "modelCatalogMentions",
    "providerTimeoutMentions",
    "eventLoopDelayMentions",
    "v8DiagnosticMentions"
  ];
  // A new object per use, so the phase metrics and final metrics stay independent.
  const zeroedLogCounters = () => Object.fromEntries(logCounterNames.map((name) => [name, 0]));

  try {
    const slowReadiness = {
      deadlineMs: 90000,
      thresholdMs: 30000,
      ready: true,
      listeningReady: true,
      listeningReadyAtMs: 47000,
      healthReadyAtMs: 47100,
      classification: {
        state: "slow-startup",
        severity: "fail",
        reason: "gateway became healthy after 47100ms, beyond the 30000ms threshold"
      }
    };
    const provisionPhase = {
      id: "provision",
      healthScope: "readiness",
      results: [],
      metrics: { readiness: slowReadiness, logs: zeroedLogCounters() }
    };
    const record = {
      status: "PASS",
      phases: [provisionPhase],
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroedLogCounters()
      }
    };

    evaluateRecord(record, { thresholds: { gatewayReadyMs: 30000 } });

    assertEqual(record.status, "FAIL", "slow readiness status");
    assertEqual(record.measurements.health.readiness.classification, "slow-startup", "readiness classification");
    const hasReadinessViolation = record.violations.some(
      (violation) => violation.metric === "readiness.classification"
    );
    assertEqual(hasReadinessViolation, true, "readiness violation");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for scoped health evaluation.
 *
 * Feeds `evaluateRecord` a record with a healthy "readiness" phase and a
 * "post-ready" phase whose health p95 (1500ms) exceeds the scenario's
 * `postReadyHealthP95Ms` threshold (1000ms). The record must fail with a
 * post-ready violation and must not report a `readinessHealthReadyMs`
 * violation.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS when every assertion holds, otherwise FAIL with the first error message.
 */
function healthReadinessModelCheck() {
  const id = "health-readiness-model";
  const command = "evaluate synthetic scoped health record";

  const okSample = (durationMs) => ({ ok: true, durationMs });
  // Summary of exactly one successful sample: every percentile equals that sample.
  const loneOkSummary = (ms) => ({
    count: 1,
    okCount: 1,
    failureCount: 0,
    minMs: ms,
    p50Ms: ms,
    p95Ms: ms,
    maxMs: ms
  });

  try {
    const coldStartPhase = {
      id: "cold-start",
      healthScope: "readiness",
      results: [],
      metrics: {
        readiness: {
          deadlineMs: 90000,
          thresholdMs: 30000,
          ready: true,
          listeningReady: true,
          listeningReadyAtMs: 120,
          healthReadyAtMs: 200,
          attempts: 2,
          classification: {
            state: "ready",
            severity: "pass",
            reason: "gateway became healthy within the readiness threshold"
          },
          healthAttempts: [{ ok: false, durationMs: 25 }, okSample(30)]
        },
        healthSamples: [okSample(40)],
        healthSummary: loneOkSummary(40)
      }
    };
    const apiLatencyPhase = {
      id: "api-latency",
      healthScope: "post-ready",
      results: [],
      metrics: {
        healthSamples: [okSample(10), okSample(1500)],
        healthSummary: {
          count: 2,
          okCount: 2,
          failureCount: 0,
          minMs: 10,
          p50Ms: 10,
          p95Ms: 1500,
          maxMs: 1500
        }
      }
    };
    const record = {
      status: "PASS",
      phases: [coldStartPhase, apiLatencyPhase],
      finalMetrics: {
        service: { gatewayState: "running" },
        healthSamples: [okSample(50)],
        healthSummary: loneOkSummary(50),
        health: okSample(50)
      }
    };
    // The scenario declares the same phase ids and health scopes as the record.
    const scenario = {
      phases: record.phases.map((phase) => ({ id: phase.id, healthScope: phase.healthScope })),
      thresholds: {
        gatewayReadyMs: 30000,
        postReadyHealthP95Ms: 1000
      }
    };

    evaluateRecord(record, scenario);

    const violates = (metric) => record.violations.some((violation) => violation.metric === metric);
    assertEqual(record.status, "FAIL", "post-ready health threshold fails");
    assertEqual(record.measurements.health.schemaVersion, "kova.health.v1", "health schema");
    assertEqual(record.measurements.health.readiness.healthReadyAtMs, 200, "readiness health ready captured");
    assertEqual(record.measurements.health.startupSamples.p95Ms, 30, "startup health p95 derived from readiness attempts");
    assertEqual(record.measurements.health.postReadySamples.p95Ms, 1500, "post-ready health p95 derived from post-ready samples");
    assertEqual(record.measurements.health.slowestSample.scope, "post-ready", "slowest health scope");
    assertEqual(violates("postReadyHealthP95Ms"), true, "post-ready health violation");
    assertEqual(violates("readinessHealthReadyMs"), false, "post-ready liveness does not masquerade as readiness");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check: health failures recorded while the gateway was still starting
 * (readiness scope) must not count against agent failure containment.
 *
 * The synthetic record has a "gateway-start" phase with two failed and one
 * successful health attempt, followed by a post-ready agent turn with a single
 * healthy sample, no process leaks and one successful provider request. With
 * thresholds of zero containment health failures and zero agent process leaks,
 * the record must stay PASS while the startup failures remain visible in the
 * measurements.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS when every assertion holds, otherwise FAIL with the first error message.
 */
function agentContainmentHealthScopeCheck() {
  const id = "agent-containment-health-scope";
  const command = "evaluate agent containment scoped health failures";

  // Pairs an ISO timestamp with its epoch-millisecond value.
  const stamp = (iso) => ({ iso, epochMs: Date.parse(iso) });
  // Summary of exactly one successful sample: every percentile equals that sample.
  const loneOkSummary = (ms) => ({
    count: 1,
    okCount: 1,
    failureCount: 0,
    minMs: ms,
    p50Ms: ms,
    p95Ms: ms,
    maxMs: ms
  });

  try {
    const turnStarted = stamp("2026-05-06T10:00:01.000Z");
    const turnFinished = stamp("2026-05-06T10:00:01.400Z");
    const providerReceived = stamp("2026-05-06T10:00:01.100Z");
    const providerResponded = stamp("2026-05-06T10:00:01.200Z");

    const gatewayStartPhase = {
      id: "gateway-start",
      results: [],
      metrics: {
        logs: zeroLogMetrics(),
        readiness: {
          listeningReadyAtMs: 100,
          healthReadyAtMs: 300,
          thresholdMs: 30000,
          deadlineMs: 90000,
          attempts: 3,
          classification: {
            state: "ready",
            severity: "pass",
            reason: "synthetic startup recovered"
          },
          healthAttempts: [
            { ok: false, durationMs: 0 },
            { ok: false, durationMs: 1 },
            { ok: true, durationMs: 10 }
          ]
        },
        healthSummary: {
          count: 3,
          okCount: 1,
          failureCount: 2,
          minMs: 0,
          p50Ms: 1,
          p95Ms: 10,
          maxMs: 10
        }
      }
    };

    const agentTurnResult = {
      command: "ocm @kova -- agent --local --agent main --session-id kova --message hi --json",
      status: 0,
      timedOut: false,
      startedAt: turnStarted.iso,
      startedAtEpochMs: turnStarted.epochMs,
      finishedAt: turnFinished.iso,
      finishedAtEpochMs: turnFinished.epochMs,
      durationMs: 400,
      stdout: JSON.stringify({ finalAssistantVisibleText: "KOVA_AGENT_OK" }),
      stderr: "",
      processSnapshots: {
        leaks: {
          schemaVersion: "kova.processLeakSummary.v1",
          leakCount: 0,
          leakedProcesses: [],
          leaksByRole: {}
        }
      }
    };
    const agentTurnPhase = {
      id: "cold-gateway-session-turn",
      results: [agentTurnResult],
      metrics: {
        logs: zeroLogMetrics(),
        health: { ok: true, durationMs: 2 },
        healthSummary: loneOkSummary(2)
      }
    };

    const providerRequest = {
      requestId: "provider",
      receivedAt: providerReceived.iso,
      receivedAtEpochMs: providerReceived.epochMs,
      respondedAt: providerResponded.iso,
      respondedAtEpochMs: providerResponded.epochMs,
      firstByteLatencyMs: 5,
      firstChunkLatencyMs: 5,
      route: "/v1/responses",
      model: "gpt-5.5",
      status: 200,
      statusClass: "2xx"
    };

    const record = {
      scenario: "gateway-session-send-turn",
      status: "PASS",
      auth: { mode: "mock", source: "mock", providerId: "openai" },
      phases: [gatewayStartPhase, agentTurnPhase],
      providerEvidence: {
        available: true,
        requestCount: 1,
        requests: [providerRequest]
      },
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics(),
        health: { ok: true, durationMs: 1 },
        healthSummary: loneOkSummary(1)
      }
    };

    const scenario = {
      id: "gateway-session-send-turn",
      phases: [
        { id: "gateway-start", healthScope: "readiness" },
        { id: "cold-gateway-session-turn", healthScope: "post-ready" }
      ],
      agent: { expectedText: "KOVA_AGENT_OK" },
      thresholds: {
        agentContainmentHealthFailures: 0,
        agentProcessLeaks: 0
      }
    };
    const evaluationContext = { surface: { thresholds: {} }, targetPlan: { kind: "runtime" } };

    evaluateRecord(record, scenario, evaluationContext);

    assertEqual(record.status, "PASS", "startup health failures should not fail post-agent containment");
    assertEqual(record.measurements.health.startupSamples.failureCount, 2, "startup failures retained");
    assertEqual(record.measurements.health.postReadySamples.failureCount, 0, "post-ready failures absent");
    assertEqual(record.measurements.agentFailureContainment.healthFailures, 0, "containment excludes startup failures");
    assertEqual(record.measurements.agentFailureContainment.healthFailureBreakdown.startup, 2, "containment reports startup failures separately");
    assertEqual(record.measurements.agentFailureContainment.gatewayHealthy, true, "gateway containment healthy");
    // A passing record may carry no violations array at all, hence the fallback.
    const flaggedUnhealthyGateway = (record.violations ?? []).some(
      (violation) => violation.metric === "agentGatewayHealthy"
    );
    assertEqual(flaggedUnhealthyGateway, false, "startup readiness failures do not create agentGatewayHealthy violation");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check: running a short-lived node process with resource sampling
 * enabled must yield a `kova.resourceSamples.v1` summary that attributes
 * usage to the "command-tree" and "uncategorized" roles, ranks roles by RSS,
 * and reports an artifact path.
 *
 * @param {string} tmp Scratch directory that receives the sample artifact file.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   PASS or FAIL, carrying the duration reported by the sampled command.
 */
async function resourceRoleAttributionCheck(tmp) {
  const id = "resource-role-attribution";
  const command = "node -e 'setTimeout(() => {}, 650)'";
  const artifactPath = join(tmp, "resource-role-attribution.jsonl");
  const processRoles = await loadProcessRoles();
  const result = await runCommand(command, {
    timeoutMs: 5000,
    resourceSample: { intervalMs: 250, processRoles, artifactPath }
  });

  try {
    assertEqual(result.status, 0, "resource attribution command status");
    const samples = result.resourceSamples;
    const hasRole = (role) => Boolean(samples?.byRole?.[role]);
    assertEqual(samples?.schemaVersion, "kova.resourceSamples.v1", "resource schema");
    assertEqual(hasRole("command-tree"), true, "command-tree role");
    assertEqual(hasRole("uncategorized"), true, "uncategorized role");
    assertArrayNotEmpty(samples?.topRolesByRss, "top roles by RSS");
    assertString(samples?.artifactPath, "resource artifact path");
    return { id, status: "PASS", command, durationMs: result.durationMs };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: result.durationMs, message: error.message };
  }
}

/**
 * Self-check: a role implied by the root command (here "mcp-runtime", via the
 * mcp-bridge smoke command) must be applied to the command-tree process that
 * runs that command, and must not be applied to a gateway process that merely
 * shares the same root command context.
 *
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   PASS when both classifications match, otherwise FAIL with the error message.
 */
async function resourceRootCommandRoleBoundaryCheck() {
  const id = "resource-root-command-role-boundary";
  const command = "classify synthetic gateway and command-tree roles";
  const rootCommand = "node support/mcp-bridge-smoke.mjs --env kova-mcp-runtime-start-stop";

  try {
    const processRoles = await loadProcessRoles();
    const rolesFor = (processCommand, existingRoles) => classifyRegistryRolesForProcess(
      { command: processCommand },
      { processRoles, rootCommand, existingRoles }
    );

    const gatewayRoles = rolesFor("openclaw-gateway", ["gateway", "gateway-tree"]);
    const commandRoles = rolesFor(rootCommand, ["command-tree"]);

    assertEqual(gatewayRoles.includes("mcp-runtime"), false, "root command role must not tag gateway process");
    assertEqual(commandRoles.includes("mcp-runtime"), true, "root command role tags command tree process");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check against role "pollution": incidental substrings in a command
 * line (a marker argument, an environment name, a fixture helper's file name)
 * must not assign unrelated roles, while genuine matches must still be
 * classified. Also verifies that a command-tree process tagged
 * "gateway-session-client" is counted towards command-tree RSS and not
 * gateway RSS in the resource summary.
 *
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   PASS when every expectation holds, otherwise FAIL with the first error message.
 */
async function resourceRolePollutionCheck() {
  const id = "resource-role-pollution-boundary";
  const command = "classify synthetic helper commands for role pollution";

  try {
    const processRoles = await loadProcessRoles();
    // Every probe is classified as an existing command-tree member.
    const classifyCommandTree = (processCommand, rootCommand) => classifyRegistryRolesForProcess(
      { command: processCommand },
      { processRoles, rootCommand, existingRoles: ["command-tree"] }
    );

    const mockProviderCommand = "node /tmp/kova-browser-automation-smoke/mock-openai-server.mjs --marker KOVA_AGENT_OK";
    const mockProviderRoles = classifyCommandTree(`/bin/zsh -lc ${mockProviderCommand}`, mockProviderCommand);

    const envNameCommand = "ocm env exec kova-mcp-runtime-start-stop -- node support/configure-openclaw-mock-auth.mjs";
    const envNameRoles = classifyCommandTree(envNameCommand, envNameCommand);

    const openclawAgentRoles = classifyCommandTree("openclaw-agent", "ocm @kova -- agent --local --message hi");

    const sampledProcess = (pid, rssMb, cpuPercent, roles, processCommand) => ({
      pid,
      rssMb,
      cpuPercent,
      roles,
      role: roles.join(","),
      command: processCommand
    });
    const resourceSummary = summarizeResourceSamples([{
      timestamp: "2026-05-07T00:00:00.000Z",
      elapsedMs: 1000,
      processes: [
        sampledProcess(100, 700, 100, ["gateway", "gateway-tree"], "openclaw"),
        sampledProcess(101, 60, 1, ["command-tree", "gateway-session-client"], "node support/run-gateway-session-send-turn.mjs")
      ]
    }]);

    // [classified roles, role to look for, expected presence, assertion label]
    const roleExpectations = [
      [mockProviderRoles, "mock-provider", true, "mock provider helper remains classified"],
      [mockProviderRoles, "agent-cli", false, "KOVA_AGENT_OK marker must not imply agent-cli"],
      [mockProviderRoles, "agent-process", false, "KOVA_AGENT_OK marker must not imply agent-process"],
      [mockProviderRoles, "browser-sidecar", false, "browser env name must not imply browser-sidecar"],
      [envNameRoles, "runtime-management", false, "mcp-runtime env name must not imply runtime-management"],
      [envNameRoles, "model-cli", false, "configure-openclaw fixture helper must not imply model-cli"],
      [openclawAgentRoles, "agent-cli", true, "openclaw-agent process must imply agent-cli"],
      [openclawAgentRoles, "agent-process", true, "openclaw-agent process must imply agent-process"]
    ];
    for (const [roles, role, expected, label] of roleExpectations) {
      assertEqual(roles.includes(role), expected, label);
    }
    assertEqual(resourceSummary.peakGatewayRssMb, 700, "gateway-session-client role must not inflate gateway RSS");
    assertEqual(resourceSummary.peakCommandTreeRssMb, 60, "gateway-session-client remains command-tree RSS");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check of the gateway-session-send-turn surface definition.
 *
 * Reads `surfaces/gateway-session-send-turn.json` (relative to the current
 * working directory) and verifies that its `diagnostics.expectedSpans` list
 * contains none of the stale agent-era span names and does contain the
 * gateway chat-send, auto-reply and reply spans.
 *
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   PASS when the contract holds; FAIL (including read or parse errors) otherwise.
 */
async function gatewaySessionSurfaceContractCheck() {
  const id = "gateway-session-surface-contract";
  const command = "validate gateway session surface diagnostics contract";
  const forbiddenSpans = ["agent.turn", "agent.prepare", "models.catalog", "provider.request", "agent.cleanup"];
  const requiredSpans = [
    ["gateway.chat_send", "gateway session surface requires gateway chat send spans"],
    ["auto_reply", "gateway session surface requires auto reply spans"],
    ["reply", "gateway session surface requires reply spans"]
  ];

  try {
    const rawSurface = await readFile("surfaces/gateway-session-send-turn.json", "utf8");
    const surface = JSON.parse(rawSurface);
    // A surface without diagnostics is treated as expecting no spans at all.
    const expectedSpans = surface.diagnostics?.expectedSpans ?? [];

    forbiddenSpans.forEach((span) => {
      assertEqual(expectedSpans.includes(span), false, `gateway session surface must not require stale ${span} span`);
    });
    requiredSpans.forEach(([span, label]) => {
      assertEqual(expectedSpans.includes(span), true, label);
    });

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check of role-aware process snapshots and leak diffing.
 *
 * Starts a short-lived node child, captures a process snapshot while it is
 * still running and another after it has finished, diffs the two for a fixed
 * set of roles, and writes the resulting leak summary to
 * `process-snapshot-leaks.json` under `tmp`. It then verifies the snapshot and
 * leak-summary schemas and checks how browser and agent processes are
 * classified with and without env/root-command scoping.
 *
 * @param {string} tmp Scratch directory that receives the leak summary artifact.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 *   PASS or FAIL, carrying the duration reported for the child command.
 */
async function processSnapshotCheck(tmp) {
  const id = "process-snapshot-leak-contract";
  const command = "capture and diff role-aware process snapshots";
  const envName = "kova-self-check";
  const rootCommand = "ocm @kova-self-check -- agent --local --session-id kova-agent-self-check --message hi";
  const chromeBinary = "/Applications/Google Chrome.app/Contents/MacOS/Google Chrome";

  const processRoles = await loadProcessRoles();
  // A fresh context object per call, scoped to the self-check env and root command.
  const scopedContext = () => ({ processRoles, envName, rootCommand });

  const pendingChild = runCommand("node -e 'setTimeout(() => {}, 1200)'", {
    timeoutMs: 5000,
    resourceSample: null
  });
  // Short pause before the first snapshot; the child is not awaited until afterwards.
  await sleep(250);
  const before = captureProcessSnapshot(scopedContext());
  const result = await pendingChild;
  const after = captureProcessSnapshot(scopedContext());

  const leaks = diffProcessSnapshots(before, after, {
    roles: ["agent-cli", "agent-process", "mcp-runtime", "plugin-cli", "mock-provider", "browser-sidecar"]
  });
  await writeFile(join(tmp, "process-snapshot-leaks.json"), `${JSON.stringify(leaks, null, 2)}\n`, "utf8");

  try {
    const rolesFor = (processCommand, context) => classifySnapshotRolesForProcess({ command: processCommand }, context);

    const unrelatedBrowserRoles = rolesFor(`${chromeBinary} --type=renderer`, scopedContext());
    const scopedBrowserRoles = rolesFor(`${chromeBinary} --user-data-dir=/tmp/kova-self-check/browser`, scopedContext());
    // Same renderer command as the unrelated case, but already known to be in the gateway tree.
    const gatewayBrowserRoles = rolesFor(`${chromeBinary} --type=renderer`, {
      processRoles,
      existingRoles: ["gateway-tree"],
      envName
    });
    const scopedAgentRoles = rolesFor("openclaw-agent --session-id kova-agent-self-check", scopedContext());

    assertEqual(result.status, 0, "snapshot command status");
    assertEqual(before.schemaVersion, "kova.processSnapshot.v1", "snapshot schema");
    assertEqual(leaks.schemaVersion, "kova.processLeakSummary.v1", "leak summary schema");
    assertEqual(typeof leaks.leakCount, "number", "leak count type");
    assertEqual(unrelatedBrowserRoles.includes("browser-sidecar"), false, "unrelated browser process excluded from snapshot role");
    assertEqual(scopedBrowserRoles.includes("browser-sidecar"), true, "scoped browser process retained");
    assertEqual(gatewayBrowserRoles.includes("browser-sidecar"), true, "gateway child browser process retained");
    assertEqual(scopedAgentRoles.includes("agent-cli"), true, "scoped agent process retained");

    return { id, status: "PASS", command, durationMs: result.durationMs };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: result.durationMs, message: error.message };
  }
}

/**
 * Self-check of per-role resource thresholds.
 *
 * Evaluates a synthetic record whose gateway role peaks at 250 MB RSS and 80%
 * CPU against surface role thresholds of 100 MB and 50%. The record must fail
 * and report one violation for each exceeded role metric.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS when every assertion holds, otherwise FAIL with the first error message.
 */
function roleThresholdEvaluationCheck() {
  const id = "resource-role-thresholds";
  const command = "evaluate synthetic role resource thresholds";

  try {
    const gatewayPeaks = { peakRssMb: 250, maxCpuPercent: 80 };
    // The gateway is the only role present, so it tops both rankings.
    const gatewayRanking = () => [{ role: "gateway", ...gatewayPeaks }];

    const resourceSamples = {
      schemaVersion: "kova.resourceSamples.v1",
      sampleCount: 1,
      peakTotalRssMb: gatewayPeaks.peakRssMb,
      maxTotalCpuPercent: gatewayPeaks.maxCpuPercent,
      byRole: {
        gateway: {
          ...gatewayPeaks,
          peakRssAtMs: 10,
          peakCpuAtMs: 10,
          peakProcessCount: 1
        }
      },
      topRolesByRss: gatewayRanking(),
      topRolesByCpu: gatewayRanking(),
      topByRss: [],
      topByCpu: []
    };
    const samplePhase = {
      id: "sample",
      results: [{ command: "synthetic", status: 0, durationMs: 1, resourceSamples }],
      metrics: { logs: zeroLogMetrics() }
    };
    const record = {
      scenario: "synthetic-role-threshold",
      title: "Synthetic Role Threshold",
      status: "PASS",
      phases: [samplePhase],
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics()
      }
    };
    const surface = {
      thresholds: {},
      roleThresholds: {
        gateway: { peakRssMb: 100, maxCpuPercent: 50 }
      }
    };

    evaluateRecord(record, { thresholds: {} }, { surface });

    assertEqual(record.status, "FAIL", "role threshold status");
    assertEqual(record.measurements.resourceByRole.gateway.peakRssMb, 250, "gateway role RSS measurement");
    const expectedViolations = [
      ["resourceByRole.gateway.peakRssMb", "role RSS violation"],
      ["resourceByRole.gateway.maxCpuPercent", "role CPU violation"]
    ];
    for (const [metric, label] of expectedViolations) {
      assertEqual(record.violations.some((violation) => violation.metric === metric), true, label);
    }

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for profile-level threshold calibration.
 *
 * Evaluates a synthetic record (one `ocm start` result lasting 150 ms with a
 * gateway role peaking at 250 MB RSS) against a surface whose own
 * `coldReadyMs` threshold is 1000, while the "release" profile calibrates
 * that surface to 100 and the gateway role to 200 MB RSS. The check passes
 * when `evaluateRecord` marks the record FAIL, exposes the calibrated values
 * on `record.thresholdPolicy`, and reports a violation for each metric.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS/FAIL self-check record; `message` is only present on failure.
 */
function thresholdPolicyCalibrationCheck() {
  const id = "threshold-policy-calibration";
  const command = "evaluate synthetic profile threshold calibration";
  try {
    // Resource samples attributed entirely to a single gateway process.
    const gatewaySamples = {
      schemaVersion: "kova.resourceSamples.v1",
      sampleCount: 1,
      peakTotalRssMb: 250,
      maxTotalCpuPercent: 80,
      byRole: {
        gateway: {
          peakRssMb: 250,
          maxCpuPercent: 80,
          peakRssAtMs: 10,
          peakCpuAtMs: 10,
          peakProcessCount: 1
        }
      },
      topRolesByRss: [{ role: "gateway", peakRssMb: 250, maxCpuPercent: 80 }],
      topRolesByCpu: [{ role: "gateway", peakRssMb: 250, maxCpuPercent: 80 }],
      topByRss: [],
      topByCpu: []
    };
    const samplePhase = {
      id: "sample",
      results: [{
        command: "ocm start kova-threshold-test",
        status: 0,
        durationMs: 150,
        resourceSamples: gatewaySamples
      }],
      metrics: { logs: zeroLogMetrics() }
    };
    const record = {
      scenario: "synthetic-threshold-policy",
      title: "Synthetic Threshold Policy",
      status: "PASS",
      phases: [samplePhase],
      finalMetrics: {
        service: { gatewayState: "running" },
        logs: zeroLogMetrics()
      }
    };
    const scenario = {
      id: "synthetic-threshold-policy",
      thresholds: {}
    };
    // The profile calibration is stricter than the surface's own thresholds.
    const releaseProfile = {
      id: "release",
      calibration: {
        roles: {
          gateway: { peakRssMb: 200 }
        },
        surfaces: {
          "release-runtime-startup": {
            thresholds: { coldReadyMs: 100 }
          }
        }
      }
    };
    const startupSurface = {
      id: "release-runtime-startup",
      thresholds: { coldReadyMs: 1000 },
      roleThresholds: {}
    };

    evaluateRecord(record, scenario, { profile: releaseProfile, surface: startupSurface });

    const policy = record.thresholdPolicy;
    const violatesMetric = (metric) =>
      record.violations.some((violation) => violation.metric === metric);

    assertEqual(record.status, "FAIL", "profile calibration threshold should fail record");
    assertEqual(policy?.profileId, "release", "threshold policy profile id");
    assertEqual(policy?.thresholds?.coldReadyMs, 100, "profile surface threshold override");
    assertEqual(policy?.roleThresholds?.gateway?.peakRssMb, 200, "profile role threshold");
    assertEqual(violatesMetric("coldReadyMs"), true, "profile calibrated duration violation");
    assertEqual(
      violatesMetric("resourceByRole.gateway.peakRssMb"),
      true,
      "profile calibrated role violation"
    );
    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for the cleanup retry contract.
 *
 * Runs a shell command through `runCleanupCommand` that keeps a counter in
 * `<tmp>/cleanup-retry-count`: the first invocation exits 1 after printing
 * "gateway still shutting down", later invocations print "destroyed" and
 * exit 0. The check passes when the final status is 0 and exactly two
 * attempts were recorded (first failed, second succeeded).
 *
 * @param {string} tmp - Directory in which the attempt counter file is kept.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 */
async function cleanupRetryCheck(tmp) {
  const counterPath = join(tmp, "cleanup-retry-count");
  // Inline Node script: bump the counter file, fail on the first run only.
  const script = [
    'const fs=require("fs");',
    `const p=${JSON.stringify(counterPath)};`,
    'const n=Number(fs.existsSync(p)?fs.readFileSync(p,"utf8"):0)+1;',
    'fs.writeFileSync(p,String(n));',
    'if(n<2){console.error("gateway still shutting down"); process.exit(1)}',
    'console.log("destroyed")'
  ].join(" ");
  const command = `node -e '${script}'`;
  const result = await runCleanupCommand(command, {
    timeoutMs: 30000,
    retryDelaysMs: [0, 0, 0]
  });

  const outcome = (status, extra = {}) => ({
    id: "cleanup-retry-contract",
    status,
    command: "evaluate retryable cleanup command",
    durationMs: result.durationMs,
    ...extra
  });

  try {
    const attempts = result.attempts;
    assertEqual(result.status, 0, "cleanup retry final status");
    assertEqual(attempts?.length, 2, "cleanup retry attempts");
    assertEqual(attempts?.[0]?.status, 1, "first cleanup attempt failed");
    assertEqual(attempts?.[1]?.status, 0, "second cleanup attempt passed");
    return outcome("PASS");
  } catch (error) {
    return outcome("FAIL", { message: error.message });
  }
}

/**
 * Self-check for the Markdown report's failure presentation.
 *
 * Renders a synthetic one-record FAIL report with `renderMarkdownReport` and
 * asserts that the output contains the findings section, the scenario id,
 * the violation message, the likely owner, the resource roles section, and
 * the formatted gateway role summary.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS/FAIL self-check record; `message` is only present on failure.
 */
function markdownFailureCardsCheck() {
  const id = "markdown-failure-cards";
  const command = "render synthetic failure Markdown";
  try {
    const failedStart = {
      command: "ocm start kova-self-check --runtime stable --json",
      status: 1,
      timedOut: false,
      durationMs: 45000,
      stdout: "",
      stderr: "gateway did not become healthy"
    };
    const failingRecord = {
      scenario: "gateway-performance",
      title: "Gateway Performance",
      status: "FAIL",
      target: "runtime:stable",
      envName: "kova-self-check",
      likelyOwner: "gateway-runtime",
      objective: "Synthetic failure card check",
      phases: [{
        id: "start",
        title: "Start",
        intent: "Start gateway",
        commands: ["ocm start kova-self-check --runtime stable --json"],
        evidence: [],
        results: [failedStart]
      }],
      measurements: {
        health: syntheticHealthMeasurement({ healthReadyAtMs: 45000 }),
        peakRssMb: 1100,
        resourceTopRolesByRss: [{ role: "gateway", peakRssMb: 1100, maxCpuPercent: 220 }]
      },
      violations: [{ message: "gateway readiness exceeded threshold" }]
    };
    const rendered = renderMarkdownReport({
      generatedAt: "2026-05-01T00:00:00.000Z",
      runId: "self-check-failure-cards",
      mode: "execution",
      target: "runtime:stable",
      platform: { os: "test", release: "test", arch: "test", node: "test" },
      summary: { total: 1, statuses: { FAIL: 1 } },
      records: [failingRecord]
    });

    // Each entry: substring that must appear in the Markdown, assertion label.
    const expectations = [
      ["## Findings", "markdown findings section"],
      ["gateway-performance", "finding scenario"],
      ["gateway readiness exceeded threshold", "finding summary"],
      ["gateway-runtime", "finding owner"],
      ["## Resource Roles", "markdown resource roles section"],
      ["gateway: RSS 1100 MB; CPU 220%", "markdown resource role summary"]
    ];
    for (const [needle, label] of expectations) {
      assertEqual(rendered.includes(needle), true, label);
    }
    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for the "recommended next scenario" section of report summaries.
 *
 * Feeds a synthetic failing agent record (target path containing a space)
 * through `renderReportSummary` in structured and plain form and through
 * `renderPasteSummary`, asserting the recommended scenario/state ids, the
 * exact shell-quoted rerun command, and the presence of the recommendation
 * text and reason in the plain and paste output.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS/FAIL self-check record; `message` is only present on failure.
 */
function reportRecommendedNextScenarioCheck() {
  const id = "report-recommended-next-scenario";
  const command = "render synthetic recommended next scenario";
  try {
    // The space in the path is what forces quoting in the expected command.
    const target = "local-build:/tmp/OpenClaw Test";
    const failingRecord = {
      scenario: "agent-cold-warm-message",
      title: "Agent Cold Warm Message",
      status: "FAIL",
      target,
      envName: "kova-self-check",
      state: { id: "mock-openai-provider", title: "Mock OpenAI Provider" },
      likelyOwner: "agent-runtime",
      objective: "Synthetic recommended next scenario check",
      phases: [{
        id: "agent-turn",
        title: "Agent Turn",
        intent: "Send a cold message",
        commands: ["ocm @kova-self-check -- agent --local --message hi --json"],
        evidence: [],
        results: []
      }],
      measurements: {
        coldAgentTurnMs: 62000,
        agentPreProviderMs: 61300
      },
      violations: [{ message: "cold pre-provider latency was 61300ms" }]
    };
    const report = {
      generatedAt: "2026-05-01T00:00:00.000Z",
      runId: "self-check-recommended-next",
      mode: "execution",
      target,
      platform: { os: "test", release: "test", arch: "test", node: "test" },
      summary: { total: 1, statuses: { FAIL: 1 } },
      records: [failingRecord]
    };

    const { recommendedNextScenario: recommended } = renderReportSummary(report, { structured: true });
    assertEqual(recommended?.scenario, "agent-cold-warm-message", "recommended scenario id");
    assertEqual(recommended?.state, "mock-openai-provider", "recommended state id");
    assertEqual(
      recommended?.command,
      "node bin/kova.mjs run --target 'local-build:/tmp/OpenClaw Test' --scenario agent-cold-warm-message --state mock-openai-provider --execute --profile-on-failure --retain-on-failure --json",
      "recommended command"
    );

    const plain = renderReportSummary(report);
    assertEqual(plain.includes("Recommended next scenario:"), true, "plain summary recommended section");

    const paste = renderPasteSummary(report);
    const pasteHas = (needle) => paste.includes(needle);
    assertEqual(pasteHas("Recommended next scenario"), true, "paste summary recommended section");
    assertEqual(pasteHas("cold pre-provider latency was 61300ms"), true, "paste summary recommended reason");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check that the registry validators reject malformed fixtures.
 *
 * Each case hands a deliberately invalid state, profile, or registry bundle
 * to `validateStateShape`, `validateProfileShape`, or
 * `validateRegistryReferences` and requires the thrown error message to
 * match every listed pattern. A validator that does not throw, or throws a
 * message missing one of the patterns, fails the check.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS/FAIL self-check record; `message` is only present on failure.
 */
function stateRegistryValidationCheck() {
  const id = "state-registry-validation";
  const command = "evaluate synthetic invalid state contracts";
  try {
    // True only when `attempt` throws and the message matches all patterns.
    const rejectsWith = (attempt, patterns) => {
      try {
        attempt();
      } catch (error) {
        return patterns.every((pattern) => pattern.test(error.message));
      }
      return false;
    };

    const rejectedTrait = rejectsWith(() => validateStateShape({
      id: "bad-state",
      title: "Bad State",
      objective: "Invalid state fixture",
      tags: [],
      traits: ["not-a-real-trait"],
      riskArea: "test",
      ownerArea: "test",
      setupEvidence: ["evidence"],
      cleanupGuarantees: ["cleanup"],
      setup: []
    }, "bad-state.json"), [/unknown trait/]);
    assertEqual(rejectedTrait, true, "unknown state trait rejected");

    const rejectedEvidence = rejectsWith(() => validateStateShape({
      id: "bad-evidence-state",
      title: "Bad Evidence State",
      objective: "Invalid state fixture evidence",
      tags: [],
      traits: ["fresh-user"],
      riskArea: "test",
      ownerArea: "test",
      setupEvidence: [],
      cleanupGuarantees: [],
      setup: []
    }, "bad-evidence-state.json"), [
      /setupEvidence must not be empty/,
      /cleanupGuarantees must not be empty/
    ]);
    assertEqual(rejectedEvidence, true, "empty state evidence rejected");

    const rejectedSurface = rejectsWith(() => validateRegistryReferences({
      scenarios: [{
        id: "scenario",
        surface: "known-surface",
        proves: ["baseline"],
        states: [],
        targetKinds: [],
        processRoles: []
      }],
      states: [{
        id: "state",
        traits: ["fresh-user"],
        incompatibleSurfaces: ["missing-surface"]
      }],
      profiles: [],
      surfaces: [{
        id: "known-surface",
        processRoles: [],
        requirements: [{
          id: "baseline",
          states: ["state"],
          targetKinds: ["runtime"],
          metrics: []
        }]
      }],
      processRoles: []
    }), [/incompatibleSurfaces references unknown surface/]);
    assertEqual(rejectedSurface, true, "unknown incompatible surface rejected");

    const rejectedPurpose = rejectsWith(() => validateProfileShape({
      id: "profile",
      title: "Bad Profile",
      objective: "Invalid purpose.",
      entries: [{ scenario: "scenario", state: "state" }],
      purpose: "made-up-purpose"
    }, "bad-profile.json"), [/unknown purpose/]);
    assertEqual(rejectedPurpose, true, "unknown profile purpose rejected");

    const rejectedDerivedCoverage = rejectsWith(() => validateProfileShape({
      id: "profile",
      title: "Bad Profile Coverage",
      objective: "Invalid derived profile coverage.",
      entries: [{ scenario: "scenario", state: "state" }],
      gate: {
        coverage: {
          surfaces: {
            blocking: ["surface"]
          }
        }
      }
    }, "bad-profile-coverage.json"), [/coverage\.surfaces is derived/]);
    assertEqual(rejectedDerivedCoverage, true, "derived profile coverage rejected");

    const rejectedRequirement = rejectsWith(() => validateRegistryReferences({
      scenarios: [{
        id: "scenario",
        surface: "known-surface",
        proves: ["missing-requirement"],
        states: [],
        targetKinds: [],
        processRoles: []
      }],
      states: [{
        id: "state",
        traits: ["fresh-user"]
      }],
      profiles: [],
      surfaces: [{
        id: "known-surface",
        processRoles: [],
        thresholds: { knownMetric: 1 },
        requirements: [{
          id: "baseline",
          states: ["missing-state"],
          stateTraits: ["not-a-trait"],
          targetKinds: ["unsupported-target"],
          metrics: ["madeUpMetric"]
        }]
      }],
      processRoles: [],
      metrics: [{ id: "knownMetric" }]
    }), [
      /proves unknown surface requirement/,
      /references unknown state 'missing-state'/,
      /references unknown state trait 'not-a-trait'/,
      /unsupported-target/,
      /unknown metric 'madeUpMetric'/
    ]);
    assertEqual(rejectedRequirement, true, "invalid surface requirement and scenario proof rejected");

    const rejectedMetric = rejectsWith(() => validateRegistryReferences({
      scenarios: [{
        id: "scenario",
        surface: "known-surface",
        proves: ["baseline"],
        thresholds: { madeUpMetric: 1 },
        states: [],
        targetKinds: [],
        processRoles: []
      }],
      states: [],
      profiles: [],
      surfaces: [{
        id: "known-surface",
        processRoles: [],
        thresholds: { knownMetric: 1 },
        requirements: [{
          id: "baseline",
          states: ["state"],
          targetKinds: ["runtime"],
          metrics: ["knownMetric"]
        }]
      }],
      processRoles: [],
      metrics: [{ id: "knownMetric" }]
    }), [/unknown metric 'madeUpMetric'/]);
    assertEqual(rejectedMetric, true, "unknown scenario metric rejected");

    const rejectedCalibration = rejectsWith(() => validateRegistryReferences({
      scenarios: [],
      states: [],
      profiles: [{
        id: "profile",
        entries: [],
        calibration: {
          roles: {
            missingRole: { peakRssMb: 100 }
          },
          surfaces: {
            missingSurface: {
              thresholds: { peakRssMb: 100 }
            },
            knownSurface: {
              thresholds: { madeUpMetric: 1 },
              roleThresholds: {
                knownRole: { peakRssMb: 100 }
              }
            }
          }
        }
      }],
      surfaces: [{
        id: "knownSurface",
        processRoles: [],
        requirements: [{
          id: "baseline",
          states: ["state"],
          targetKinds: ["runtime"],
          metrics: []
        }]
      }],
      processRoles: [{ id: "knownRole" }],
      metrics: [{ id: "peakRssMb" }]
    }), [
      /calibration\.roles references unknown process role/,
      /calibration\.surfaces references unknown surface/,
      /unknown metric 'madeUpMetric'/
    ]);
    assertEqual(rejectedCalibration, true, "invalid profile calibration rejected");

    const rejectedPlatform = rejectsWith(() => validateRegistryReferences({
      scenarios: [],
      states: [],
      profiles: [{
        id: "profile",
        entries: [],
        gate: {
          coverage: {
            platforms: {
              blocking: ["macos-arm"]
            }
          }
        }
      }],
      surfaces: [],
      processRoles: [],
      metrics: []
    }), [/unknown platform coverage key 'macos-arm'/]);
    assertEqual(rejectedPlatform, true, "unknown platform coverage key rejected");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check for the clone-first rule on scenarios that reference
 * `{sourceEnv}`.
 *
 * Two invalid scenarios must be rejected by `validateScenarioShape`: one
 * that uses `{sourceEnv}` without cloning, and one that references it again
 * after the clone command. A third scenario that clones first and then only
 * touches `{env}` must validate without throwing.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS/FAIL self-check record; `message` is only present on failure.
 */
function scenarioCloneFirstValidationCheck() {
  const id = "scenario-clone-first-validation";
  const command = "validate source-env scenario contracts";
  try {
    // All fixtures share surface/tags/proves/thresholds; only these vary.
    const existingUserScenario = (scenarioId, title, objective, phases) => ({
      id: scenarioId,
      surface: "upgrade-existing-user",
      title,
      objective,
      tags: ["upgrade"],
      proves: ["baseline"],
      thresholds: {},
      phases
    });
    // True only when validation throws with a message matching `pattern`.
    const rejectedWith = (scenario, file, pattern) => {
      try {
        validateScenarioShape(scenario, file);
      } catch (error) {
        return pattern.test(error.message);
      }
      return false;
    };

    const missingClone = existingUserScenario(
      "bad-existing-user",
      "Bad Existing User",
      "Touches source env without clone-first protection.",
      [{
        id: "status",
        title: "Status",
        intent: "Unsafe durable source access.",
        healthScope: "post-ready",
        commands: ["ocm service status {sourceEnv} --json"],
        evidence: ["status"]
      }]
    );
    assertEqual(
      rejectedWith(missingClone, "bad-existing-user.json", /must start by cloning/),
      true,
      "source env scenario without clone-first rejected"
    );

    const secondSourceUse = existingUserScenario(
      "bad-existing-user-second-source",
      "Bad Existing User Second Source",
      "References source env after clone.",
      [{
        id: "clone",
        title: "Clone",
        intent: "Clone source.",
        healthScope: "none",
        commands: ["ocm env clone {sourceEnv} {env} --json", "ocm logs {sourceEnv} --tail 20"],
        evidence: ["clone"]
      }]
    );
    assertEqual(
      rejectedWith(
        secondSourceUse,
        "bad-existing-user-second-source.json",
        /may reference it only in the first clone command/
      ),
      true,
      "second source env reference rejected"
    );

    // Positive case: must not throw.
    const cloneThenUpgrade = existingUserScenario(
      "good-existing-user",
      "Good Existing User",
      "Clone first, then operate only on the disposable env.",
      [{
        id: "clone",
        title: "Clone",
        intent: "Clone source.",
        healthScope: "none",
        commands: ["ocm env clone {sourceEnv} {env} --json"],
        evidence: ["clone"]
      }, {
        id: "upgrade",
        title: "Upgrade",
        intent: "Upgrade disposable clone.",
        healthScope: "readiness",
        commands: ["ocm upgrade {env} --channel beta --json"],
        evidence: ["upgrade"]
      }]
    );
    validateScenarioShape(cloneThenUpgrade, "good-existing-user.json");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check that scenario phases must declare a valid `healthScope`.
 *
 * `validateScenarioShape` must reject a phase with no `healthScope` key and
 * a phase whose `healthScope` is "startup", each with the expected error
 * message.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS/FAIL self-check record; `message` is only present on failure.
 */
function scenarioHealthScopeValidationCheck() {
  const id = "scenario-health-scope-validation";
  const command = "validate scenario health scope contracts";
  try {
    // Fresh-install scenario wrapping a single phase under test.
    const freshInstallScenario = (scenarioId, title, objective, phase) => ({
      id: scenarioId,
      surface: "fresh-install",
      title,
      objective,
      tags: ["fresh-user"],
      proves: ["baseline"],
      thresholds: {},
      phases: [phase]
    });
    // True only when validation throws with a message matching `pattern`.
    const rejectedWith = (scenario, file, pattern) => {
      try {
        validateScenarioShape(scenario, file);
      } catch (error) {
        return pattern.test(error.message);
      }
      return false;
    };

    const withoutScope = freshInstallScenario(
      "missing-health-scope",
      "Missing Health Scope",
      "Scenario phase without an explicit health scope.",
      {
        id: "start",
        title: "Start",
        intent: "Start gateway.",
        commands: ["ocm start {env} {startSelector} --json"],
        evidence: ["start"]
      }
    );
    assertEqual(
      rejectedWith(
        withoutScope,
        "missing-health-scope.json",
        /phases\[0\]\.healthScope must be a non-empty string/
      ),
      true,
      "missing healthScope rejected"
    );

    const withBadScope = freshInstallScenario(
      "invalid-health-scope",
      "Invalid Health Scope",
      "Scenario phase with an invalid health scope.",
      {
        id: "start",
        title: "Start",
        intent: "Start gateway.",
        healthScope: "startup",
        commands: ["ocm start {env} {startSelector} --json"],
        evidence: ["start"]
      }
    );
    assertEqual(
      rejectedWith(withBadScope, "invalid-health-scope.json", /healthScope must be one of/),
      true,
      "invalid healthScope rejected"
    );

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Self-check that a profile cannot pair a scenario with an incompatible
 * state.
 *
 * The synthetic registry has a profile entry combining the
 * "upgrade-existing-user" scenario with a "fresh" state that lists that
 * surface in `incompatibleSurfaces`. `validateRegistryReferences` must throw
 * with a message matching either accepted wording.
 *
 * @returns {{id: string, status: string, command: string, durationMs: number, message?: string}}
 *   PASS/FAIL self-check record; `message` is only present on failure.
 */
function scenarioStateCompatibilityCheck() {
  const id = "scenario-state-compatibility";
  const command = "evaluate synthetic invalid scenario/state pairing";
  try {
    const registry = {
      scenarios: [{
        id: "upgrade-existing-user",
        surface: "upgrade-existing-user",
        proves: ["baseline"],
        states: [],
        targetKinds: [],
        processRoles: []
      }],
      states: [{
        id: "fresh",
        traits: ["fresh-user"],
        incompatibleSurfaces: ["upgrade-existing-user"]
      }],
      profiles: [{
        id: "bad-profile",
        entries: [{ scenario: "upgrade-existing-user", state: "fresh" }]
      }],
      surfaces: [{
        id: "upgrade-existing-user",
        processRoles: [],
        requirements: [{
          id: "baseline",
          states: ["old-release-user"],
          targetKinds: ["runtime"],
          metrics: []
        }]
      }],
      processRoles: []
    };

    let rejected = false;
    try {
      validateRegistryReferences(registry);
    } catch (error) {
      // Either wording counts as a rejection of the pairing.
      const acceptedMessages = [
        /pairs scenario 'upgrade-existing-user' with state 'fresh'/,
        /explicitly incompatible surface/
      ];
      rejected = acceptedMessages.some((pattern) => pattern.test(error.message));
    }
    assertEqual(rejected, true, "invalid scenario/state profile pairing rejected");

    return { id, status: "PASS", command, durationMs: 0 };
  } catch (error) {
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Builds a log-metrics object in which every counter is zero.
 *
 * A new object is created on each call, so callers can mutate the result
 * without affecting other fixtures.
 *
 * @returns {Record<string, number>} Counter name to 0, in declaration order.
 */
function zeroLogMetrics() {
  const counterNames = [
    "missingDependencyErrors",
    "pluginLoadFailures",
    "metadataScanMentions",
    "configNormalizationMentions",
    "gatewayRestartMentions",
    "providerLoadMentions",
    "modelCatalogMentions",
    "providerTimeoutMentions",
    "eventLoopDelayMentions",
    "v8DiagnosticMentions"
  ];
  return Object.fromEntries(counterNames.map((name) => [name, 0]));
}

/**
 * Runs a shell command and reports it as a self-check result.
 *
 * The check passes when the command's status is 0. On failure the message is
 * the trimmed stderr, falling back to trimmed stdout, then to `exit <status>`.
 * On success the message is an empty string.
 *
 * @param {string} id - Identifier to report for this check.
 * @param {string} command - Command line handed to `runCommand`.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message: string}>}
 */
async function commandCheck(id, command) {
  const result = await runCommand(command, { timeoutMs: 30000 });
  const succeeded = result.status === 0;

  let message = "";
  if (!succeeded) {
    message = result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`;
  }

  return {
    id,
    status: succeeded ? "PASS" : "FAIL",
    command,
    durationMs: result.durationMs,
    message
  };
}

/**
 * Self-check for `kova setup` with env-only auth.
 *
 * Runs the setup command with `KOVA_HOME` pointing at
 * `<tmp>/credentials-home`, then verifies the JSON output's schema version
 * and auth method and that `credentials/live.env` under that home has
 * permission bits 0600.
 *
 * @param {string} tmp - Scratch directory that will contain the Kova home.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 */
async function credentialStoreSelfCheck(tmp) {
  const home = join(tmp, "credentials-home");
  const command = [
    `KOVA_HOME=${quoteShell(home)}`,
    "node bin/kova.mjs setup --non-interactive --auth env-only --provider openai --env-var OPENAI_API_KEY --json"
  ].join(" ");
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });

  const outcome = (status, extra = {}) => ({
    id: "credential-store",
    status,
    command,
    durationMs: result.durationMs,
    ...extra
  });

  try {
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const { schemaVersion, auth } = JSON.parse(result.stdout);
    assertEqual(schemaVersion, "kova.setup.v1", "setup schema");
    assertEqual(auth?.method, "env-only", "setup auth method");

    // Mask off the file-type bits so only the rwx permission bits remain.
    const liveEnvStats = await stat(join(home, "credentials", "live.env"));
    const permissionBits = liveEnvStats.mode & 0o777;
    if (permissionBits !== 0o600) {
      throw new Error(`live.env permissions expected 0600, got ${permissionBits.toString(8)}`);
    }
    return outcome("PASS");
  } catch (error) {
    return outcome("FAIL", { message: error.message });
  }
}

/**
 * Self-check that `kova setup` accepts numeric provider and auth choices.
 *
 * Runs setup with `--provider 2 --auth 3` and expects the JSON output to
 * report provider "anthropic", method "api-key", and env var
 * "ANTHROPIC_API_KEY".
 *
 * @param {string} tmp - Scratch directory that will contain the Kova home.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 */
async function interactiveSetupChoiceCheck(tmp) {
  const home = join(tmp, "numeric-auth-home");
  const command = [
    `KOVA_HOME=${quoteShell(home)}`,
    "node bin/kova.mjs setup --non-interactive --provider 2 --auth 3 --value kova-selfcheck-key --json"
  ].join(" ");
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });

  const outcome = (status, extra = {}) => ({
    id: "setup-provider-auth-numeric",
    status,
    command,
    durationMs: result.durationMs,
    ...extra
  });

  try {
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const { schemaVersion, auth } = JSON.parse(result.stdout);
    assertEqual(schemaVersion, "kova.setup.v1", "numeric setup schema");
    assertEqual(auth?.provider, "anthropic", "provider selected by number");
    assertEqual(auth?.method, "api-key", "auth method selected by number");
    assertEqual(auth?.envVar, "ANTHROPIC_API_KEY", "provider env var default");
    return outcome("PASS");
  } catch (error) {
    return outcome("FAIL", { message: error.message });
  }
}

/**
 * Self-check that `kova setup --auth external-cli` verifies a Codex CLI.
 *
 * Prepares a fake `HOME` containing `.codex/auth.json` and a fake `codex`
 * executable (a shell script that exits 0) placed first on `PATH`, runs
 * setup with those overrides plus a scratch `KOVA_HOME`, and asserts that the
 * JSON output reports provider "openai", method "external-cli", CLI "codex",
 * a verified flag, and a `credentials` check whose message mentions
 * "external-cli codex verified".
 *
 * @param {string} tmp - Scratch directory for the fake home, bin, and Kova home.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 */
async function externalCliSetupCheck(tmp) {
  const home = join(tmp, "external-cli-home");
  const fakeBin = join(tmp, "fake-bin");
  const kovaHome = join(tmp, "external-cli-kova-home");
  await mkdir(join(home, ".codex"), { recursive: true });
  await mkdir(fakeBin, { recursive: true });
  const fakeCodex = join(fakeBin, "codex");
  await writeFile(join(home, ".codex", "auth.json"), "{\"tokens\":{\"access_token\":\"redacted\"}}\n", "utf8");
  await writeFile(fakeCodex, "#!/bin/sh\nexit 0\n", "utf8");
  await chmod(fakeCodex, 0o755);

  const command = [
    `HOME=${quoteShell(home)}`,
    // Fake bin goes first so the stub `codex` wins over any real install.
    `PATH=${quoteShell(`${fakeBin}:${process.env.PATH ?? ""}`)}`,
    `KOVA_HOME=${quoteShell(kovaHome)}`,
    "node bin/kova.mjs setup --non-interactive --provider openai --auth external-cli --json"
  ].join(" ");
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
  try {
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const data = JSON.parse(result.stdout);
    assertEqual(data.schemaVersion, "kova.setup.v1", "external cli setup schema");
    assertEqual(data.auth?.provider, "openai", "external cli provider");
    assertEqual(data.auth?.method, "external-cli", "external cli method");
    assertEqual(data.auth?.externalCli, "codex", "external cli name");
    assertEqual(data.auth?.verification?.verified, true, "external cli verification");
    const credential = data.checks?.find((check) => check.id === "credentials");
    // Guard on the message type so a check without a string message produces
    // the descriptive error below rather than a TypeError from `.includes`.
    const credentialMessage = credential?.message;
    if (typeof credentialMessage !== "string" || !credentialMessage.includes("external-cli codex verified")) {
      throw new Error(`credential check did not report verified external CLI: ${credentialMessage ?? "missing"}`);
    }
    return {
      id: "setup-external-cli-verification",
      status: "PASS",
      command,
      durationMs: result.durationMs
    };
  } catch (error) {
    return {
      id: "setup-external-cli-verification",
      status: "FAIL",
      command,
      durationMs: result.durationMs,
      message: error.message
    };
  }
}

/**
 * Self-check for the OpenClaw config written for Codex external-CLI auth.
 *
 * Runs `support/configure-openclaw-live-auth.mjs` with `OPENCLAW_HOME` set to
 * a scratch directory, reads the resulting `.openclaw/openclaw.json`, and
 * asserts the default model, agent runtime id and fallback, and that the
 * codex plugin is enabled. The config must not contain provider overrides
 * for either `openai` or `codex`.
 *
 * @param {string} tmp - Scratch directory that will contain the OpenClaw home.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 */
async function externalCliOpenClawConfigCheck(tmp) {
  const home = join(tmp, "external-cli-config-home");
  const command = `OPENCLAW_HOME=${quoteShell(home)} node support/configure-openclaw-live-auth.mjs --provider openai --auth-method external-cli --external-cli codex`;
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });

  const outcome = (status, extra = {}) => ({
    id: "external-cli-openclaw-config",
    status,
    command,
    durationMs: result.durationMs,
    ...extra
  });

  try {
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const configText = await readFile(join(home, ".openclaw", "openclaw.json"), "utf8");
    const config = JSON.parse(configText);
    assertEqual(config.agents?.defaults?.model?.primary, "codex/gpt-5.5", "external cli model ref");
    assertEqual(config.agents?.defaults?.agentRuntime?.id, "codex", "external cli runtime id");
    assertEqual(config.agents?.defaults?.agentRuntime?.fallback, "none", "external cli runtime fallback");
    assertEqual(config.plugins?.entries?.codex?.enabled, true, "external cli codex plugin enabled");

    // Provider overrides that must be absent, with the error to raise if present.
    const forbiddenOverrides = [
      ["openai", "Codex external CLI config must not write an OpenAI provider override"],
      ["codex", "Codex external CLI config must use the bundled codex provider instead of writing a provider override"]
    ];
    for (const [providerId, complaint] of forbiddenOverrides) {
      if (config.models?.providers?.[providerId] !== undefined) {
        throw new Error(complaint);
      }
    }
    return outcome("PASS");
  } catch (error) {
    return outcome("FAIL", { message: error.message });
  }
}

/**
 * Self-check for the OpenClaw config written for Anthropic API-key auth.
 *
 * Runs `support/configure-openclaw-live-auth.mjs` for provider "anthropic"
 * with `--env-var ANTHROPIC_API_KEY`, then asserts that the written
 * `.openclaw/openclaw.json` references that env var as the provider API key
 * id and selects "anthropic/claude-sonnet-4-5" as the primary model.
 *
 * @param {string} tmp - Scratch directory that will contain the OpenClaw home.
 * @returns {Promise<{id: string, status: string, command: string, durationMs: number, message?: string}>}
 */
async function anthropicApiKeyOpenClawConfigCheck(tmp) {
  const home = join(tmp, "anthropic-api-key-config-home");
  const command = `OPENCLAW_HOME=${quoteShell(home)} node support/configure-openclaw-live-auth.mjs --provider anthropic --env-var ANTHROPIC_API_KEY`;
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });

  const outcome = (status, extra = {}) => ({
    id: "anthropic-api-key-openclaw-config",
    status,
    command,
    durationMs: result.durationMs,
    ...extra
  });

  try {
    if (result.status !== 0) {
      throw new Error(result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`);
    }
    const configText = await readFile(join(home, ".openclaw", "openclaw.json"), "utf8");
    const config = JSON.parse(configText);
    assertEqual(config.models?.providers?.anthropic?.apiKey?.id, "ANTHROPIC_API_KEY", "anthropic env ref");
    assertEqual(config.agents?.defaults?.model?.primary, "anthropic/claude-sonnet-4-5", "anthropic default model");
    return outcome("PASS");
  } catch (error) {
    return outcome("FAIL", { message: error.message });
  }
}

/**
 * Selfcheck: run the mock-auth configure script against a port file containing
 * `12345`, then inspect the `openclaw.json` found under the scratch home.
 *
 * @param {string} tmp - Scratch directory; the home path and port file live beneath it.
 * @returns {Promise<object>} Check result with `id`, `status`, `command`,
 *   `durationMs`, and `message` when the status is "FAIL".
 */
async function mockAuthOpenClawConfigCheck(tmp) {
  const home = join(tmp, "mock-auth-config-home");
  const portFile = join(tmp, "mock-auth-port");
  await writeFile(portFile, "12345\n", "utf8");
  const command = `OPENCLAW_HOME=${quoteShell(home)} node support/configure-openclaw-mock-auth.mjs --port-file ${quoteShell(portFile)}`;
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
  // Template for the result; the failure path reuses it with an overridden status.
  const passed = {
    id: "mock-auth-openclaw-config",
    status: "PASS",
    command,
    durationMs: result.durationMs
  };
  try {
    if (result.status !== 0) {
      const detail = result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`;
      throw new Error(detail);
    }
    const configPath = join(home, ".openclaw", "openclaw.json");
    const config = JSON.parse(await readFile(configPath, "utf8"));
    // [actual, expected, label] rows, asserted in order; the first mismatch wins.
    const expectations = [
      [config.models?.providers?.openai?.baseUrl, "http://127.0.0.1:12345/v1", "mock provider base URL"],
      [config.agents?.defaults?.model?.primary, "openai/gpt-5.5", "mock default model"],
      [config.gateway?.auth?.mode, "token", "mock gateway token mode"],
      [config.gateway?.auth?.token, "kova-mock-gateway-token", "mock gateway auth token"],
      [config.gateway?.remote?.token, "kova-mock-gateway-token", "mock gateway remote token"]
    ];
    for (const [actual, expected, label] of expectations) {
      assertEqual(actual, expected, label);
    }
    return passed;
  } catch (error) {
    return { ...passed, status: "FAIL", message: error.message };
  }
}

/**
 * Selfcheck: run the live-auth configure script for Anthropic in external-CLI
 * (`claude`) mode, then inspect the `openclaw.json` found under the scratch
 * home. The config must select the `claude-cli` runtime and must not contain
 * an Anthropic provider override.
 *
 * @param {string} tmp - Scratch directory; a dedicated home directory path is derived from it.
 * @returns {Promise<object>} Check result with `id`, `status`, `command`,
 *   `durationMs`, and `message` when the status is "FAIL".
 */
async function claudeCliOpenClawConfigCheck(tmp) {
  const home = join(tmp, "claude-cli-config-home");
  const command = `OPENCLAW_HOME=${quoteShell(home)} node support/configure-openclaw-live-auth.mjs --provider anthropic --auth-method external-cli --external-cli claude`;
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
  // Builds the result object; `extra` carries the failure message when present.
  const report = (status, extra) => ({
    id: "claude-cli-openclaw-config",
    status,
    command,
    durationMs: result.durationMs,
    ...extra
  });
  try {
    if (result.status !== 0) {
      const detail = result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`;
      throw new Error(detail);
    }
    const rawConfig = await readFile(join(home, ".openclaw", "openclaw.json"), "utf8");
    const config = JSON.parse(rawConfig);
    assertEqual(config.agents?.defaults?.model?.primary, "anthropic/claude-sonnet-4-5", "claude cli model ref");
    assertEqual(config.agents?.defaults?.agentRuntime?.id, "claude-cli", "claude cli runtime id");
    assertEqual(config.agents?.defaults?.agentRuntime?.fallback, "none", "claude cli runtime fallback");
    assertEqual(config.plugins?.entries?.anthropic?.enabled, true, "claude cli anthropic plugin enabled");
    const anthropicOverride = config.models?.providers?.anthropic;
    if (anthropicOverride !== undefined) {
      throw new Error("Claude CLI config must use the bundled Anthropic provider instead of writing a provider override");
    }
    return report("PASS");
  } catch (error) {
    return report("FAIL", { message: error.message });
  }
}

/**
 * Selfcheck: seed a Kova home whose stored credentials declare OpenAI auth via
 * the external `codex` CLI, run `kova run --auth live` with HOME pointed at a
 * scratch path, and expect a non-zero exit whose output contains
 * "external-cli codex is not usable".
 *
 * @param {string} tmp - Scratch directory; the HOME and KOVA_HOME paths are derived from it.
 * @returns {Promise<object>} Check result with `id`, `status`, `command`,
 *   `durationMs` and `message` (empty string on PASS).
 */
async function externalCliRunAuthVerificationCheck(tmp) {
  const home = join(tmp, "stale-external-cli-home");
  const kovaHome = join(tmp, "stale-external-cli-kova-home");
  const credentials = join(kovaHome, "credentials");
  await mkdir(credentials, { recursive: true });

  const providerStore = {
    schemaVersion: "kova.credentials.providers.v1",
    defaultProvider: "openai",
    providers: {
      openai: {
        id: "openai",
        method: "external-cli",
        envVars: [],
        externalCli: "codex",
        fallbackPolicy: "mock",
        configuredAt: new Date().toISOString()
      }
    }
  };
  await writeFile(join(credentials, "providers.json"), `${JSON.stringify(providerStore, null, 2)}\n`, "utf8");
  // Empty live.env, created with owner-only read/write mode.
  await writeFile(join(credentials, "live.env"), "", { encoding: "utf8", mode: 0o600 });

  const command = `HOME=${quoteShell(home)} KOVA_HOME=${quoteShell(kovaHome)} node bin/kova.mjs run --target runtime:stable --scenario fresh-install --auth live --json`;
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
  const output = `${result.stdout}\n${result.stderr}`;
  // The run must fail AND name the unusable CLI; either alone is not enough.
  const rejectedAsExpected = result.status !== 0 && output.includes("external-cli codex is not usable");

  let message = "";
  if (!rejectedAsExpected) {
    message = `expected stale external CLI failure, got status ${result.status}: ${output.trim()}`;
  }
  return {
    id: "run-external-cli-revalidates-auth",
    status: rejectedAsExpected ? "PASS" : "FAIL",
    command,
    durationMs: result.durationMs,
    message
  };
}

/**
 * Selfcheck for `runCommand` timeout handling: a short command run without an
 * explicit `timeoutMs` must complete normally, and `timeoutMs: 0` must be
 * rejected with a "timeoutMs must be a positive integer" error.
 *
 * @returns {Promise<object>} Check result with `id`, `status`, `command`,
 *   `durationMs`, and `message` when the status is "FAIL".
 */
async function commandTimeoutContractCheck() {
  const id = "command-timeout-contract";
  const command = "node -e 'setTimeout(() => console.log(\"default-timeout-ok\"), 20)'";

  // Resolves true only when runCommand throws the expected validation error.
  const rejectsZeroTimeout = async () => {
    try {
      await runCommand("node -e 'process.exit(0)'", { timeoutMs: 0 });
      return false;
    } catch (error) {
      return /timeoutMs must be a positive integer/.test(error.message);
    }
  };

  try {
    const result = await runCommand(command, { maxOutputChars: 100000 });
    assertEqual(result.status, 0, "default timeout command status");
    assertEqual(result.timedOut, false, "default timeout should not expire immediately");
    assertEqual(result.stdout.trim(), "default-timeout-ok", "default timeout command output");
    const invalidRejected = await rejectsZeroTimeout();
    assertEqual(invalidRejected, true, "invalid timeout rejected");
    return {
      id,
      status: "PASS",
      command: "evaluate runCommand timeout defaults",
      durationMs: result.durationMs
    };
  } catch (error) {
    // No duration is available here because `result` is scoped to the try block.
    return { id, status: "FAIL", command, durationMs: 0, message: error.message };
  }
}

/**
 * Run a command that is expected to fail, and pass only when it exits non-zero
 * and its combined stdout/stderr contains `expectedMessage`.
 *
 * @param {string} id - Identifier reported in the check result.
 * @param {string} command - Shell command to run.
 * @param {string} expectedMessage - Substring that must appear in the output.
 * @returns {Promise<object>} Check result with `id`, `status`, `command`,
 *   `durationMs` and `message` (empty string on PASS).
 */
async function failingCommandCheck(id, command, expectedMessage) {
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
  const output = `${result.stdout}\n${result.stderr}`;
  const failedAsExpected = result.status !== 0 && output.includes(expectedMessage);

  let message = "";
  if (!failedAsExpected) {
    message = `expected failure containing ${JSON.stringify(expectedMessage)}, got status ${result.status}: ${output.trim()}`;
  }
  return {
    id,
    status: failedAsExpected ? "PASS" : "FAIL",
    command,
    durationMs: result.durationMs,
    message
  };
}

/**
 * Run a command, parse its stdout as JSON and hand the parsed value to
 * `validate`. A non-zero exit, a parse failure or a throwing/rejecting
 * validator all produce a FAIL result.
 *
 * @param {string} id - Identifier reported in the check result.
 * @param {string} command - Shell command to run.
 * @param {Function} validate - Called with the parsed JSON; its result is awaited.
 * @returns {Promise<object>} Check result with `id`, `status`, `command`,
 *   `durationMs`, plus `data` on PASS or `message` on FAIL.
 */
async function jsonCommandCheck(id, command, validate) {
  const result = await runCommand(command, { timeoutMs: 30000, maxOutputChars: 1000000 });
  const report = (status, extra) => ({
    id,
    status,
    command,
    durationMs: result.durationMs,
    ...extra
  });

  if (result.status !== 0) {
    // Prefer stderr, then stdout, then the bare exit status as the failure detail.
    const detail = result.stderr.trim() || result.stdout.trim() || `exit ${result.status}`;
    return report("FAIL", { message: detail });
  }

  let data;
  try {
    data = JSON.parse(result.stdout);
    await validate(data);
  } catch (error) {
    return report("FAIL", { message: error.message });
  }
  return report("PASS", { data });
}

/**
 * Validate the shape of a generated dry-run JSON report: schema version, mode,
 * dry-run status count, repeat/group counts, absence of `resolvedCoverage`,
 * and the collector artifact directories on the first record.
 *
 * @param {object} report - Parsed report to inspect.
 * @returns {object} Check result with `id`, `status`, `command`, `durationMs`,
 *   and `message` when the status is "FAIL".
 */
function validateReport(report) {
  const outcome = (status, extra) => ({
    id: "dry-run-report-file",
    status,
    command: "read generated JSON report",
    durationMs: 0,
    ...extra
  });

  try {
    assertEqual(report.schemaVersion, "kova.report.v1", "report schema");
    assertEqual(report.mode, "dry-run", "report mode");
    assertEqual(report.summary?.statuses?.["DRY-RUN"], 2, "report dry-run count");
    const hasResolvedCoverage = Object.hasOwn(report, "resolvedCoverage");
    assertEqual(hasResolvedCoverage, false, "report does not include planner-only resolved coverage");
    assertEqual(report.performance?.repeat, 2, "report repeat count");
    assertEqual(report.performance?.groupCount, 1, "report performance group count");
    assertArrayNotEmpty(report.records, "report records");

    // Only the first record's artifact directories are inspected.
    const dirs = report.records[0]?.collectorArtifactDirs;
    assertEqual(dirs?.schemaVersion, "kova.collectorArtifactDirs.v1", "collector artifact dirs schema");
    const requiredDirs = [
      ["resourceSamples", "collector resource samples dir"],
      ["openclaw", "collector OpenClaw dir"],
      ["nodeProfiles", "collector node profiles dir"]
    ];
    for (const [key, label] of requiredDirs) {
      assertString(dirs?.[key], label);
    }
    return outcome("PASS");
  } catch (error) {
    return outcome("FAIL", { message: error.message });
  }
}

/**
 * Assert that two values are strictly (`===`) equal.
 *
 * @param {*} actual - Value produced by the code under check.
 * @param {*} expected - Value `actual` must be strictly equal to.
 * @param {string} label - Prefix that identifies the assertion in the error message.
 * @throws {Error} When `actual !== expected`; the message names the label and
 *   shows both values.
 */
function assertEqual(actual, expected, label) {
  if (actual === expected) {
    return;
  }
  // JSON.stringify throws on BigInt and circular structures. Fall back to
  // String() so the labeled assertion failure is not replaced by an unrelated
  // serialization TypeError.
  const render = (value) => {
    try {
      return JSON.stringify(value);
    } catch {
      return String(value);
    }
  };
  throw new Error(`${label} expected ${render(expected)}, got ${render(actual)}`);
}

/**
 * Assert that a value is a string with at least one character.
 *
 * @param {*} value - Value to check.
 * @param {string} label - Prefix that identifies the value in the error message.
 * @throws {Error} When `value` is not a string or is the empty string.
 */
function assertString(value, label) {
  const isNonEmptyString = typeof value === "string" && value.length > 0;
  if (isNonEmptyString) {
    return;
  }
  throw new Error(`${label} must be a non-empty string`);
}

/**
 * Return a promise that resolves (with no value) once a `setTimeout` of `ms`
 * milliseconds fires.
 *
 * @param {number} ms - Delay passed to `setTimeout`.
 * @returns {Promise<void>}
 */
function sleep(ms) {
  return new Promise((done) => {
    setTimeout(done, ms);
  });
}

/**
 * Assert that a value is an array (per `Array.isArray`).
 *
 * @param {*} value - Value to check.
 * @param {string} label - Prefix that identifies the value in the error message.
 * @throws {Error} When `value` is not an array.
 */
function assertArray(value, label) {
  if (Array.isArray(value)) {
    return;
  }
  throw new Error(`${label} must be an array`);
}

/**
 * Assert that a value is an array containing at least one element.
 *
 * @param {*} value - Value to check.
 * @param {string} label - Prefix that identifies the value in the error message.
 * @throws {Error} When `value` is not an array (raised by `assertArray`) or
 *   when the array has no elements.
 */
function assertArrayNotEmpty(value, label) {
  assertArray(value, label);
  if (value.length > 0) {
    return;
  }
  throw new Error(`${label} must not be empty`);
}