Files
openclaw/src/plugin-sdk/qa-runtime.test.ts
2026-05-29 05:21:23 +02:00

274 lines
8.3 KiB
TypeScript

import { Command } from "commander";
import { afterEach, beforeEach, describe, expect, it, vi } from "vitest";
import {
cleanupTempDirs,
expectPrivateQaLabRuntimeSurfaceLoad,
expectQaLabRuntimeSurfaceLoad,
restorePrivateQaCliEnv,
} from "./qa-runtime.test-helpers.js";
const loadBundledPluginPublicSurfaceModuleSync = vi.hoisted(() => vi.fn());
const resolveOpenClawPackageRootSync = vi.hoisted(() => vi.fn());
vi.mock("./facade-runtime.js", () => ({
loadBundledPluginPublicSurfaceModuleSync,
}));
vi.mock("../infra/openclaw-root.js", () => ({
resolveOpenClawPackageRootSync,
}));
describe("plugin-sdk qa-runtime", () => {
const tempDirs: string[] = [];
const originalPrivateQaCli = process.env.OPENCLAW_ENABLE_PRIVATE_QA_CLI;
beforeEach(() => {
loadBundledPluginPublicSurfaceModuleSync.mockReset();
resolveOpenClawPackageRootSync.mockReset().mockReturnValue(null);
delete process.env.OPENCLAW_ENABLE_PRIVATE_QA_CLI;
});
afterEach(() => {
cleanupTempDirs(tempDirs);
restorePrivateQaCliEnv(originalPrivateQaCli);
});
it("stays cold until the runtime seam is used", async () => {
const module = await import("./qa-runtime.js");
expect(loadBundledPluginPublicSurfaceModuleSync).not.toHaveBeenCalled();
expect(module.loadQaRuntimeModule).toBeTypeOf("function");
expect(module.isQaRuntimeAvailable).toBeTypeOf("function");
});
it("loads the qa-lab runtime public surface through the generic seam", async () => {
await expectQaLabRuntimeSurfaceLoad({
importRuntime: () => import("./qa-runtime.js"),
loadBundledPluginPublicSurfaceModuleSync,
});
});
it("uses the source bundled tree for qa-lab runtime loading in private qa mode", async () => {
await expectPrivateQaLabRuntimeSurfaceLoad({
tempDirs,
importRuntime: () => import("./qa-runtime.js"),
loadBundledPluginPublicSurfaceModuleSync,
resolveOpenClawPackageRootSync,
});
});
it("reports the runtime as unavailable when the qa-lab surface is missing", async () => {
loadBundledPluginPublicSurfaceModuleSync.mockImplementation(() => {
throw new Error("Unable to resolve bundled plugin public surface qa-lab/runtime-api.js");
});
const module = await import("./qa-runtime.js");
expect(module.isQaRuntimeAvailable()).toBe(false);
});
it("renders shared QA markdown reports with multiline details", async () => {
const module = await import("./qa-runtime.js");
const report = module.renderQaMarkdownReport({
title: "QA Report",
startedAt: new Date("2026-01-01T00:00:00.000Z"),
finishedAt: new Date("2026-01-01T00:00:02.000Z"),
checks: [{ name: "preflight", status: "pass" }],
scenarios: [
{
name: "transport reply",
status: "fail",
details: "line one\nline two",
steps: [{ name: "send", status: "pass", details: "ok" }],
},
],
timeline: ["sent request"],
notes: ["kept artifacts"],
});
expect(report).toContain("# QA Report");
expect(report).toContain("- Duration ms: 2000");
expect(report).toContain("- Passed: 1");
expect(report).toContain("- Failed: 1");
expect(report).toContain("```text\nline one\nline two\n```");
expect(report).toContain("- [x] send");
expect(report).toContain("## Timeline");
});
it("keeps shared live transport scenario coverage helpers ordered and strict", async () => {
const module = await import("./qa-runtime.js");
expect(module.LIVE_TRANSPORT_BASELINE_STANDARD_SCENARIO_IDS).toEqual([
"canary",
"mention-gating",
"allowlist-block",
"top-level-reply-shape",
"restart-resume",
]);
const definitions = [
{ id: "alpha", timeoutMs: 1_000, title: "alpha" },
{ id: "beta", timeoutMs: 1_000, title: "beta" },
] as const;
expect(
module.selectLiveTransportScenarios({
ids: ["beta"],
laneLabel: "Demo",
scenarios: definitions,
}),
).toEqual([definitions[1]]);
expect(() =>
module.selectLiveTransportScenarios({
ids: ["missing"],
laneLabel: "Demo",
scenarios: definitions,
}),
).toThrow("unknown Demo QA scenario id(s): missing");
const covered = module.collectLiveTransportStandardScenarioCoverage({
alwaysOnStandardScenarioIds: ["canary"],
scenarios: [
{ id: "scenario-1", standardId: "mention-gating", timeoutMs: 1_000, title: "mention" },
{
id: "scenario-2",
standardId: "mention-gating",
timeoutMs: 1_000,
title: "mention again",
},
{ id: "scenario-3", standardId: "restart-resume", timeoutMs: 1_000, title: "restart" },
],
});
expect(covered).toEqual(["canary", "mention-gating", "restart-resume"]);
expect(
module.findMissingLiveTransportStandardScenarios({
coveredStandardScenarioIds: covered,
expectedStandardScenarioIds: module.LIVE_TRANSPORT_BASELINE_STANDARD_SCENARIO_IDS,
}),
).toEqual(["allowlist-block", "top-level-reply-shape"]);
});
it("registers shared live transport QA CLI options", async () => {
const module = await import("./qa-runtime.js");
const run = vi.fn(async () => {});
const qa = new Command();
module
.createLiveTransportQaCliRegistration({
commandName: "telegram",
credentialOptions: {
sourceDescription: "Credential source for Telegram QA",
roleDescription: "Credential role for Telegram QA",
},
defaultProviderMode: "live-frontier",
description: "Run Telegram QA",
providerModeHelp: "Provider mode",
listScenariosHelp: "List Telegram scenarios",
outputDirHelp: "Telegram output directory",
profileHelp: "QA profile",
failFastHelp: "Stop after first failure",
allowFailuresHelp: "Allow failures",
scenarioHelp: "Run only the named scenario",
sutAccountHelp: "Temporary SUT account",
run,
})
.register(qa);
await qa.parseAsync([
"node",
"openclaw",
"telegram",
"--repo-root",
"/tmp/repo",
"--output-dir",
".artifacts/qa",
"--provider-mode",
"mock-openai",
"--model",
"primary",
"--alt-model",
"alternate",
"--scenario",
"alpha",
"--scenario",
" ",
"--scenario",
"beta",
"--fast",
"--allow-failures",
"--list-scenarios",
"--profile",
"fast",
"--fail-fast",
"--sut-account",
"sut-2",
"--credential-source",
"convex",
"--credential-role",
"maintainer",
]);
expect(run).toHaveBeenCalledWith({
repoRoot: "/tmp/repo",
outputDir: ".artifacts/qa",
providerMode: "mock-openai",
primaryModel: "primary",
alternateModel: "alternate",
fastMode: true,
allowFailures: true,
failFast: true,
profile: "fast",
scenarioIds: ["alpha", "beta"],
listScenarios: true,
sutAccountId: "sut-2",
credentialSource: "convex",
credentialRole: "maintainer",
});
});
it("builds shared live-lane artifact errors", async () => {
const module = await import("./qa-runtime.js");
expect(
module.buildQaLiveLaneArtifactsError({
heading: "Matrix QA failed.",
details: ["cleanup: ok"],
artifacts: {
report: "/tmp/report.md",
summary: "/tmp/summary.json",
},
}),
).toBe(
[
"Matrix QA failed.",
"cleanup: ok",
"Artifacts:",
"- report: /tmp/report.md",
"- summary: /tmp/summary.json",
].join("\n"),
);
});
it("shares Docker health parsing across array and jsonl compose output", async () => {
const module = await import("./qa-runtime.js");
const runtime = module.createQaDockerRuntime({ auditContext: "qa-test" });
const dockerPsOutputs = ['[{"Health":"starting"}]', '{"State":"running"}\n'];
const runCommand = vi.fn(async () => ({
stdout: dockerPsOutputs.shift() ?? '{"State":"running"}',
stderr: "",
}));
const sleepImpl = vi.fn(async () => {});
await runtime.waitForDockerServiceHealth(
"homeserver",
"/tmp/docker-compose.yml",
"/repo",
runCommand,
sleepImpl,
);
expect(runCommand).toHaveBeenCalledTimes(2);
expect(sleepImpl).toHaveBeenCalledTimes(1);
});
});