openclaw/extensions/qa-lab/src/model-switch-eval.test.ts

import { describe, expect, it } from "vitest";
import { hasModelSwitchContinuityEvidence } from "./model-switch-eval.js";

describe("qa model-switch evaluation", () => {
  it("accepts direct handoff replies that mention the kickoff task", () => {
    expect(
      hasModelSwitchContinuityEvidence(
        "Handoff confirmed: I reread QA_KICKOFF_TASK.md and switched to gpt.",
      ),
    ).toBe(true);
  });

  it("accepts short mission-oriented switch confirmations", () => {
    expect(
      hasModelSwitchContinuityEvidence(
        "model switch complete. reread the kickoff task; qa mission stays the same.",
      ),
    ).toBe(true);
  });

  it("rejects unrelated handoff chatter that never confirms the kickoff reread", () => {
    expect(
      hasModelSwitchContinuityEvidence(
        "subagent-handoff confirmed. qa report update: scenario pass. qa run complete.",
      ),
    ).toBe(false);
  });

  it("rejects over-scoped multi-line wrap-ups even if they mention a switch and the mission", () => {
    expect(
      hasModelSwitchContinuityEvidence(
        `model switch acknowledged. qa mission stays the same.

Final QA tally update: all mandatory scenarios resolved. QA run complete.`,
      ),
    ).toBe(false);
  });
});