/*
 * Mirror of https://github.com/openclaw/openclaw.git (synced 2026-06-30 16:23:32 +00:00).
 * Merged via squash.
 * Prepared head SHA: b6a81f07f1
 * Co-authored-by: steipete <58493+steipete@users.noreply.github.com>
 * Reviewed-by: @steipete
 * 2562 lines, 84 KiB, TypeScript
 */
// E2E tests for run-reply-agent execution and generated session artifacts.
import { mkdtemp, rm } from "node:fs/promises";
import { tmpdir } from "node:os";
import { join } from "node:path";
import { afterEach, beforeAll, beforeEach, describe, expect, it, vi } from "vitest";
import { saveSessionStore, type SessionEntry } from "../../config/sessions.js";
import { readSessionStoreForTest } from "../../config/sessions/test-helpers.js";
import type { TypingMode } from "../../config/types.js";
import type { TemplateContext } from "../templating.js";
import type { GetReplyOptions } from "../types.js";
import {
  enqueueFollowupRun,
  refreshQueuedFollowupSession,
  scheduleFollowupDrain,
  type FollowupRun,
  type QueueSettings,
} from "./queue.js";
import {
  REPLY_OPERATION_RUN_STATE,
  type ReplyOperationRunState,
  type ReplyOptionsWithOperationRunState,
} from "./reply-operation-run-state.js";
import { createReplyOperation, testing as replyRunTesting } from "./reply-run-registry.js";
import { consumeReplyUsageState } from "./reply-usage-state.js";
import { createMockTypingController } from "./test-helpers.js";
|
|
|
|
/**
 * Shape used by the tests to type the argument handed to `runEmbeddedAgentMock`
 * implementations. Every field is optional; the callbacks may be sync or async.
 */
type AgentRunParams = {
  sessionId?: string;
  sessionFile?: string;
  onPartialReply?: (payload: { text?: string }) => Promise<void> | void;
  onAssistantMessageStart?: () => Promise<void> | void;
  onReasoningStream?: (payload: { text?: string }) => Promise<void> | void;
  onBlockReply?: (payload: { text?: string; mediaUrls?: string[] }) => Promise<void> | void;
  // NOTE(review): `ReplyPayload` is not among the imports visible at the top of
  // this file — confirm where it is declared.
  onToolResult?: (payload: ReplyPayload) => Promise<void> | void;
  onAgentEvent?: (evt: { stream: string; data: Record<string, unknown> }) => void;
  silentExpected?: boolean;
};
|
|
|
|
// Shared mock handles. They are created through vi.hoisted so that the
// vi.mock factories in this file can reference them.
const state = vi.hoisted(() => ({
  compactEmbeddedAgentSessionMock: vi.fn(),
  queueEmbeddedAgentMessageMock: vi.fn(),
  runEmbeddedAgentMock: vi.fn(),
}));
|
|
|
|
/**
 * Counts how many elements of `items` satisfy `predicate`.
 *
 * @param items - Values to inspect; the array is not modified.
 * @param predicate - Called once per element, in order.
 * @returns The number of elements for which `predicate` returned true.
 */
function countMatching<T>(items: readonly T[], predicate: (item: T) => boolean): number {
  let count = 0;
  for (const item of items) {
    if (predicate(item)) {
      count += 1;
    }
  }
  return count;
}
|
|
|
|
/**
 * Narrows an unknown value to a plain string-keyed record.
 *
 * @param value - Value to check.
 * @param label - Name used in the error message when the check fails.
 * @returns `value`, typed as a record.
 * @throws Error when `value` is falsy, not an object, or an array.
 */
function requireRecord(value: unknown, label: string): Record<string, unknown> {
  if (!value || typeof value !== "object" || Array.isArray(value)) {
    throw new Error(`expected ${label} to be an object`);
  }
  return value as Record<string, unknown>;
}
|
|
|
|
/**
 * Returns the argument list recorded for one call of a vitest mock.
 *
 * @param mock - The mock whose recorded calls are inspected.
 * @param label - Name used in the error message when the call is missing.
 * @param callIndex - Zero-based index of the call to fetch (defaults to the first).
 * @returns The arguments of the requested call.
 * @throws Error when no call was recorded at `callIndex`.
 */
function mockCallArgs(mock: ReturnType<typeof vi.fn>, label: string, callIndex = 0): unknown[] {
  const call = mock.mock.calls[callIndex] as unknown[] | undefined;
  if (!call) {
    throw new Error(`expected ${label} mock call ${callIndex}`);
  }
  return call;
}
|
|
|
|
/**
 * Reads the session store at `storePath` and returns the entry for `sessionKey`.
 *
 * @param storePath - Path of the session store file to read.
 * @param sessionKey - Key of the entry to return (defaults to "main").
 * @returns The stored entry.
 * @throws Error when the store has no entry under `sessionKey`.
 */
function requireStoredSessionEntry(storePath: string, sessionKey = "main"): SessionEntry {
  const entry = readSessionStoreForTest(storePath)[sessionKey];
  if (!entry) {
    throw new Error(`expected stored session entry for ${sessionKey}`);
  }
  return entry;
}
|
|
|
|
// Module handles assigned in beforeAll via dynamic import.
let modelFallbackModule: typeof import("../../agents/model-fallback.js");
let onAgentEvent: typeof import("../../infra/agent-events.js").onAgentEvent;
|
|
|
|
// Cached promise for the dynamically imported `runReplyAgent`, so the module
// is imported at most once per test file.
let runReplyAgentPromise:
  | Promise<(typeof import("./agent-runner.js"))["runReplyAgent"]>
  | undefined;

/**
 * Lazily imports `./agent-runner.js` and resolves to its `runReplyAgent` export.
 * The first call starts the import; later calls reuse the same promise.
 */
async function getRunReplyAgent() {
  if (!runReplyAgentPromise) {
    runReplyAgentPromise = import("./agent-runner.js").then((m) => m.runReplyAgent);
  }
  return await runReplyAgentPromise;
}
|
|
|
|
// Replace model fallback with a pass-through: `run` is invoked exactly once with
// the requested provider/model and reported as completed with no attempts.
vi.mock("../../agents/model-fallback.js", () => ({
  runWithModelFallback: async ({
    provider,
    model,
    run,
  }: {
    provider: string;
    model: string;
    run: (provider: string, model: string) => Promise<unknown>;
  }) => ({
    outcome: "completed" as const,
    result: await run(provider, model),
    provider,
    model,
    attempts: [],
  }),
  // Recognizes errors by name plus an `attempts` array.
  isFallbackSummaryError: (err: unknown) =>
    err instanceof Error &&
    err.name === "FallbackSummaryError" &&
    Array.isArray((err as { attempts?: unknown[] }).attempts),
}));
|
|
|
|
// Route embedded-agent compaction and runs to the shared mocks in `state`.
// `queueEmbeddedAgentMessage` from this module is a standalone stub that
// returns false; it is not wired to `state.queueEmbeddedAgentMessageMock`.
vi.mock("../../agents/embedded-agent.js", () => ({
  compactEmbeddedAgentSession: (params: unknown) => state.compactEmbeddedAgentSessionMock(params),
  queueEmbeddedAgentMessage: vi.fn().mockReturnValue(false),
  runEmbeddedAgent: (params: unknown) => state.runEmbeddedAgentMock(params),
}));
|
|
|
|
// Forward message queueing from the runner's `runs` module to the shared mock.
vi.mock("../../agents/embedded-agent-runner/runs.js", () => ({
  queueEmbeddedAgentMessage: (sessionId: string, prompt: string, options: unknown) =>
    state.queueEmbeddedAgentMessageMock(sessionId, prompt, options),
}));
|
|
|
|
// Replace the followup queue functions with bare mocks; beforeEach resets them
// and sets the default return value for `enqueueFollowupRun`.
vi.mock("./queue.js", () => ({
  enqueueFollowupRun: vi.fn(),
  refreshQueuedFollowupSession: vi.fn(),
  scheduleFollowupDrain: vi.fn(),
}));
|
|
|
|
// One-time setup: load the dynamically imported modules up front.
beforeAll(async () => {
  // Avoid attributing the initial agent-runner import cost to the first test case.
  modelFallbackModule = await import("../../agents/model-fallback.js");
  ({ onAgentEvent } = await import("../../infra/agent-events.js"));
  await getRunReplyAgent();
});
|
|
|
|
// Per-test reset: clear the reply-run registry, restore every shared mock to
// its default behaviour, and stub OPENCLAW_TEST_FAST.
beforeEach(() => {
  replyRunTesting.resetReplyRunRegistry();
  state.compactEmbeddedAgentSessionMock.mockReset();
  state.compactEmbeddedAgentSessionMock.mockResolvedValue({
    ok: true,
    compacted: false,
    reason: "test-default",
  });
  state.runEmbeddedAgentMock.mockReset();
  // Default run result; individual tests override it with *Once variants.
  state.runEmbeddedAgentMock.mockResolvedValue({
    payloads: [{ text: "final" }],
    meta: { agentMeta: { usage: { input: 1, output: 1 } } },
  });
  state.queueEmbeddedAgentMessageMock.mockReset();
  state.queueEmbeddedAgentMessageMock.mockReturnValue(false);
  vi.mocked(enqueueFollowupRun).mockReset().mockReturnValue(true);
  vi.mocked(refreshQueuedFollowupSession).mockReset();
  vi.mocked(scheduleFollowupDrain).mockReset();
  // Read by createMinimalRun to set `skipProviderRuntimeHints`.
  vi.stubEnv("OPENCLAW_TEST_FAST", "1");
});
|
|
|
|
/**
 * Builds a minimal `runReplyAgent` invocation for tests.
 *
 * All inputs are optional. Anything not supplied falls back to the fixed
 * defaults below (provider "whatsapp", session key "main", queue mode
 * "interrupt", typing mode "instant", all boolean flags false).
 *
 * @param params - Overrides for the generated run; `runOverrides` is spread last
 *   into `followupRun.run`, and `sessionCtx` is spread last into the template context.
 * @returns The mock typing controller, the `opts` that were passed in, and a
 *   `run` function that lazily loads `runReplyAgent` and invokes it.
 */
function createMinimalRun(params?: {
  opts?: GetReplyOptions & ReplyOptionsWithOperationRunState;
  resolvedVerboseLevel?: "off" | "on";
  sessionStore?: Record<string, SessionEntry>;
  sessionEntry?: SessionEntry;
  sessionKey?: string;
  storePath?: string;
  typingMode?: TypingMode;
  blockStreamingEnabled?: boolean;
  isActive?: boolean;
  isRunActive?: () => boolean;
  isStreaming?: boolean;
  shouldSteer?: boolean;
  shouldFollowup?: boolean;
  resolvedQueueMode?: string;
  sessionCtx?: Partial<TemplateContext>;
  runOverrides?: Partial<FollowupRun["run"]>;
}) {
  const typing = createMockTypingController();
  const opts = params?.opts;
  const sessionCtx = {
    Provider: "whatsapp",
    MessageSid: "msg",
    ...params?.sessionCtx,
  } as unknown as TemplateContext;
  const resolvedQueue = {
    mode: params?.resolvedQueueMode ?? "interrupt",
  } as unknown as QueueSettings;
  const sessionKey = params?.sessionKey ?? "main";
  const followupRun = {
    prompt: "hello",
    summaryLine: "hello",
    enqueuedAt: Date.now(),
    run: {
      sessionId: "session",
      sessionKey,
      messageProvider: "whatsapp",
      sessionFile: "/tmp/session.jsonl",
      workspaceDir: "/tmp",
      config: {},
      skillsSnapshot: {},
      provider: "anthropic",
      model: "claude",
      thinkLevel: "low",
      verboseLevel: params?.resolvedVerboseLevel ?? "off",
      elevatedLevel: "off",
      bashElevated: {
        enabled: false,
        allowed: false,
        defaultLevel: "off",
      },
      timeoutMs: 1_000,
      blockReplyBreak: "message_end",
      // beforeEach stubs OPENCLAW_TEST_FAST to "1".
      skipProviderRuntimeHints: process.env.OPENCLAW_TEST_FAST === "1",
      ...params?.runOverrides,
    },
  } as unknown as FollowupRun;

  return {
    typing,
    opts,
    run: async () => {
      const runReplyAgent = await getRunReplyAgent();
      return runReplyAgent({
        commandBody: "hello",
        followupRun,
        // NOTE(review): queueKey is fixed to "main" even when `sessionKey` is overridden.
        queueKey: "main",
        resolvedQueue,
        shouldSteer: params?.shouldSteer ?? false,
        shouldFollowup: params?.shouldFollowup ?? false,
        isActive: params?.isActive ?? false,
        isRunActive: params?.isRunActive,
        isStreaming: params?.isStreaming ?? false,
        opts,
        typing,
        sessionEntry: params?.sessionEntry,
        sessionStore: params?.sessionStore,
        sessionKey,
        storePath: params?.storePath,
        sessionCtx,
        defaultModel: "anthropic/claude-opus-4-6",
        resolvedVerboseLevel: params?.resolvedVerboseLevel ?? "off",
        isNewSession: false,
        blockStreamingEnabled: params?.blockStreamingEnabled ?? false,
        resolvedBlockStreamingBreak: "message_end",
        shouldInjectGroupIntro: false,
        typingMode: params?.typingMode ?? "instant",
      });
    },
  };
}
|
|
|
|
// Admission, followup-queue and drain behaviour of runReplyAgent when another
// reply operation is (or is reported as) active for the same session key.
describe("runReplyAgent heartbeat followup guard", () => {
  it("drops heartbeat runs when reply-lane admission finds an active owner", async () => {
    const runState: ReplyOperationRunState = {};
    // Registers an operation for "main" before the heartbeat run starts.
    const active = createReplyOperation({
      sessionKey: "main",
      sessionId: "active-session",
      resetTriggered: false,
    });
    const { run, typing } = createMinimalRun({
      opts: { isHeartbeat: true, [REPLY_OPERATION_RUN_STATE]: runState },
      isActive: false,
      shouldFollowup: false,
    });

    const result = await run();

    expect(result).toBeUndefined();
    expect(state.runEmbeddedAgentMock).not.toHaveBeenCalled();
    expect(typing.cleanup).toHaveBeenCalledTimes(1);
    expect(runState.admission).toEqual({ status: "skipped", reason: "active-run" });
    active.complete();
  });

  it("records the operation owned by an admitted heartbeat run", async () => {
    const runState: ReplyOperationRunState = {};
    const { run } = createMinimalRun({
      opts: { isHeartbeat: true, [REPLY_OPERATION_RUN_STATE]: runState },
    });

    await run();

    expect(runState.admission).toEqual({ status: "owned" });
  });

  it("runs visible turns with the session id returned by admission", async () => {
    const active = createReplyOperation({
      sessionKey: "main",
      sessionId: "pre-compact-session",
      resetTriggered: false,
    });
    active.setPhase("preflight_compacting");
    const sessionStore = {
      main: {
        sessionId: "pre-compact-session",
        sessionFile: "/tmp/pre-compact.jsonl",
        updatedAt: Date.now(),
      },
    };
    const { run } = createMinimalRun({
      runOverrides: { sessionId: "stale-session" },
      sessionStore,
    });
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "final" }],
      meta: {
        agentMeta: {
          provider: "anthropic",
          model: "claude",
          usage: { input: 1, output: 1 },
        },
      },
    });

    const pending = run();
    // Yield one macrotask before rotating the active operation's session id.
    await new Promise<void>((resolve) => {
      setTimeout(resolve, 0);
    });
    active.updateSessionId("post-compact-session");
    sessionStore.main = {
      sessionId: "post-compact-session",
      sessionFile: "/tmp/post-compact.jsonl",
      updatedAt: Date.now(),
    };
    active.complete();
    await pending;

    expect(state.runEmbeddedAgentMock).toHaveBeenCalledTimes(1);
    const [call] = mockCallArgs(state.runEmbeddedAgentMock, "run embedded agent");
    expect((call as AgentRunParams).sessionId).toBe("post-compact-session");
    expect((call as AgentRunParams).sessionFile).toBe("/tmp/post-compact.jsonl");
  });

  it("drops runs when reply-lane admission sees an already-aborted caller", async () => {
    const abortController = new AbortController();
    abortController.abort();
    const runState: ReplyOperationRunState = {};
    const { run, typing } = createMinimalRun({
      opts: {
        abortSignal: abortController.signal,
        [REPLY_OPERATION_RUN_STATE]: runState,
      },
      isActive: false,
      shouldFollowup: false,
    });

    const result = await run();

    expect(result).toBeUndefined();
    expect(state.runEmbeddedAgentMock).not.toHaveBeenCalled();
    expect(typing.cleanup).toHaveBeenCalledTimes(1);
    expect(runState.admission).toEqual({ status: "skipped", reason: "aborted" });
  });

  it("drops heartbeat runs when another run is active", async () => {
    const runState: ReplyOperationRunState = {};
    const { run, typing } = createMinimalRun({
      opts: { isHeartbeat: true, [REPLY_OPERATION_RUN_STATE]: runState },
      isActive: true,
      shouldFollowup: true,
      resolvedQueueMode: "collect",
    });

    const result = await run();

    expect(result).toBeUndefined();
    expect(vi.mocked(enqueueFollowupRun)).not.toHaveBeenCalled();
    expect(state.runEmbeddedAgentMock).not.toHaveBeenCalled();
    expect(typing.cleanup).toHaveBeenCalledTimes(1);
    expect(runState.admission).toEqual({ status: "skipped", reason: "active-run" });
  });

  it("drops heartbeat runs before steering active streams", async () => {
    // Steering would succeed if attempted; the test asserts it is never attempted.
    state.queueEmbeddedAgentMessageMock.mockReturnValueOnce(true);
    const { run, typing } = createMinimalRun({
      opts: { isHeartbeat: true },
      isActive: true,
      isStreaming: true,
      shouldSteer: true,
      shouldFollowup: true,
      resolvedQueueMode: "collect",
    });

    const result = await run();

    expect(result).toBeUndefined();
    expect(state.queueEmbeddedAgentMessageMock).not.toHaveBeenCalled();
    expect(vi.mocked(enqueueFollowupRun)).not.toHaveBeenCalled();
    expect(state.runEmbeddedAgentMock).not.toHaveBeenCalled();
    expect(typing.cleanup).toHaveBeenCalledTimes(1);
  });

  it("still enqueues non-heartbeat runs when another run is active", async () => {
    const { run } = createMinimalRun({
      opts: { isHeartbeat: false },
      isActive: true,
      shouldFollowup: true,
      resolvedQueueMode: "collect",
    });

    const result = await run();

    expect(result).toBeUndefined();
    expect(vi.mocked(enqueueFollowupRun)).toHaveBeenCalledTimes(1);
    expect(state.runEmbeddedAgentMock).not.toHaveBeenCalled();
  });

  it("cleans up typing when followup admission is rejected", async () => {
    // The queue refuses the followup for this one call.
    vi.mocked(enqueueFollowupRun).mockReturnValueOnce(false);
    const { run, typing } = createMinimalRun({
      opts: { isHeartbeat: false },
      isActive: true,
      isRunActive: () => true,
      shouldFollowup: true,
      resolvedQueueMode: "collect",
    });

    const result = await run();

    expect(result).toBeUndefined();
    expect(vi.mocked(enqueueFollowupRun)).toHaveBeenCalledTimes(1);
    expect(vi.mocked(scheduleFollowupDrain)).not.toHaveBeenCalled();
    expect(state.runEmbeddedAgentMock).not.toHaveBeenCalled();
    expect(typing.cleanup).toHaveBeenCalledTimes(1);
  });

  it("keeps typing alive when a followup is queued behind a live active run", async () => {
    const active = createReplyOperation({
      sessionKey: "main",
      sessionId: "session",
      resetTriggered: false,
    });
    const { run, typing } = createMinimalRun({
      opts: { isHeartbeat: false },
      isActive: true,
      isRunActive: () => true,
      shouldFollowup: true,
      resolvedQueueMode: "collect",
    });

    const result = await run();

    expect(result).toBeUndefined();
    expect(vi.mocked(enqueueFollowupRun)).toHaveBeenCalledTimes(1);
    expect(vi.mocked(scheduleFollowupDrain)).not.toHaveBeenCalled();
    expect(state.runEmbeddedAgentMock).not.toHaveBeenCalled();
    expect(typing.startTypingLoop).toHaveBeenCalledTimes(1);
    expect(typing.refreshTypingTtl).toHaveBeenCalledTimes(1);
    expect(typing.cleanup).not.toHaveBeenCalled();
    active.complete();
  });

  it("starts draining after enqueue when the reply lane owner is already gone", async () => {
    const { run, typing } = createMinimalRun({
      opts: { isHeartbeat: false },
      isActive: true,
      isRunActive: () => false,
      shouldFollowup: true,
      resolvedQueueMode: "collect",
    });

    const result = await run();

    expect(result).toBeUndefined();
    expect(vi.mocked(enqueueFollowupRun)).toHaveBeenCalledTimes(1);
    // Sixth positional argument of enqueueFollowupRun.
    expect(vi.mocked(enqueueFollowupRun).mock.calls[0]?.[5]).toBe(false);
    expect(vi.mocked(scheduleFollowupDrain)).toHaveBeenCalledTimes(1);
    expect(state.runEmbeddedAgentMock).not.toHaveBeenCalled();
    expect(typing.cleanup).toHaveBeenCalledTimes(1);
  });

  it("keeps the drain dormant until the reply lane owner clears", async () => {
    const active = createReplyOperation({
      sessionKey: "main",
      sessionId: "session",
      resetTriggered: false,
    });
    const { run } = createMinimalRun({
      opts: { isHeartbeat: false },
      isActive: true,
      isRunActive: () => true,
      shouldFollowup: true,
      resolvedQueueMode: "collect",
    });

    await run();

    expect(vi.mocked(enqueueFollowupRun).mock.calls[0]?.[5]).toBe(false);
    expect(vi.mocked(scheduleFollowupDrain)).not.toHaveBeenCalled();

    active.complete();

    // The drain is expected synchronously once the owner completes.
    expect(vi.mocked(scheduleFollowupDrain)).toHaveBeenCalledTimes(1);
  });

  it("drains followup queue when an unexpected exception escapes the run path", async () => {
    const accounting = await import("./session-run-accounting.js");
    const persistSpy = vi
      .spyOn(accounting, "persistRunSessionUsage")
      .mockRejectedValueOnce(new Error("persist exploded"));
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "ok" }],
      meta: { agentMeta: { usage: { input: 1, output: 1 } } },
    });

    try {
      const { run } = createMinimalRun();
      await expect(run()).rejects.toThrow("persist exploded");
      expect(vi.mocked(scheduleFollowupDrain)).toHaveBeenCalledTimes(1);
    } finally {
      // Always restore the spy so later tests see the real implementation.
      persistSpy.mockRestore();
    }
  });
});
|
|
|
|
// Checks which final reply text (if any) runReplyAgent persists into the
// on-disk session store as pending final delivery.
describe("runReplyAgent pending final delivery capture", () => {
  // Temp directories created by createSessionStoreFile during the current test.
  const tempDirs: string[] = [];

  afterEach(async () => {
    // splice(0) empties the list so no directory is removed twice.
    await Promise.all(
      tempDirs.splice(0).map((dir) => rm(dir, { recursive: true, force: true })),
    );
  });

  /**
   * Writes a session store containing `entry` under "main" into a fresh temp
   * directory and returns the store path. The directory is removed in afterEach.
   */
  async function createSessionStoreFile(entry: SessionEntry) {
    const dir = await mkdtemp(join(tmpdir(), "openclaw-agent-runner-pending-"));
    tempDirs.push(dir);
    const storePath = join(dir, "sessions.json");
    await saveSessionStore(storePath, { main: entry }, { skipMaintenance: true });
    return storePath;
  }

  /** Reads the "main" entry back from the store file; throws when it is missing. */
  async function readStoredMainSession(storePath: string): Promise<SessionEntry> {
    return requireStoredSessionEntry(storePath);
  }

  it("does not persist message-tool-only final replies for heartbeat replay", async () => {
    const sessionEntry: SessionEntry = {
      sessionId: "session",
      updatedAt: Date.now(),
    };
    const sessionStore = { main: sessionEntry };
    const storePath = await createSessionStoreFile(sessionEntry);
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "private final" }],
      meta: {},
    });

    const { run } = createMinimalRun({
      opts: { sourceReplyDeliveryMode: "message_tool_only" },
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      storePath,
    });

    await run();

    const stored = await readStoredMainSession(storePath);
    expect(stored.pendingFinalDelivery).toBeUndefined();
    expect(stored.pendingFinalDeliveryText).toBeUndefined();
  });

  it("does not persist sendPolicy-denied final replies for heartbeat replay", async () => {
    const sessionEntry: SessionEntry = {
      sessionId: "session",
      updatedAt: Date.now(),
      sendPolicy: "deny",
    };
    const sessionStore = { main: sessionEntry };
    const storePath = await createSessionStoreFile(sessionEntry);
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "denied final" }],
      meta: {},
    });

    const { run } = createMinimalRun({
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      storePath,
    });

    await run();

    const stored = await readStoredMainSession(storePath);
    expect(stored.pendingFinalDelivery).toBeUndefined();
    expect(stored.pendingFinalDeliveryText).toBeUndefined();
  });

  it("persists only visible non-reasoning final reply text", async () => {
    const sessionEntry: SessionEntry = {
      sessionId: "session",
      updatedAt: Date.now(),
    };
    const sessionStore = { main: sessionEntry };
    const storePath = await createSessionStoreFile(sessionEntry);
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "hidden reasoning", isReasoning: true }, { text: "visible final" }],
      meta: {},
    });

    const { run } = createMinimalRun({
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      storePath,
    });

    await run();

    const stored = await readStoredMainSession(storePath);
    expect(stored.pendingFinalDelivery).toBe(true);
    expect(stored.pendingFinalDeliveryText).toBe("visible final");
  });

  it("persists auto-reply delivery context for restart recovery", async () => {
    const sessionEntry: SessionEntry = {
      sessionId: "session",
      updatedAt: Date.now(),
    };
    const sessionStore = { main: sessionEntry };
    const storePath = await createSessionStoreFile(sessionEntry);
    state.runEmbeddedAgentMock.mockImplementationOnce(async () => {
      // Inspect the store while the agent run is still in flight.
      const storedDuringRun = await readStoredMainSession(storePath);
      expect(storedDuringRun.restartRecoveryDeliveryContext).toEqual({
        channel: "discord",
        to: "channel:24680",
        accountId: "work",
        threadId: "1503645939964055592",
      });
      expect(typeof storedDuringRun.restartRecoveryDeliveryRunId).toBe("string");
      return {
        payloads: [{ text: "visible final" }],
        meta: {},
      };
    });

    const { run } = createMinimalRun({
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        OriginatingTo: "channel:24680",
        AccountId: "work",
        MessageSid: "1503645939964055592",
        MessageThreadId: "1503645939964055592",
      },
      runOverrides: { messageProvider: "discord" },
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      storePath,
    });

    await run();

    const stored = await readStoredMainSession(storePath);
    expect(stored.pendingFinalDelivery).toBe(true);
    expect(stored.pendingFinalDeliveryText).toBe("visible final");
    expect(stored.pendingFinalDeliveryContext).toEqual({
      channel: "discord",
      to: "channel:24680",
      accountId: "work",
      threadId: "1503645939964055592",
    });
    // The in-flight recovery markers must be gone once the run has finished.
    expect(stored.restartRecoveryDeliveryContext).toBeUndefined();
    expect(stored.restartRecoveryDeliveryRunId).toBeUndefined();
  });

  it("keeps heartbeat replies with real content in pending final delivery", async () => {
    const sessionEntry: SessionEntry = {
      sessionId: "session",
      updatedAt: Date.now(),
    };
    const sessionStore = { main: sessionEntry };
    const storePath = await createSessionStoreFile(sessionEntry);
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "Sent daily summary to channel." }],
      meta: {},
    });

    const { run } = createMinimalRun({
      opts: { isHeartbeat: true },
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      storePath,
    });

    await run();

    const stored = await readStoredMainSession(storePath);
    expect(stored.pendingFinalDelivery).toBe(true);
    expect(stored.pendingFinalDeliveryText).toBe("Sent daily summary to channel.");
  });

  it("persists heartbeat reply remainder as pending delivery when remainder exceeds ackMaxChars", async () => {
    // When a heartbeat response contains HEARTBEAT_OK followed by substantive content,
    // the remainder after stripping the token must be persisted for durable delivery.
    // The default ackMaxChars is 300 — any remainder longer than that is treated as real content.
    const sessionEntry: SessionEntry = {
      sessionId: "session",
      updatedAt: Date.now(),
    };
    const sessionStore = { main: sessionEntry };
    const storePath = await createSessionStoreFile(sessionEntry);
    const longRemainder = "Sent daily digest to channel. ".repeat(12).trimEnd(); // ~360 chars, > 300
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: `HEARTBEAT_OK ${longRemainder}` }],
      meta: {},
    });

    const { run } = createMinimalRun({
      opts: { isHeartbeat: true },
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      storePath,
    });

    await run();

    const stored = await readStoredMainSession(storePath);
    expect(stored.pendingFinalDelivery).toBe(true);
    expect(stored.pendingFinalDeliveryText).toBe(longRemainder);
  });
});
|
|
|
|
describe("runReplyAgent typing (heartbeat)", () => {
|
|
// A non-heartbeat run forwards partial text and drives the typing controller.
it("signals typing for normal runs", async () => {
  const onPartialReply = vi.fn();
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onPartialReply?.({ text: "hi" });
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run, typing } = createMinimalRun({
    opts: { isHeartbeat: false, onPartialReply },
  });
  await run();

  expect(onPartialReply).toHaveBeenCalled();
  expect(typing.startTypingOnText).toHaveBeenCalledWith("hi");
  expect(typing.startTypingLoop).toHaveBeenCalled();
});
|
|
|
|
// A heartbeat run still forwards partial text but never touches typing.
it("never signals typing for heartbeat runs", async () => {
  const onPartialReply = vi.fn();
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onPartialReply?.({ text: "hi" });
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run, typing } = createMinimalRun({
    opts: { isHeartbeat: true, onPartialReply },
  });
  await run();

  expect(onPartialReply).toHaveBeenCalled();
  expect(typing.startTypingOnText).not.toHaveBeenCalled();
  expect(typing.startTypingLoop).not.toHaveBeenCalled();
});
|
|
|
|
// A bare HEARTBEAT_OK reply must not be stored as pending final delivery.
it("does not persist heartbeat ack text as pending final delivery", async () => {
  const dir = await mkdtemp(join(tmpdir(), "openclaw-heartbeat-pending-"));
  try {
    // Store setup happens inside the try so the temp directory is removed even
    // when writing the initial store fails.
    const storePath = join(dir, "sessions.json");
    await saveSessionStore(
      storePath,
      { main: { sessionId: "session", updatedAt: 1 } },
      { skipMaintenance: true },
    );
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "HEARTBEAT_OK" }],
      meta: {},
    });

    const { run } = createMinimalRun({
      opts: { isHeartbeat: true },
      sessionCtx: { Provider: "heartbeat" },
      sessionKey: "main",
      storePath,
    });
    await run();

    const stored = requireStoredSessionEntry(storePath);
    expect(stored.pendingFinalDelivery).toBeUndefined();
    expect(stored.pendingFinalDeliveryText).toBeUndefined();
  } finally {
    await rm(dir, { recursive: true, force: true });
  }
});
|
|
|
|
// Table-driven: each case streams `partials`, returns `finalText`, and lists
// which partial texts the caller's onPartialReply is expected to receive.
it("suppresses NO_REPLY partials but allows normal No-prefix partials", async () => {
  const cases = [
    {
      partials: ["NO_REPLY"],
      finalText: "NO_REPLY",
      expectedForwarded: [] as string[],
      shouldType: false,
    },
    {
      // Token arriving in growing prefixes.
      partials: ["NO", "NO_", "NO_RE", "NO_REPLY"],
      finalText: "NO_REPLY",
      expectedForwarded: [] as string[],
      shouldType: false,
    },
    {
      // Ordinary text that merely starts with "No".
      partials: ["No", "No, that is valid"],
      finalText: "No, that is valid",
      expectedForwarded: ["No", "No, that is valid"],
      shouldType: true,
    },
    {
      // Token glued to real text: only the text after the token is forwarded.
      partials: ["NO_REPLYThe user is saying hello"],
      finalText: "NO_REPLYThe user is saying hello",
      expectedForwarded: ["The user is saying hello"],
      shouldType: true,
    },
  ] as const;

  for (const testCase of cases) {
    const onPartialReply = vi.fn();
    state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
      for (const text of testCase.partials) {
        await params.onPartialReply?.({ text });
      }
      return { payloads: [{ text: testCase.finalText }], meta: {} };
    });

    const { run, typing } = createMinimalRun({
      opts: { isHeartbeat: false, onPartialReply },
      typingMode: "message",
    });
    await run();

    if (testCase.expectedForwarded.length === 0) {
      expect(onPartialReply).not.toHaveBeenCalled();
    } else {
      expect(onPartialReply).toHaveBeenCalledTimes(testCase.expectedForwarded.length);
      testCase.expectedForwarded.forEach((text, index) => {
        expect(onPartialReply).toHaveBeenNthCalledWith(index + 1, {
          text,
          mediaUrls: undefined,
        });
      });
    }

    if (testCase.shouldType) {
      expect(typing.startTypingOnText).toHaveBeenCalled();
    } else {
      expect(typing.startTypingOnText).not.toHaveBeenCalled();
    }
    expect(typing.startTypingLoop).not.toHaveBeenCalled();
  }
});
|
|
|
|
// Streaming a combined partial preview must not drop the separate final payloads.
it("keeps final text blocks after partial preview streaming", async () => {
  const onPartialReply = vi.fn();
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onPartialReply?.({ text: "First block\n\nSecond block" });
    return {
      payloads: [{ text: "First block" }, { text: "Second block" }],
      meta: {},
    };
  });

  const { run } = createMinimalRun({
    opts: { onPartialReply },
    typingMode: "message",
  });

  const result = await run();

  expect(onPartialReply).toHaveBeenCalledWith({ text: "First block\n\nSecond block" });
  expect(result).toEqual([
    expect.objectContaining({ text: "First block" }),
    expect.objectContaining({ text: "Second block" }),
  ]);
});
|
|
|
|
// With `silentExpected` set, text that merely narrates NO_REPLY is not
// surfaced through any callback and the run resolves to undefined.
it("suppresses narrated silent-turn partials, block replies, and final payloads", async () => {
  const onPartialReply = vi.fn();
  const onBlockReply = vi.fn();
  const onReasoningStream = vi.fn();
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    // The override from createMinimalRun must reach the embedded agent.
    expect(params.silentExpected).toBe(true);
    await params.onReasoningStream?.({ text: "Reasoning:\nI am trying to send NO_REPLY now." });
    await params.onPartialReply?.({ text: "I am trying to send NO_REPLY now." });
    await params.onBlockReply?.({ text: "I am trying to send NO_REPLY now." });
    return { payloads: [{ text: "I am trying to send NO_REPLY now." }], meta: {} };
  });

  const { run } = createMinimalRun({
    opts: { isHeartbeat: false, onPartialReply, onBlockReply, onReasoningStream },
    blockStreamingEnabled: true,
    runOverrides: { silentExpected: true },
  });
  const res = await run();

  expect(onReasoningStream).not.toHaveBeenCalled();
  expect(onPartialReply).not.toHaveBeenCalled();
  expect(onBlockReply).not.toHaveBeenCalled();
  expect(res).toBeUndefined();
});
|
|
|
|
// With `silentExpected` set, a bare NO_REPLY is not surfaced through any
// callback and the run resolves to undefined.
it("suppresses bare NO_REPLY silent-turn payloads", async () => {
  const onPartialReply = vi.fn();
  const onBlockReply = vi.fn();
  const onReasoningStream = vi.fn();
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    // The override from createMinimalRun must reach the embedded agent.
    expect(params.silentExpected).toBe(true);
    await params.onReasoningStream?.({ text: "Reasoning:\nNO_REPLY" });
    await params.onPartialReply?.({ text: "NO_REPLY" });
    await params.onBlockReply?.({ text: "NO_REPLY" });
    return { payloads: [{ text: "NO_REPLY" }], meta: { finalAssistantText: "NO_REPLY" } };
  });

  const { run } = createMinimalRun({
    opts: { isHeartbeat: false, onPartialReply, onBlockReply, onReasoningStream },
    blockStreamingEnabled: true,
    runOverrides: { silentExpected: true },
  });
  const res = await run();

  expect(onReasoningStream).not.toHaveBeenCalled();
  expect(onPartialReply).not.toHaveBeenCalled();
  expect(onBlockReply).not.toHaveBeenCalled();
  expect(res).toBeUndefined();
});
|
|
|
|
// In "message" typing mode, an assistant-message-start event with no text
// must not trigger any typing signal.
it("does not start typing on assistant message start without prior text in message mode", async () => {
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onAssistantMessageStart?.();
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run, typing } = createMinimalRun({
    typingMode: "message",
  });
  await run();

  expect(typing.startTypingLoop).not.toHaveBeenCalled();
  expect(typing.startTypingOnText).not.toHaveBeenCalled();
});
|
|
|
|
it("starts typing from reasoning stream in thinking mode", async () => {
  // Reasoning is streamed first, followed by a partial assistant chunk.
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onReasoningStream?.({ text: "Reasoning:\n_step_" });
    await params.onPartialReply?.({ text: "hi" });
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run: execute, typing: typingController } = createMinimalRun({ typingMode: "thinking" });
  await execute();

  // The typing loop is expected to start; text-triggered typing must stay unused.
  expect(typingController.startTypingLoop).toHaveBeenCalled();
  expect(typingController.startTypingOnText).not.toHaveBeenCalled();
});
|
|
|
|
it("keeps assistant partial streaming enabled when reasoning mode is stream", async () => {
  const onReasoningStream = vi.fn();
  const onPartialReply = vi.fn();

  // The stubbed agent streams one reasoning chunk and one answer chunk.
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onReasoningStream?.({ text: "Reasoning:\n_step_" });
    await params.onPartialReply?.({ text: "answer chunk" });
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run: execute } = createMinimalRun({
    opts: { onPartialReply, onReasoningStream },
    runOverrides: { reasoningLevel: "stream" },
  });
  await execute();

  // Both the reasoning stream and the partial answer must reach the caller.
  expect(onReasoningStream).toHaveBeenCalled();
  expect(onPartialReply).toHaveBeenCalledWith({ text: "answer chunk", mediaUrls: undefined });
});
|
|
|
|
it("suppresses typing in never mode", async () => {
  // A partial reply would normally be a typing trigger; "never" mode must ignore it.
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onPartialReply?.({ text: "hi" });
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run: execute, typing: typingController } = createMinimalRun({ typingMode: "never" });
  await execute();

  expect(typingController.startTypingOnText).not.toHaveBeenCalled();
  expect(typingController.startTypingLoop).not.toHaveBeenCalled();
});
|
|
|
|
it("signals typing on normalized block replies", async () => {
  const onBlockReply = vi.fn();

  // The block text carries leading newlines so the normalized form can be asserted below.
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onBlockReply?.({ text: "\n\nchunk", mediaUrls: [] });
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run: execute, typing: typingController } = createMinimalRun({
    typingMode: "message",
    blockStreamingEnabled: true,
    opts: { onBlockReply },
  });
  await execute();

  expect(typingController.startTypingOnText).toHaveBeenCalledWith("chunk");
  expect(onBlockReply).toHaveBeenCalled();

  // Inspect the first forwarded call: payload first, delivery options second.
  const [firstPayload, firstOptions] = onBlockReply.mock.calls.at(0) ?? [];

  const payloadRecord = requireRecord(firstPayload, "block payload");
  expect(payloadRecord.text).toBe("chunk");
  expect(payloadRecord.audioAsVoice).toBe(false);

  const optionsRecord = requireRecord(firstOptions, "block options");
  expect(optionsRecord.abortSignal).toBeInstanceOf(AbortSignal);
  expect(optionsRecord.timeoutMs).toBeTypeOf("number");
});
|
|
|
|
it("strips workflow function response scaffolding from final delivery", async () => {
  // Final text that mixes visible prose with function-call/response scaffolding.
  const scaffoldedText = [
    "Visible intro.",
    "<function_calls>",
    '<invoke name="exec"><parameter name="command">node scripts/search.mjs</parameter></invoke>',
    "</function_calls>",
    "<function_response>",
    'Searching for: "what skills matter most in the age of AI"',
    "...",
    "</function_response>",
    "Visible answer.",
  ].join("\n");

  state.runEmbeddedAgentMock.mockImplementationOnce(async () => ({
    payloads: [{ text: scaffoldedText }],
    meta: {},
  }));

  const { run: execute } = createMinimalRun();
  const outcome = await execute();
  const delivered = Array.isArray(outcome) ? outcome : outcome ? [outcome] : [];

  // Only the visible prose should remain in the single delivered payload.
  expect(delivered).toHaveLength(1);
  expect(delivered[0]?.text).toBe("Visible intro.\n\n\nVisible answer.");
});
|
|
|
|
it("handles typing for normal and silent tool results", async () => {
  // Each scenario states whether the tool text should trigger typing and be forwarded.
  const scenarios = [
    { toolText: "tooling", shouldType: true, shouldForward: true },
    { toolText: "NO_REPLY", shouldType: false, shouldForward: false },
  ] as const;

  for (const { toolText, shouldType, shouldForward } of scenarios) {
    const onToolResult = vi.fn();
    state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
      await params.onToolResult?.({ text: toolText, mediaUrls: [] });
      return { payloads: [{ text: "final" }], meta: {} };
    });

    const { run: execute, typing: typingController } = createMinimalRun({
      typingMode: "message",
      opts: { onToolResult },
    });
    await execute();

    // Typing expectation for this scenario.
    if (!shouldType) {
      expect(typingController.startTypingOnText).not.toHaveBeenCalled();
    } else {
      expect(typingController.startTypingOnText).toHaveBeenCalledWith(toolText);
    }

    // Forwarding expectation for this scenario.
    if (!shouldForward) {
      expect(onToolResult).not.toHaveBeenCalled();
    } else {
      expect(onToolResult).toHaveBeenCalledWith({
        text: toolText,
        mediaUrls: [],
      });
    }
  }
});
|
|
|
|
it("preserves channelData on forwarded tool results", async () => {
  const onToolResult = vi.fn();
  const approvalText = "Approval required.\n\n```txt\n/approve 117ba06d allow-once\n```";
  const approvalId = "117ba06d-1111-2222-3333-444444444444";
  const approvalSlug = "117ba06d";

  // The stubbed agent reports a tool result that carries exec-approval channel data.
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onToolResult?.({
      text: approvalText,
      channelData: {
        execApproval: {
          approvalId,
          approvalSlug,
          allowedDecisions: ["allow-once", "allow-always", "deny"],
        },
      },
    });
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run: execute } = createMinimalRun({
    typingMode: "message",
    opts: { onToolResult },
  });
  await execute();

  // The forwarded payload must carry the same text and channel data.
  expect(onToolResult).toHaveBeenCalledWith({
    text: approvalText,
    channelData: {
      execApproval: {
        approvalId,
        approvalSlug,
        allowedDecisions: ["allow-once", "allow-always", "deny"],
      },
    },
  });
});
|
|
|
|
it("forwards media-only tool results without typing text", async () => {
  const onToolResult = vi.fn();

  // The tool result has media but no text.
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onToolResult?.({ mediaUrls: ["/tmp/generated.png"] });
    return { payloads: [{ text: "final" }], meta: {} };
  });

  const { run: execute, typing: typingController } = createMinimalRun({
    typingMode: "message",
    opts: { onToolResult },
  });
  await execute();

  expect(typingController.startTypingOnText).not.toHaveBeenCalled();
  expect(onToolResult).toHaveBeenCalledTimes(1);

  // The forwarded payload keeps the media and carries no text.
  const firstArgument = mockCallArgs(onToolResult, "onToolResult")[0];
  const forwarded = requireRecord(firstArgument, "tool payload");
  expect(forwarded.mediaUrls).toEqual(["/tmp/generated.png"]);
  expect(forwarded.text).toBeUndefined();
});
|
|
|
|
it("retries transient HTTP failures once with timer-driven backoff", async () => {
  vi.useFakeTimers();
  // Real timers are restored in `finally` so a failed assertion or a rejected run
  // cannot leave fake timers installed for the tests that follow.
  try {
    let calls = 0;
    // First attempt fails with a transient HTTP error; every later attempt succeeds.
    state.runEmbeddedAgentMock.mockImplementation(async () => {
      calls += 1;
      if (calls === 1) {
        throw new Error("502 Bad Gateway");
      }
      return { payloads: [{ text: "final" }], meta: {} };
    });

    const { run } = createMinimalRun({
      typingMode: "message",
    });
    const runPromise = run();

    // Just short of 2500 ms no retry may have been issued yet.
    await vi.advanceTimersByTimeAsync(2_499);
    expect(calls).toBe(1);
    // One more millisecond lets the retry fire.
    await vi.advanceTimersByTimeAsync(1);
    await runPromise;
    expect(calls).toBe(2);
  } finally {
    vi.useRealTimers();
  }
});
|
|
|
|
it("announces model fallback transitions across verbose levels", async () => {
  const cases = [
    { name: "verbose on", verbose: "on" as const },
    { name: "verbose off", verbose: "off" as const },
  ] as const;
  for (const testCase of cases) {
    const sessionEntry: SessionEntry = {
      sessionId: "session",
      updatedAt: Date.now(),
    };
    const sessionStore = { main: sessionEntry };
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "final" }],
      meta: {},
    });
    // Stub the fallback runner: report one fallback step, then complete on the fallback model.
    const fallbackSpy = vi
      .spyOn(modelFallbackModule, "runWithModelFallback")
      .mockImplementationOnce(async (args) => {
        const { run, onFallbackStep } = args;
        await onFallbackStep?.({
          fallbackStepType: "fallback_step",
          fallbackStepFromModel: "fireworks/fireworks/accounts/fireworks/routers/kimi-k2p5-turbo",
          fallbackStepToModel: "deepinfra/moonshotai/Kimi-K2.5",
          fallbackStepFromFailureReason: "rate_limit",
          fallbackStepFinalOutcome: "succeeded",
        });
        return {
          outcome: "completed" as const,
          result: await run("deepinfra", "moonshotai/Kimi-K2.5"),
          provider: "deepinfra",
          model: "moonshotai/Kimi-K2.5",
          attempts: [
            {
              provider: "fireworks",
              model: "fireworks/accounts/fireworks/routers/kimi-k2p5-turbo",
              error: "Provider fireworks is in cooldown (all profiles unavailable)",
              reason: "rate_limit",
            },
          ],
        };
      });

    // Restore the spy even when the run or an assertion fails, matching the
    // other fallback tests in this file.
    try {
      const { run } = createMinimalRun({
        resolvedVerboseLevel: testCase.verbose,
        sessionEntry,
        sessionStore,
        sessionKey: "main",
      });
      // Collect lifecycle phases emitted while the run is in flight.
      const phases: string[] = [];
      const off = onAgentEvent((evt) => {
        const phase = typeof evt.data?.phase === "string" ? evt.data.phase : null;
        if (evt.stream === "lifecycle" && phase) {
          phases.push(phase);
        }
      });
      let res: Awaited<ReturnType<typeof run>>;
      try {
        res = await run();
      } finally {
        // Always detach the listener so a rejected run cannot leak it into later tests.
        off();
      }
      const payload = Array.isArray(res)
        ? (res[0] as { text?: string })
        : (res as { text?: string });
      expect(payload.text, testCase.name).toContain("Model Fallback:");
      expect(payload.text, testCase.name).toContain("deepinfra/moonshotai/Kimi-K2.5");
      expect(sessionEntry.fallbackNoticeReason, testCase.name).toBe("rate limit");
      expect(
        phases.filter((phase) => phase === "fallback"),
        testCase.name,
      ).toHaveLength(1);
      expect(phases, testCase.name).toContain("fallback_step");
    } finally {
      fallbackSpy.mockRestore();
    }
  }
});
|
|
|
|
it("does not report an exhausted fallback candidate as a successful winner", async () => {
  const root = await mkdtemp(join(tmpdir(), "openclaw-exhausted-trace-"));
  const storePath = join(root, "sessions.json");
  const sessionFile = join(root, "session.jsonl");
  const runId = "run-exhausted-trace";
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
    traceLevel: "raw",
  };
  // The fallback runner reports exhaustion even though the single attempt returned a result.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(async (args) => ({
      outcome: "exhausted",
      result: await args.run("anthropic", "claude"),
      provider: "anthropic",
      model: "claude",
      attempts: [
        {
          provider: "anthropic",
          model: "claude",
          error: "Agent ended incomplete",
          reason: "format",
        },
      ],
    }));
  try {
    // Saving inside the try block guarantees the temp directory is removed even if the save fails.
    await saveSessionStore(storePath, { main: sessionEntry }, { skipMaintenance: true });
    // The embedded result carries an execution trace that claims a successful winner.
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "Terminal tool summary", isError: true }],
      meta: {
        error: {
          kind: "incomplete_turn",
          message: "Agent ended incomplete",
          fallbackSafe: true,
          terminalPresentation: true,
        },
        executionTrace: {
          winnerProvider: "anthropic",
          winnerModel: "claude",
          attempts: [{ provider: "anthropic", model: "claude", result: "success" }],
          fallbackUsed: false,
          runner: "embedded",
        },
        agentMeta: {
          sessionId: "session",
          provider: "anthropic",
          model: "claude",
          usage: { input: 10, output: 2 },
        },
      },
    });

    const { run } = createMinimalRun({
      opts: { runId },
      sessionEntry,
      sessionStore: { main: sessionEntry },
      sessionKey: "main",
      storePath,
      runOverrides: {
        sessionFile,
        traceAuthorized: true,
      },
    });
    const result = await run();
    const text = (Array.isArray(result) ? result : [result])
      .map((payload) => payload?.text ?? "")
      .join("\n");

    // The rendered trace must not present the exhausted candidate as a winner.
    expect(text).not.toContain("winner=anthropic/claude");
    expect(text).not.toContain("result=success");
    expect(text).toContain("Summary: fallback=yes attempts=1");
    expect(consumeReplyUsageState(runId)?.resolvedRef).toBeUndefined();
  } finally {
    // Restore the spy like the other fallback tests in this file, then clean up the temp dir.
    fallbackSpy.mockRestore();
    await rm(root, { recursive: true, force: true });
  }
});
|
|
|
|
it("does not persist active fallback state for internal subagent announce fallback", async () => {
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
    modelProvider: "openai",
    model: "gpt-5.5",
    responseUsage: "tokens",
  };
  const sessionStore = { main: sessionEntry };
  const storeRoot = await mkdtemp(join(tmpdir(), "openclaw-internal-fallback-"));
  const storePath = join(storeRoot, "sessions.json");
  // Stub the fallback runner: report one fallback step, then complete on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(async (args) => {
      const { run, onFallbackStep } = args;
      await onFallbackStep?.({
        fallbackStepType: "fallback_step",
        fallbackStepFromModel: "openai/gpt-5.5",
        fallbackStepToModel: "google/gemini-2.5-flash",
        fallbackStepFromFailureReason: "timeout",
        fallbackStepFinalOutcome: "succeeded",
      });
      return {
        outcome: "completed" as const,
        result: await run("google", "gemini-2.5-flash"),
        provider: "google",
        model: "gemini-2.5-flash",
        attempts: [
          {
            provider: "openai",
            model: "gpt-5.5",
            error: "codex app-server attempt timed out",
            reason: "timeout",
          },
        ],
      };
    });
  try {
    // Saving inside the try block guarantees the temp directory is removed even if the save fails.
    await saveSessionStore(storePath, sessionStore, { skipMaintenance: true });
    state.runEmbeddedAgentMock.mockResolvedValueOnce({
      payloads: [{ text: "subagent timed out" }],
      meta: {
        agentMeta: {
          usage: {
            input: 100,
            output: 50,
          },
        },
      },
    });

    // The run is marked as an internal inter-session subagent announcement.
    const { run } = createMinimalRun({
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      storePath,
      runOverrides: {
        inputProvenance: {
          kind: "inter_session",
          sourceSessionKey: "agent:codex:subagent:c34fca91",
          sourceChannel: "__internal__",
          sourceTool: "subagent_announce",
        },
      },
    });
    const res = await run();

    // The in-memory session entry keeps its original model and gains no fallback state.
    expect(sessionEntry.modelProvider).toBe("openai");
    expect(sessionEntry.model).toBe("gpt-5.5");
    expect(sessionEntry.providerOverride).toBeUndefined();
    expect(sessionEntry.modelOverride).toBeUndefined();
    expect(sessionEntry.modelOverrideSource).toBeUndefined();
    expect(sessionEntry.fallbackNoticeSelectedModel).toBeUndefined();
    expect(sessionEntry.fallbackNoticeActiveModel).toBeUndefined();
    expect(sessionEntry.fallbackNoticeReason).toBeUndefined();
    // The entry read back from disk must agree.
    const persistedSession = requireStoredSessionEntry(storePath);
    expect(persistedSession.modelProvider).toBe("openai");
    expect(persistedSession.model).toBe("gpt-5.5");
    expect(persistedSession.providerOverride).toBeUndefined();
    expect(persistedSession.modelOverride).toBeUndefined();
    expect(persistedSession.modelOverrideSource).toBeUndefined();
    expect(persistedSession.fallbackNoticeSelectedModel).toBeUndefined();
    expect(persistedSession.fallbackNoticeActiveModel).toBeUndefined();
    // No fallback or usage notice may appear in the delivered payloads.
    const payloads = Array.isArray(res) ? res : res ? [res] : [];
    expect(payloads.some((payload) => payload.text?.includes("Model Fallback:"))).toBe(false);
    expect(payloads.some((payload) => payload.text?.includes("Usage:"))).toBe(false);
  } finally {
    // Restore the spy like the other fallback tests in this file, then clean up the temp dir.
    fallbackSpy.mockRestore();
    await rm(storeRoot, { recursive: true, force: true });
  }
});
|
|
|
|
it("surfaces empty internal fallback failures without persisting visible fallback state", async () => {
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
    modelProvider: "openai",
    model: "gpt-5.5",
  };
  const sessionStore = { main: sessionEntry };
  // The fallback model returns no payloads at all.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [],
    meta: {},
  });
  // Stub the fallback runner: report one fallback step, then complete on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(async (args) => {
      const { run, onFallbackStep } = args;
      await onFallbackStep?.({
        fallbackStepType: "fallback_step",
        fallbackStepFromModel: "openai/gpt-5.5",
        fallbackStepToModel: "google/gemini-2.5-flash",
        fallbackStepFromFailureReason: "timeout",
        fallbackStepFinalOutcome: "succeeded",
      });
      return {
        outcome: "completed" as const,
        result: await run("google", "gemini-2.5-flash"),
        provider: "google",
        model: "gemini-2.5-flash",
        attempts: [
          {
            provider: "openai",
            model: "gpt-5.5",
            error: "codex app-server attempt timed out",
            reason: "timeout",
          },
        ],
      };
    });

  // Restore the spy even when the run or an assertion fails, matching the
  // other fallback tests in this file.
  try {
    // The run is marked as an internal inter-session subagent announcement.
    const { run } = createMinimalRun({
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      runOverrides: {
        inputProvenance: {
          kind: "inter_session",
          sourceSessionKey: "agent:codex:subagent:c34fca91",
          sourceChannel: "__internal__",
          sourceTool: "subagent_announce",
        },
      },
    });
    const res = await run();

    // An error payload naming the fallback model is expected...
    const payload = Array.isArray(res) ? res[0] : res;
    expect(payload?.isError).toBe(true);
    expect(payload?.text).toContain("Fallback used google/gemini-2.5-flash");
    // ...while the session entry keeps its original model and gains no fallback state.
    expect(sessionEntry.modelProvider).toBe("openai");
    expect(sessionEntry.model).toBe("gpt-5.5");
    expect(sessionEntry.providerOverride).toBeUndefined();
    expect(sessionEntry.modelOverride).toBeUndefined();
    expect(sessionEntry.modelOverrideSource).toBeUndefined();
    expect(sessionEntry.fallbackNoticeSelectedModel).toBeUndefined();
    expect(sessionEntry.fallbackNoticeActiveModel).toBeUndefined();
    expect(sessionEntry.fallbackNoticeReason).toBeUndefined();
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("keeps fallback transition notices when block streaming has no final text", async () => {
  const onBlockReply = vi.fn();
  const sessionEntry: SessionEntry = { sessionId: "session", updatedAt: Date.now() };
  const sessionStore = { main: sessionEntry };
  const fallbackProvider = "deepinfra";
  const fallbackModel = "moonshotai/Kimi-K2.5";

  // The answer is delivered only through block streaming; the final payload list is empty.
  state.runEmbeddedAgentMock.mockImplementationOnce(async (params: AgentRunParams) => {
    await params.onBlockReply?.({ text: "streamed answer" });
    return { payloads: [], meta: {} };
  });
  // The fallback runner completes on the fallback model after one rate-limited attempt.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: "fireworks",
            model: "fireworks/accounts/fireworks/routers/kimi-k2p5-turbo",
            error: "Provider fireworks is in cooldown (all profiles unavailable)",
            reason: "rate_limit",
          },
        ],
      }),
    );
  try {
    const { run: execute } = createMinimalRun({
      blockStreamingEnabled: true,
      opts: { onBlockReply },
      sessionEntry,
      sessionStore,
      sessionKey: "main",
    });
    const outcome = await execute();
    const delivered = Array.isArray(outcome) ? outcome : outcome ? [outcome] : [];

    // Only the fallback notice is returned; the streamed text is not repeated in it.
    expect(onBlockReply).toHaveBeenCalled();
    expect(delivered).toHaveLength(1);
    expect(delivered[0]?.text).toContain("Model Fallback:");
    expect(delivered[0]?.text).not.toContain("streamed answer");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("threads fallback notices without consuming the first assistant reply slot", async () => {
  const sessionEntry: SessionEntry = { sessionId: "session", updatedAt: Date.now() };
  const sessionStore = { main: sessionEntry };
  const fallbackProvider = "deepinfra";
  const fallbackModel = "moonshotai/Kimi-K2.5";

  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [{ text: "final" }],
    meta: {},
  });
  // The fallback runner completes on the fallback model after one rate-limited attempt.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: "fireworks",
            model: "fireworks/accounts/fireworks/routers/kimi-k2p5-turbo",
            error: "Provider fireworks is in cooldown (all profiles unavailable)",
            reason: "rate_limit",
          },
        ],
      }),
    );
  try {
    // WhatsApp is configured with replyToMode "first".
    const { run: execute } = createMinimalRun({
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      runOverrides: {
        config: {
          channels: {
            whatsapp: {
              replyToMode: "first",
            },
          },
        },
      },
    });
    const outcome = await execute();
    const delivered = Array.isArray(outcome) ? outcome : outcome ? [outcome] : [];

    // Notice first, assistant reply second; both are threaded to the same message id.
    expect(delivered).toHaveLength(2);
    const [notice, reply] = delivered;
    expect(notice?.text).toContain("Model Fallback:");
    expect(notice?.replyToId).toBe("msg");
    expect(reply?.text).toBe("final");
    expect(reply?.replyToId).toBe("msg");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("surfaces a configured backend failure when fallback produces no visible reply", async () => {
  const configuredProvider = "lmstudio";
  const configuredModel = "gemma-4-e4b-it";
  const fallbackProvider = "openai";
  const fallbackModel = "gpt-5.5";

  // The fallback model answers with the silent token only.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [{ text: "NO_REPLY" }],
    meta: {},
  });
  // The configured backend failed once; the fallback runner completes on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: configuredProvider,
            model: configuredModel,
            error: "Connection error.",
            reason: "timeout",
          },
        ],
      }),
    );

  try {
    const { run: execute } = createMinimalRun({
      runOverrides: {
        provider: configuredProvider,
        model: configuredModel,
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        MessageSid: "1503645939964055592",
      },
    });
    const outcome = await execute();
    const firstPayload = Array.isArray(outcome) ? outcome[0] : outcome;

    // An error payload must name the configured backend, the fallback, and the silence.
    expect(firstPayload?.isError).toBe(true);
    expect(firstPayload?.text).toContain("configured model backend lmstudio/gemma-4-e4b-it");
    expect(firstPayload?.text).toContain("Fallback used openai/gpt-5.5");
    expect(firstPayload?.text).toContain("no visible reply");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("surfaces a configured backend failure when fallback returns no payloads", async () => {
  const configuredProvider = "lmstudio";
  const configuredModel = "gemma-4-e4b-it";
  const fallbackProvider = "openai";
  const fallbackModel = "gpt-5.5";

  // The fallback model returns an empty payload list.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [],
    meta: {},
  });
  // The configured backend failed once; the fallback runner completes on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: configuredProvider,
            model: configuredModel,
            error: "Connection error.",
            reason: "timeout",
          },
        ],
      }),
    );

  try {
    const { run: execute } = createMinimalRun({
      runOverrides: {
        provider: configuredProvider,
        model: configuredModel,
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        MessageSid: "1503645939964055592",
      },
    });
    const outcome = await execute();
    const firstPayload = Array.isArray(outcome) ? outcome[0] : outcome;

    // An error payload must name the configured backend, the fallback, and the silence.
    expect(firstPayload?.isError).toBe(true);
    expect(firstPayload?.text).toContain("configured model backend lmstudio/gemma-4-e4b-it");
    expect(firstPayload?.text).toContain("Fallback used openai/gpt-5.5");
    expect(firstPayload?.text).toContain("no visible reply");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("surfaces a persisted configured backend failure when the active fallback is silent", async () => {
  const activeProvider = "openai";
  const activeModel = "gpt-5.5";
  // The session already records an automatic override and the backend it fell back from.
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
    providerOverride: activeProvider,
    modelOverride: activeModel,
    modelOverrideSource: "auto",
    modelOverrideFallbackOriginProvider: "lmstudio",
    modelOverrideFallbackOriginModel: "gemma-4-e4b-it",
  };
  const sessionStore = { main: sessionEntry };

  // The active fallback model answers with the silent token only.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [{ text: "NO_REPLY" }],
    meta: {},
  });

  const { run: execute } = createMinimalRun({
    runOverrides: {
      provider: activeProvider,
      model: activeModel,
    },
    sessionEntry,
    sessionStore,
    sessionCtx: {
      Provider: "discord",
      OriginatingChannel: "discord",
      MessageSid: "1503677587568722061",
    },
  });
  const outcome = await execute();
  const firstPayload = Array.isArray(outcome) ? outcome[0] : outcome;

  // An error payload must name the original backend, the fallback, and the silence.
  expect(firstPayload?.isError).toBe(true);
  expect(firstPayload?.text).toContain("configured model backend lmstudio/gemma-4-e4b-it");
  expect(firstPayload?.text).toContain("Fallback used openai/gpt-5.5");
  expect(firstPayload?.text).toContain("no visible reply");
});
|
|
|
|
it("announces fallback without silence failure when fallback already replied through a messaging tool", async () => {
  const configuredProvider = "lmstudio";
  const configuredModel = "gemma-4-e4b-it";
  const fallbackProvider = "openai";
  const fallbackModel = "gpt-5.5";

  // The result records that the same text was already sent through the messaging tool.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [{ text: "already sent" }],
    messagingToolSentTexts: ["already sent"],
    messagingToolSentTargets: [{ tool: "message", provider: "discord", to: "channel:C1" }],
    meta: {},
  });
  // The configured backend failed once; the fallback runner completes on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: configuredProvider,
            model: configuredModel,
            error: "Connection error.",
            reason: "timeout",
          },
        ],
      }),
    );

  try {
    const { run: execute } = createMinimalRun({
      runOverrides: {
        provider: configuredProvider,
        model: configuredModel,
        messageProvider: "discord",
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        OriginatingTo: "channel:C1",
        AccountId: "primary",
        MessageSid: "1503645939964055592",
      },
    });

    const outcome = await execute();
    const firstPayload = Array.isArray(outcome) ? outcome[0] : outcome;

    // A plain fallback notice is expected, not a silence error.
    expect(firstPayload?.isError).not.toBe(true);
    expect(firstPayload?.text).toContain("Model Fallback:");
    expect(firstPayload?.text).not.toContain("no visible reply");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("does not report silent fallback failure after a did-send-only side effect", async () => {
  const configuredProvider = "lmstudio";
  const configuredModel = "gemma-4-e4b-it";
  const fallbackProvider = "openai";
  const fallbackModel = "gpt-5.5";

  // No payloads, but the result flags that something was sent via the messaging tool.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [],
    didSendViaMessagingTool: true,
    meta: {},
  });
  // The configured backend failed once; the fallback runner completes on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: configuredProvider,
            model: configuredModel,
            error: "Connection error.",
            reason: "timeout",
          },
        ],
      }),
    );

  try {
    const { run: execute } = createMinimalRun({
      runOverrides: {
        provider: configuredProvider,
        model: configuredModel,
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        MessageSid: "1503645939964055592",
      },
    });

    const outcome = await execute();
    const firstPayload = Array.isArray(outcome) ? outcome[0] : outcome;

    // A plain fallback notice is expected, not a silence error.
    expect(firstPayload?.isError).not.toBe(true);
    expect(firstPayload?.text).toContain("Model Fallback:");
    expect(firstPayload?.text).not.toContain("no visible reply");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("does not treat whitespace-only messaging evidence as fallback delivery", async () => {
  const configuredProvider = "lmstudio";
  const configuredModel = "gemma-4-e4b-it";
  const fallbackProvider = "openai";
  const fallbackModel = "gpt-5.5";

  // Every piece of messaging-tool evidence is whitespace only.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [{ text: "NO_REPLY" }],
    messagingToolSentTexts: [" "],
    messagingToolSentMediaUrls: ["\t"],
    messagingToolSentTargets: [
      { tool: "message", provider: "discord", to: "channel:C1", text: " " },
    ],
    meta: {},
  });
  // The configured backend failed once; the fallback runner completes on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: configuredProvider,
            model: configuredModel,
            error: "Connection error.",
            reason: "timeout",
          },
        ],
      }),
    );

  try {
    const { run: execute } = createMinimalRun({
      runOverrides: {
        provider: configuredProvider,
        model: configuredModel,
        messageProvider: "discord",
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        OriginatingTo: "channel:C1",
        AccountId: "primary",
        MessageSid: "1503645939964055592",
      },
    });
    const outcome = await execute();
    const firstPayload = Array.isArray(outcome) ? outcome[0] : outcome;

    // The silence error is still expected.
    expect(firstPayload?.isError).toBe(true);
    expect(firstPayload?.text).toContain("configured model backend lmstudio/gemma-4-e4b-it");
    expect(firstPayload?.text).toContain("Fallback used openai/gpt-5.5");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("announces fallback without silence failure when fallback already completed a cron side effect", async () => {
  const configuredProvider = "lmstudio";
  const configuredModel = "gemma-4-e4b-it";
  const fallbackProvider = "openai";
  const fallbackModel = "gpt-5.5";

  // The reply is the silent token, but the result reports one successful cron add.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [{ text: "NO_REPLY" }],
    successfulCronAdds: 1,
    meta: {},
  });
  // The configured backend failed once; the fallback runner completes on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: configuredProvider,
            model: configuredModel,
            error: "Connection error.",
            reason: "timeout",
          },
        ],
      }),
    );

  try {
    const { run: execute } = createMinimalRun({
      runOverrides: {
        provider: configuredProvider,
        model: configuredModel,
        messageProvider: "discord",
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        OriginatingTo: "channel:C1",
        AccountId: "primary",
        MessageSid: "1503645939964055592",
      },
    });

    const outcome = await execute();
    const firstPayload = Array.isArray(outcome) ? outcome[0] : outcome;

    // A plain fallback notice is expected, not a silence error.
    expect(firstPayload?.isError).not.toBe(true);
    expect(firstPayload?.text).toContain("Model Fallback:");
    expect(firstPayload?.text).not.toContain("no visible reply");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("announces fallback without silence failure when fallback committed target-only messaging delivery", async () => {
  const configuredProvider = "lmstudio";
  const configuredModel = "gemma-4-e4b-it";
  const fallbackProvider = "openai";
  const fallbackModel = "gpt-5.5";

  // The reply is the silent token; the only delivery evidence is a messaging target.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [{ text: "NO_REPLY" }],
    messagingToolSentTargets: [{ tool: "message", provider: "discord", to: "channel:C1" }],
    meta: {},
  });
  // The configured backend failed once; the fallback runner completes on the fallback model.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run(fallbackProvider, fallbackModel),
        provider: fallbackProvider,
        model: fallbackModel,
        attempts: [
          {
            provider: configuredProvider,
            model: configuredModel,
            error: "Connection error.",
            reason: "timeout",
          },
        ],
      }),
    );

  try {
    const { run: execute } = createMinimalRun({
      runOverrides: {
        provider: configuredProvider,
        model: configuredModel,
        messageProvider: "discord",
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        OriginatingTo: "channel:C1",
        AccountId: "primary",
        MessageSid: "1503645939964055592",
      },
    });

    const outcome = await execute();
    const firstPayload = Array.isArray(outcome) ? outcome[0] : outcome;

    // A plain fallback notice is expected, not a silence error.
    expect(firstPayload?.isError).not.toBe(true);
    expect(firstPayload?.text).toContain("Model Fallback:");
    expect(firstPayload?.text).not.toContain("no visible reply");
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("announces fallback without silence failure when fallback already delivered an approval prompt", async () => {
  // The embedded run produces no payloads but flags that a deterministic
  // approval prompt was already sent.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [],
    didSendDeterministicApprovalPrompt: true,
    meta: {},
  });
  // One failed lmstudio attempt, then the turn completes on openai/gpt-5.5.
  const runWithFallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run: attempt }: { run: (provider: string, model: string) => Promise<unknown> }) => {
        const result = await attempt("openai", "gpt-5.5");
        return {
          outcome: "completed" as const,
          result,
          provider: "openai",
          model: "gpt-5.5",
          attempts: [
            {
              provider: "lmstudio",
              model: "gemma-4-e4b-it",
              error: "Connection error.",
              reason: "timeout",
            },
          ],
        };
      },
    );

  try {
    const { run } = createMinimalRun({
      runOverrides: {
        provider: "lmstudio",
        model: "gemma-4-e4b-it",
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        MessageSid: "1503645939964055592",
      },
    });

    const reply = await run();
    const [firstPayload] = Array.isArray(reply) ? reply : [reply];

    // The fallback notice is surfaced, but not as an error and without the
    // "no visible reply" failure text.
    expect(firstPayload?.isError).not.toBe(true);
    expect(firstPayload?.text).toContain("Model Fallback:");
    expect(firstPayload?.text).not.toContain("no visible reply");
  } finally {
    runWithFallbackSpy.mockRestore();
  }
});
|
|
|
|
it("preserves intentional fallback silence when the turn permits silent replies", async () => {
  // The embedded run answers with only the NO_REPLY token.
  state.runEmbeddedAgentMock.mockResolvedValueOnce({
    payloads: [{ text: "NO_REPLY" }],
    meta: {},
  });
  // One failed lmstudio attempt, then the turn completes on openai/gpt-5.5.
  const runWithFallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementationOnce(
      async ({ run: attempt }: { run: (provider: string, model: string) => Promise<unknown> }) => {
        const result = await attempt("openai", "gpt-5.5");
        return {
          outcome: "completed" as const,
          result,
          provider: "openai",
          model: "gpt-5.5",
          attempts: [
            {
              provider: "lmstudio",
              model: "gemma-4-e4b-it",
              error: "Connection error.",
              reason: "timeout",
            },
          ],
        };
      },
    );

  try {
    // Unmentioned channel message with empty-reply-as-silent enabled.
    const { run } = createMinimalRun({
      runOverrides: {
        provider: "lmstudio",
        model: "gemma-4-e4b-it",
        allowEmptyAssistantReplyAsSilent: true,
      },
      sessionCtx: {
        Provider: "discord",
        OriginatingChannel: "discord",
        OriginatingTo: "channel:C1",
        ChatType: "channel",
        WasMentioned: false,
        MessageSid: "1503645939964055592",
      },
    });

    // No payload at all is expected: the silence is kept instead of being
    // replaced by a fallback notice.
    const pendingReply = run();
    await expect(pendingReply).resolves.toBeUndefined();
  } finally {
    runWithFallbackSpy.mockRestore();
  }
});
|
|
|
|
it("announces model fallback only once per active fallback state", async () => {
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
  };
  const sessionStore = { main: sessionEntry };

  state.runEmbeddedAgentMock.mockResolvedValue({
    payloads: [{ text: "final" }],
    meta: {},
  });
  // Every turn reports the same fallback: one rate-limited fireworks attempt,
  // then completion on deepinfra.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementation(
      async ({ run }: { run: (provider: string, model: string) => Promise<unknown> }) => ({
        outcome: "completed" as const,
        result: await run("deepinfra", "moonshotai/Kimi-K2.5"),
        provider: "deepinfra",
        model: "moonshotai/Kimi-K2.5",
        attempts: [
          {
            provider: "fireworks",
            model: "fireworks/accounts/fireworks/routers/kimi-k2p5-turbo",
            error: "Provider fireworks is in cooldown (all profiles unavailable)",
            reason: "rate_limit",
          },
        ],
      }),
    );
  try {
    const { run } = createMinimalRun({
      resolvedVerboseLevel: "on",
      sessionEntry,
      sessionStore,
      sessionKey: "main",
    });
    // Collect only lifecycle events whose phase is "fallback".
    const fallbackEvents: Array<Record<string, unknown>> = [];
    const off = onAgentEvent((evt) => {
      if (evt.stream === "lifecycle" && evt.data?.phase === "fallback") {
        fallbackEvents.push(evt.data);
      }
    });
    try {
      const first = await run();
      const second = await run();

      const firstText = Array.isArray(first) ? first[0]?.text : first?.text;
      const secondText = Array.isArray(second) ? second[0]?.text : second?.text;
      // Only the first turn carries the notice, and only one event is emitted.
      expect(firstText).toContain("Model Fallback:");
      expect(secondText).not.toContain("Model Fallback:");
      expect(fallbackEvents).toHaveLength(1);
    } finally {
      // Unsubscribe even when a run rejects or an assertion fails, so the
      // listener cannot leak into later tests.
      off();
    }
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("re-announces model fallback after returning to selected model", async () => {
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
  };
  const sessionStore = { main: sessionEntry };
  let invocation = 0;

  state.runEmbeddedAgentMock.mockResolvedValue({
    payloads: [{ text: "final" }],
    meta: {},
  });
  // Turns 1 and 3 fall back to deepinfra; turn 2 runs on the requested
  // provider/model with no failed attempts.
  const runWithFallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementation(
      async ({
        provider,
        model,
        run: attempt,
      }: {
        provider: string;
        model: string;
        run: (provider: string, model: string) => Promise<unknown>;
      }) => {
        invocation += 1;
        const servedBySelectedModel = invocation === 2;
        if (servedBySelectedModel) {
          const result = await attempt(provider, model);
          return {
            outcome: "completed" as const,
            result,
            provider,
            model,
            attempts: [],
          };
        }
        const result = await attempt("deepinfra", "moonshotai/Kimi-K2.5");
        return {
          outcome: "completed" as const,
          result,
          provider: "deepinfra",
          model: "moonshotai/Kimi-K2.5",
          attempts: [
            {
              provider: "fireworks",
              model: "fireworks/accounts/fireworks/routers/kimi-k2p5-turbo",
              error: "Provider fireworks is in cooldown (all profiles unavailable)",
              reason: "rate_limit",
            },
          ],
        };
      },
    );
  try {
    const { run } = createMinimalRun({
      resolvedVerboseLevel: "on",
      sessionEntry,
      sessionStore,
      sessionKey: "main",
    });
    const firstReply = await run();
    const secondReply = await run();
    const thirdReply = await run();

    const [firstPayload] = Array.isArray(firstReply) ? firstReply : [firstReply];
    const [secondPayload] = Array.isArray(secondReply) ? secondReply : [secondReply];
    const [thirdPayload] = Array.isArray(thirdReply) ? thirdReply : [thirdReply];
    // The notice appears on turn 1, is absent on turn 2, and appears again on
    // turn 3.
    expect(firstPayload?.text).toContain("Model Fallback:");
    expect(secondPayload?.text).not.toContain("Model Fallback:");
    expect(thirdPayload?.text).toContain("Model Fallback:");
  } finally {
    runWithFallbackSpy.mockRestore();
  }
});
|
|
|
|
it("announces fallback-cleared once when runtime returns to selected model", async () => {
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
  };
  const sessionStore = { main: sessionEntry };
  let callCount = 0;

  state.runEmbeddedAgentMock.mockResolvedValue({
    payloads: [{ text: "final" }],
    meta: {},
  });
  // Only the first turn falls back to deepinfra; later turns run on the
  // requested provider/model with no failed attempts.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementation(
      async ({
        provider,
        model,
        run,
      }: {
        provider: string;
        model: string;
        run: (provider: string, model: string) => Promise<unknown>;
      }) => {
        callCount += 1;
        if (callCount === 1) {
          return {
            outcome: "completed" as const,
            result: await run("deepinfra", "moonshotai/Kimi-K2.5"),
            provider: "deepinfra",
            model: "moonshotai/Kimi-K2.5",
            attempts: [
              {
                provider: "fireworks",
                model: "fireworks/accounts/fireworks/routers/kimi-k2p5-turbo",
                error: "Provider fireworks is in cooldown (all profiles unavailable)",
                reason: "rate_limit",
              },
            ],
          };
        }
        return {
          outcome: "completed" as const,
          result: await run(provider, model),
          provider,
          model,
          attempts: [],
        };
      },
    );
  try {
    const { run } = createMinimalRun({
      resolvedVerboseLevel: "on",
      sessionEntry,
      sessionStore,
      sessionKey: "main",
    });
    // Record the phase of every lifecycle event that has a string phase.
    const phases: string[] = [];
    const off = onAgentEvent((evt) => {
      const phase = typeof evt.data?.phase === "string" ? evt.data.phase : null;
      if (evt.stream === "lifecycle" && phase) {
        phases.push(phase);
      }
    });
    try {
      const first = await run();
      const second = await run();
      const third = await run();

      const firstText = Array.isArray(first) ? first[0]?.text : first?.text;
      const secondText = Array.isArray(second) ? second[0]?.text : second?.text;
      const thirdText = Array.isArray(third) ? third[0]?.text : third?.text;
      // Fallback is announced on turn 1, cleared on turn 2, and the cleared
      // notice is not repeated on turn 3.
      expect(firstText).toContain("Model Fallback:");
      expect(secondText).toContain("Model Fallback cleared:");
      expect(thirdText).not.toContain("Model Fallback cleared:");
      expect(countMatching(phases, (phase) => phase === "fallback")).toBe(1);
      expect(countMatching(phases, (phase) => phase === "fallback_cleared")).toBe(1);
    } finally {
      // Unsubscribe even when a run rejects or an assertion fails, so the
      // listener cannot leak into later tests.
      off();
    }
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("announces fallback transitions and emits lifecycle events while verbose is off", async () => {
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
  };
  const sessionStore = { main: sessionEntry };
  let callCount = 0;

  state.runEmbeddedAgentMock.mockResolvedValue({
    payloads: [{ text: "final" }],
    meta: {},
  });
  // Only the first turn falls back to deepinfra; the next turn runs on the
  // requested provider/model with no failed attempts.
  const fallbackSpy = vi
    .spyOn(modelFallbackModule, "runWithModelFallback")
    .mockImplementation(
      async ({
        provider,
        model,
        run,
      }: {
        provider: string;
        model: string;
        run: (provider: string, model: string) => Promise<unknown>;
      }) => {
        callCount += 1;
        if (callCount === 1) {
          return {
            outcome: "completed" as const,
            result: await run("deepinfra", "moonshotai/Kimi-K2.5"),
            provider: "deepinfra",
            model: "moonshotai/Kimi-K2.5",
            attempts: [
              {
                provider: "fireworks",
                model: "fireworks/accounts/fireworks/routers/kimi-k2p5-turbo",
                error: "Provider fireworks is in cooldown (all profiles unavailable)",
                reason: "rate_limit",
              },
            ],
          };
        }
        return {
          outcome: "completed" as const,
          result: await run(provider, model),
          provider,
          model,
          attempts: [],
        };
      },
    );
  try {
    // Same scenario as the verbose variant, but with verbose level "off".
    const { run } = createMinimalRun({
      resolvedVerboseLevel: "off",
      sessionEntry,
      sessionStore,
      sessionKey: "main",
    });
    // Record the phase of every lifecycle event that has a string phase.
    const phases: string[] = [];
    const off = onAgentEvent((evt) => {
      const phase = typeof evt.data?.phase === "string" ? evt.data.phase : null;
      if (evt.stream === "lifecycle" && phase) {
        phases.push(phase);
      }
    });
    try {
      const first = await run();
      const second = await run();

      const firstText = Array.isArray(first) ? first[0]?.text : first?.text;
      const secondText = Array.isArray(second) ? second[0]?.text : second?.text;
      expect(firstText).toContain("Model Fallback:");
      expect(secondText).toContain("Model Fallback cleared:");
      expect(countMatching(phases, (phase) => phase === "fallback")).toBe(1);
      expect(countMatching(phases, (phase) => phase === "fallback_cleared")).toBe(1);
    } finally {
      // Unsubscribe even when a run rejects or an assertion fails, so the
      // listener cannot leak into later tests.
      off();
    }
  } finally {
    fallbackSpy.mockRestore();
  }
});
|
|
|
|
it("updates fallback reason summary while fallback stays active", async () => {
  // Each scenario: the reason already stored on the session (if any), the
  // reason reported by the failed attempt, and the summary expected afterwards.
  const cases = [
    {
      existingReason: undefined,
      reportedReason: "rate_limit",
      expectedReason: "rate limit",
    },
    {
      existingReason: undefined,
      reportedReason: "overloaded",
      expectedReason: "overloaded",
    },
    {
      existingReason: "rate limit",
      reportedReason: "timeout",
      expectedReason: "timeout",
    },
  ] as const;

  for (const { existingReason, reportedReason, expectedReason } of cases) {
    // The session starts with a fallback already recorded (anthropic/claude
    // selected, deepinfra active).
    const sessionEntry: SessionEntry = {
      sessionId: "session",
      updatedAt: Date.now(),
      fallbackNoticeSelectedModel: "anthropic/claude",
      fallbackNoticeActiveModel: "deepinfra/moonshotai/Kimi-K2.5",
      ...(existingReason ? { fallbackNoticeReason: existingReason } : {}),
      modelProvider: "deepinfra",
      model: "moonshotai/Kimi-K2.5",
    };
    const sessionStore = { main: sessionEntry };

    state.runEmbeddedAgentMock.mockResolvedValue({
      payloads: [{ text: "final" }],
      meta: {},
    });
    const runWithFallbackSpy = vi
      .spyOn(modelFallbackModule, "runWithModelFallback")
      .mockImplementation(
        async ({ run: attempt }: { run: (provider: string, model: string) => Promise<unknown> }) => {
          const result = await attempt("deepinfra", "moonshotai/Kimi-K2.5");
          return {
            outcome: "completed" as const,
            result,
            provider: "deepinfra",
            model: "moonshotai/Kimi-K2.5",
            attempts: [
              {
                provider: "anthropic",
                model: "claude",
                error: "Provider anthropic is in cooldown (all profiles unavailable)",
                reason: reportedReason,
              },
            ],
          };
        },
      );
    try {
      const { run } = createMinimalRun({
        resolvedVerboseLevel: "on",
        sessionEntry,
        sessionStore,
        sessionKey: "main",
      });
      const reply = await run();
      const [firstPayload] = Array.isArray(reply) ? reply : [reply];
      // No new notice is shown, but the stored reason is updated.
      expect(firstPayload?.text).not.toContain("Model Fallback:");
      expect(sessionEntry.fallbackNoticeReason).toBe(expectedReason);
    } finally {
      runWithFallbackSpy.mockRestore();
    }
  }
});
|
|
|
|
it("does not persist fallback state for an equivalent CLI runtime alias", async () => {
  // The session starts with a fallback notice pairing anthropic/claude-opus-4-7
  // with claude-cli/claude-opus-4-7.
  const sessionEntry: SessionEntry = {
    sessionId: "session",
    updatedAt: Date.now(),
    fallbackNoticeSelectedModel: "anthropic/claude-opus-4-7",
    fallbackNoticeActiveModel: "claude-cli/claude-opus-4-7",
    fallbackNoticeReason: "selected model unavailable",
  };
  const sessionStore = { main: sessionEntry };
  const dir = await mkdtemp(join(tmpdir(), "openclaw-agent-runner-cli-alias-"));
  try {
    const storePath = join(dir, "sessions.json");
    await saveSessionStore(storePath, { main: sessionEntry }, { skipMaintenance: true });

    // The embedded run reports claude-cli as the provider that served the turn.
    state.runEmbeddedAgentMock.mockResolvedValue({
      payloads: [{ text: "final" }],
      meta: {
        agentMeta: {
          provider: "claude-cli",
          model: "claude-opus-4-7",
          usage: { input: 36_000, output: 19_000 },
        },
      },
    });

    const { run } = createMinimalRun({
      sessionEntry,
      sessionStore,
      sessionKey: "main",
      storePath,
      runOverrides: {
        provider: "anthropic",
        model: "claude-opus-4-7",
        config: {
          agents: {
            defaults: {
              cliBackends: {
                "claude-cli": { command: "claude" },
              },
            },
          },
        },
      },
    });
    await run();

    // Fallback notice fields are cleared both in memory and in the stored
    // entry, while the runtime provider/model and token totals are recorded.
    const stored = requireStoredSessionEntry(storePath);
    expect(sessionEntry.fallbackNoticeSelectedModel).toBeUndefined();
    expect(sessionEntry.fallbackNoticeActiveModel).toBeUndefined();
    expect(stored.fallbackNoticeSelectedModel).toBeUndefined();
    expect(stored.fallbackNoticeActiveModel).toBeUndefined();
    expect(stored.modelProvider).toBe("claude-cli");
    expect(stored.model).toBe("claude-opus-4-7");
    expect(stored.totalTokens).toBe(36_000);
    expect(stored.totalTokensFresh).toBe(true);
  } finally {
    // Remove the temporary store directory so repeated runs do not accumulate
    // leftovers in the OS temp dir, even when an assertion fails.
    await rm(dir, { recursive: true, force: true });
  }
});
|
|
|
|
it("surfaces overflow fallback when embedded run returns empty payloads", async () => {
  // The embedded run returns no payloads and reports a context_overflow error.
  state.runEmbeddedAgentMock.mockImplementationOnce(async () => {
    return {
      payloads: [],
      meta: {
        durationMs: 1,
        error: {
          kind: "context_overflow",
          message: 'Context overflow: Summarization failed: 400 {"message":"prompt is too long"}',
        },
      },
    };
  });

  const { run } = createMinimalRun();
  const reply = await run();
  const [overflowPayload] = Array.isArray(reply) ? reply : [reply];
  if (!overflowPayload) {
    throw new Error("expected payload");
  }
  // The reply text must contain each of these recovery hints.
  const { text } = overflowPayload;
  expect(text).toContain("Auto-compaction could not recover this turn");
  expect(text).toContain("reserveTokensFloor");
  expect(text).toContain("/new");
});
|
|
|
|
it("surfaces overflow fallback when embedded payload text is whitespace-only", async () => {
  // The embedded run returns a single whitespace-only error payload and
  // reports a context_overflow error.
  state.runEmbeddedAgentMock.mockImplementationOnce(async () => {
    return {
      payloads: [{ text: " \n\t ", isError: true }],
      meta: {
        durationMs: 1,
        error: {
          kind: "context_overflow",
          message: 'Context overflow: Summarization failed: 400 {"message":"prompt is too long"}',
        },
      },
    };
  });

  const { run } = createMinimalRun();
  const reply = await run();
  const [overflowPayload] = Array.isArray(reply) ? reply : [reply];
  if (!overflowPayload) {
    throw new Error("expected payload");
  }
  // The reply text must contain each of these recovery hints.
  const { text } = overflowPayload;
  expect(text).toContain("Auto-compaction could not recover this turn");
  expect(text).toContain("reserveTokensFloor");
  expect(text).toContain("/new");
});
|
|
|
|
it("returns friendly message for role ordering errors thrown as exceptions", async () => {
  // The embedded run rejects with a raw provider error.
  const roleOrderingFailure = async () => {
    throw new Error("400 Incorrect role information");
  };
  state.runEmbeddedAgentMock.mockImplementationOnce(roleOrderingFailure);

  const { run } = createMinimalRun({});
  const reply = await run();

  // The reply explains the rejection without leaking the raw status code.
  const friendlyPayload = requireRecord(reply, "ordering conflict payload");
  expect(friendlyPayload.text).toContain("model provider rejected the conversation state");
  expect(friendlyPayload.text).not.toContain("400");
});
|
|
|
|
it("rewrites Bun socket errors into friendly text", async () => {
  // The embedded run returns one error payload carrying the socket-closed
  // TypeError text.
  state.runEmbeddedAgentMock.mockImplementationOnce(async () => {
    return {
      payloads: [
        {
          text: "TypeError: The socket connection was closed unexpectedly. For more information, pass `verbose: true` in the second argument to fetch()",
          isError: true,
        },
      ],
      meta: {},
    };
  });

  const { run } = createMinimalRun();
  const reply = await run();
  // Normalize a single payload, an array, or undefined into a list.
  const replyPayloads = Array.isArray(reply) ? reply : reply ? [reply] : [];
  expect(replyPayloads.length).toBe(1);
  // Friendly headline plus the original detail inside a fenced block.
  const rewrittenText = replyPayloads[0]?.text;
  expect(rewrittenText).toContain("LLM connection failed");
  expect(rewrittenText).toContain("socket connection was closed unexpectedly");
  expect(rewrittenText).toContain("```");
});
|
|
});
|
|
|
|
import type { ReplyPayload } from "../types.js";
|