mirror of
https://github.com/openclaw/openclaw.git
synced 2026-05-03 05:00:25 +00:00
110 lines
3.7 KiB
TypeScript
110 lines
3.7 KiB
TypeScript
import type { Message, Model } from "@mariozechner/pi-ai";
|
|
import { describe, expect, it, vi } from "vitest";
|
|
import {
|
|
completeSimpleWithLiveTimeout,
|
|
extractAssistantText,
|
|
logLiveCache,
|
|
} from "./live-cache-test-support.js";
|
|
import { isLiveTestEnabled } from "./live-test-helpers.js";
|
|
import { wrapStreamFnSanitizeMalformedToolCalls } from "./pi-embedded-runner/run/attempt.tool-call-normalization.js";
|
|
import { buildAssistantMessageWithZeroUsage } from "./stream-message-shared.js";
|
|
|
|
const ANTHROPIC_LIVE = isLiveTestEnabled(["ANTHROPIC_LIVE_TEST"]);
|
|
const describeLive = ANTHROPIC_LIVE ? describe : describe.skip;
|
|
const ANTHROPIC_TIMEOUT_MS = 120_000;
|
|
const TOOL_OUTPUT_SENTINEL = "TOOL-RESULT-LIVE-MAGENTA";
|
|
|
|
function buildLiveAnthropicModel(): {
|
|
apiKey: string;
|
|
model: Model<"anthropic-messages">;
|
|
} {
|
|
const apiKey = process.env.ANTHROPIC_API_KEY;
|
|
if (!apiKey) {
|
|
throw new Error("missing ANTHROPIC_API_KEY");
|
|
}
|
|
const modelId =
|
|
(process.env.OPENCLAW_LIVE_ANTHROPIC_CACHE_MODEL || "claude-sonnet-4-6")
|
|
.split(/[/:]/)
|
|
.filter(Boolean)
|
|
.pop() || "claude-sonnet-4-6";
|
|
return {
|
|
apiKey,
|
|
model: {
|
|
id: modelId,
|
|
name: modelId,
|
|
api: "anthropic-messages" as const,
|
|
provider: "anthropic",
|
|
baseUrl: "https://api.anthropic.com/v1",
|
|
reasoning: true,
|
|
input: ["text"] as const,
|
|
cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
|
|
contextWindow: 200_000,
|
|
maxTokens: 8_192,
|
|
} satisfies Model<"anthropic-messages">,
|
|
};
|
|
}
|
|
|
|
describeLive("pi embedded anthropic replay sanitization (live)", () => {
|
|
it(
|
|
"preserves toolCall replay history that Anthropic accepts end-to-end",
|
|
async () => {
|
|
const { apiKey, model } = buildLiveAnthropicModel();
|
|
const messages: Message[] = [
|
|
{
|
|
...buildAssistantMessageWithZeroUsage({
|
|
model: { api: model.api, provider: model.provider, id: model.id },
|
|
content: [{ type: "toolCall", id: "call_1", name: "noop", arguments: {} }],
|
|
stopReason: "toolUse",
|
|
}),
|
|
},
|
|
{
|
|
role: "toolResult",
|
|
toolCallId: "call_1",
|
|
toolName: "noop",
|
|
content: [{ type: "text", text: TOOL_OUTPUT_SENTINEL }],
|
|
isError: false,
|
|
timestamp: Date.now(),
|
|
},
|
|
{
|
|
role: "user",
|
|
content:
|
|
"The tool finished. Reply with exactly OK as plain text if this replay history is valid.",
|
|
timestamp: Date.now(),
|
|
},
|
|
];
|
|
|
|
const baseFn = vi.fn((_model: unknown, context: unknown) => ({ context }));
|
|
const wrapped = wrapStreamFnSanitizeMalformedToolCalls(baseFn as never, new Set(["noop"]), {
|
|
validateGeminiTurns: false,
|
|
validateAnthropicTurns: true,
|
|
});
|
|
|
|
await Promise.resolve(wrapped(model as never, { messages } as never, {} as never));
|
|
|
|
expect(baseFn).toHaveBeenCalledTimes(1);
|
|
const seenMessages = (baseFn.mock.calls[0]?.[1] as { messages?: unknown[] })?.messages;
|
|
expect(seenMessages).toEqual(messages);
|
|
|
|
logLiveCache(`anthropic replay live model=${model.provider}/${model.id}`);
|
|
const response = await completeSimpleWithLiveTimeout(
|
|
model,
|
|
{ messages: seenMessages as typeof messages },
|
|
{
|
|
apiKey,
|
|
cacheRetention: "none",
|
|
sessionId: "anthropic-tool-replay-live",
|
|
maxTokens: 64,
|
|
temperature: 0,
|
|
},
|
|
"anthropic replay live synthetic transcript",
|
|
ANTHROPIC_TIMEOUT_MS,
|
|
);
|
|
|
|
const text = extractAssistantText(response);
|
|
logLiveCache(`anthropic replay live result=${JSON.stringify(text)}`);
|
|
expect(response.content.length).toBeGreaterThanOrEqual(0);
|
|
},
|
|
6 * 60_000,
|
|
);
|
|
});
|