Files
openclaw/extensions/xai/code-execution.test.ts
2026-05-16 18:00:31 +08:00

263 lines
7.7 KiB
TypeScript

import { withFetchPreconnect } from "openclaw/plugin-sdk/test-env";
import { afterEach, describe, expect, it, vi } from "vitest";
import { createCodeExecutionTool } from "./code-execution.js";
function installCodeExecutionFetch(payload?: Record<string, unknown>) {
const mockFetch = vi.fn((_input?: unknown, _init?: unknown) =>
Promise.resolve({
ok: true,
json: () =>
Promise.resolve(
payload ?? {
output: [
{ type: "code_interpreter_call" },
{
type: "message",
content: [
{
type: "output_text",
text: "Mean: 42",
annotations: [{ type: "url_citation", url: "https://example.com/data.csv" }],
},
],
},
],
citations: ["https://example.com/data.csv"],
},
),
} as Response),
);
global.fetch = withFetchPreconnect(mockFetch);
return mockFetch;
}
function firstFetchCall(mockFetch: ReturnType<typeof installCodeExecutionFetch>) {
const [call] = mockFetch.mock.calls;
if (!call) {
throw new Error("expected code_execution fetch call");
}
return call;
}
function firstFetchUrl(mockFetch: ReturnType<typeof installCodeExecutionFetch>) {
const [url] = firstFetchCall(mockFetch);
return String(url);
}
function firstFetchInit(mockFetch: ReturnType<typeof installCodeExecutionFetch>): RequestInit {
const [, init] = firstFetchCall(mockFetch);
if (!init || typeof init !== "object" || Array.isArray(init)) {
throw new Error("expected code_execution fetch init");
}
return init as RequestInit;
}
function firstAuthorizationHeader(mockFetch: ReturnType<typeof installCodeExecutionFetch>) {
const headers = firstFetchInit(mockFetch).headers;
if (!headers || typeof headers !== "object" || Array.isArray(headers)) {
throw new Error("expected code_execution request headers");
}
return (headers as Record<string, string>).Authorization;
}
function parseFirstRequestBody(mockFetch: ReturnType<typeof installCodeExecutionFetch>) {
const requestBody = firstFetchInit(mockFetch).body;
return JSON.parse(typeof requestBody === "string" ? requestBody : "{}") as Record<
string,
unknown
>;
}
afterEach(() => {
vi.restoreAllMocks();
});
describe("xai code_execution tool", () => {
it("enables code_execution when the xAI plugin web search key is configured", () => {
const tool = createCodeExecutionTool({
config: {
plugins: {
entries: {
xai: {
config: {
webSearch: {
apiKey: "xai-plugin-key", // pragma: allowlist secret
},
},
},
},
},
},
});
expect(tool?.name).toBe("code_execution");
});
it("enables code_execution from an xAI auth profile and uses it for requests", async () => {
const mockFetch = installCodeExecutionFetch();
const tool = createCodeExecutionTool({
config: {},
auth: {
hasAuthForProvider: (providerId) => providerId === "xai",
resolveApiKeyForProvider: async (providerId) =>
providerId === "xai" ? "xai-profile-key" : undefined, // pragma: allowlist secret
},
});
expect(tool?.name).toBe("code_execution");
await tool?.execute?.("code-execution:auth-profile", {
task: "Sum [20, 22]",
});
expect(firstAuthorizationHeader(mockFetch)).toBe("Bearer xai-profile-key");
});
it("uses the xAI Responses code_interpreter tool", async () => {
const mockFetch = installCodeExecutionFetch();
const tool = createCodeExecutionTool({
config: {
plugins: {
entries: {
xai: {
config: {
webSearch: {
apiKey: "xai-config-test", // pragma: allowlist secret
},
codeExecution: {
model: "grok-4-1-fast",
maxTurns: 2,
timeoutSeconds: 45,
},
},
},
},
},
},
});
const result = await tool?.execute?.("code-execution:1", {
task: "Calculate the mean of [40, 42, 44]",
});
expect(mockFetch).toHaveBeenCalled();
expect(firstFetchUrl(mockFetch)).toContain("api.x.ai/v1/responses");
const body = parseFirstRequestBody(mockFetch);
expect(body.model).toBe("grok-4-1-fast");
expect(body.max_turns).toBe(2);
expect(body.tools).toEqual([{ type: "code_interpreter" }]);
expect(
(result?.details as { usedCodeExecution?: boolean } | undefined)?.usedCodeExecution,
).toBe(true);
});
it("reuses the xAI plugin web search key for code_execution requests", async () => {
const mockFetch = installCodeExecutionFetch();
const tool = createCodeExecutionTool({
config: {
plugins: {
entries: {
xai: {
config: {
webSearch: {
apiKey: "xai-plugin-key", // pragma: allowlist secret
},
},
},
},
},
},
});
await tool?.execute?.("code-execution:plugin-key", {
task: "Compute the standard deviation of [1, 2, 3]",
});
expect(firstAuthorizationHeader(mockFetch)).toBe("Bearer xai-plugin-key");
});
it("reports malformed code_execution JSON as a provider error", async () => {
const mockFetch = vi.fn((_input?: unknown, _init?: unknown) =>
Promise.resolve({
ok: true,
json: () => Promise.reject(new SyntaxError("Unexpected token")),
} as Response),
);
global.fetch = withFetchPreconnect(mockFetch);
const tool = createCodeExecutionTool({
config: {
plugins: {
entries: {
xai: {
config: {
webSearch: {
apiKey: "xai-plugin-key", // pragma: allowlist secret
},
},
},
},
},
},
});
await expect(
tool?.execute?.("code-execution:malformed-json", {
task: "Calculate the mean of [40, 42, 44]",
}),
).rejects.toThrow("xAI code execution failed: malformed JSON response");
});
it("rejects code_execution success JSON without answer text", async () => {
const mockFetch = vi.fn((_input?: unknown, _init?: unknown) =>
Promise.resolve({
ok: true,
json: () => Promise.resolve({ output: [{ type: "code_interpreter_call" }] }),
} as Response),
);
global.fetch = withFetchPreconnect(mockFetch);
const tool = createCodeExecutionTool({
config: {
plugins: {
entries: {
xai: {
config: {
webSearch: {
apiKey: "xai-plugin-key", // pragma: allowlist secret
},
},
},
},
},
},
});
await expect(
tool?.execute?.("code-execution:missing-text", {
task: "Calculate the mean of [40, 42, 44]",
}),
).rejects.toThrow("xAI code execution failed: malformed JSON response");
});
it("reuses the legacy grok web search key for code_execution requests", async () => {
const mockFetch = installCodeExecutionFetch();
const tool = createCodeExecutionTool({
config: {
tools: {
web: {
search: {
grok: {
apiKey: "xai-legacy-key", // pragma: allowlist secret
},
},
},
},
},
});
await tool?.execute?.("code-execution:legacy-key", {
task: "Count rows in a two-column table",
});
expect(firstAuthorizationHeader(mockFetch)).toBe("Bearer xai-legacy-key");
});
});