Files
openclaw/extensions/xai/stt.test.ts
2026-05-09 22:19:39 +01:00

89 lines
2.8 KiB
TypeScript

import { describe, expect, it, vi } from "vitest";
import {
buildXaiMediaUnderstandingProvider,
transcribeXaiAudio,
XAI_DEFAULT_STT_MODEL,
} from "./stt.js";
const { postTranscriptionRequestMock } = vi.hoisted(() => ({
postTranscriptionRequestMock: vi.fn(
async (_params: { headers: Headers; body: BodyInit; url: string; timeoutMs?: number }) => ({
response: new Response(JSON.stringify({ text: "hello from audio" }), { status: 200 }),
release: vi.fn(),
}),
),
}));
function requireFirstPostTranscriptionCall(): {
url?: string;
timeoutMs?: number;
auditContext?: string;
headers: Headers;
body: BodyInit;
} {
const params = (
postTranscriptionRequestMock.mock.calls as unknown as Array<[unknown]>
)[0]?.[0] as
| {
url?: string;
timeoutMs?: number;
auditContext?: string;
headers?: Headers;
body?: BodyInit;
}
| undefined;
if (!params?.headers || !params.body) {
throw new Error("Expected transcription request params");
}
return {
...params,
headers: params.headers,
body: params.body,
};
}
vi.mock("openclaw/plugin-sdk/provider-http", async (importOriginal) => {
const actual = await importOriginal<typeof import("openclaw/plugin-sdk/provider-http")>();
return {
...actual,
postTranscriptionRequest: postTranscriptionRequestMock,
};
});
describe("xai stt", () => {
it("posts audio files to the xAI STT endpoint", async () => {
const result = await transcribeXaiAudio({
buffer: Buffer.from("audio-bytes"),
fileName: "sample.wav",
mime: "audio/wav",
apiKey: "xai-key",
baseUrl: "https://api.x.ai/v1/",
model: XAI_DEFAULT_STT_MODEL,
language: "en",
prompt: "ignored provider hint",
timeoutMs: 10_000,
});
expect(result).toEqual({ text: "hello from audio", model: XAI_DEFAULT_STT_MODEL });
const call = requireFirstPostTranscriptionCall();
expect(call.url).toBe("https://api.x.ai/v1/stt");
expect(call.timeoutMs).toBe(10_000);
expect(call.auditContext).toBe("xai stt");
expect(call.headers.get("authorization")).toBe("Bearer xai-key");
expect(call.body).toBeInstanceOf(FormData);
const form = call.body as FormData;
expect(form.get("model")).toBe(XAI_DEFAULT_STT_MODEL);
expect(form.get("language")).toBe("en");
expect(form.get("prompt")).toBeNull();
expect(form.get("file")).toBeInstanceOf(Blob);
});
it("registers as an audio media-understanding provider", () => {
const provider = buildXaiMediaUnderstandingProvider();
expect(provider.id).toBe("xai");
expect(provider.capabilities).toEqual(["audio"]);
expect(provider.defaultModels).toEqual({ audio: XAI_DEFAULT_STT_MODEL });
expect(provider.autoPriority).toEqual({ audio: 25 });
});
});