Files
openclaw/extensions/inworld/speech-provider.test.ts
2026-05-03 22:52:18 -07:00

215 lines
6.1 KiB
TypeScript

import { afterEach, describe, expect, it, vi } from "vitest";
const { inworldTTSMock, listInworldVoicesMock } = vi.hoisted(() => ({
inworldTTSMock: vi.fn(),
listInworldVoicesMock: vi.fn(),
}));
vi.mock("./tts.js", async (importOriginal) => {
const actual = await importOriginal<typeof import("./tts.js")>();
return {
...actual,
inworldTTS: inworldTTSMock,
listInworldVoices: listInworldVoicesMock,
};
});
import { buildInworldSpeechProvider } from "./speech-provider.js";
describe("buildInworldSpeechProvider", () => {
const originalEnv = process.env.INWORLD_API_KEY;
afterEach(() => {
process.env.INWORLD_API_KEY = originalEnv;
inworldTTSMock.mockReset();
listInworldVoicesMock.mockReset();
vi.restoreAllMocks();
});
it("reports configured when INWORLD_API_KEY env var is set", () => {
process.env.INWORLD_API_KEY = "test-key";
const provider = buildInworldSpeechProvider();
expect(
provider.isConfigured({
providerConfig: {},
timeoutMs: 30_000,
}),
).toBe(true);
});
it("reports configured when providerConfig apiKey is set", () => {
delete process.env.INWORLD_API_KEY;
const provider = buildInworldSpeechProvider();
expect(
provider.isConfigured({
providerConfig: { apiKey: "config-key" },
timeoutMs: 30_000,
}),
).toBe(true);
});
it("reports not configured when no key is available", () => {
delete process.env.INWORLD_API_KEY;
const provider = buildInworldSpeechProvider();
expect(
provider.isConfigured({
providerConfig: {},
timeoutMs: 30_000,
}),
).toBe(false);
});
it("has correct provider metadata", () => {
const provider = buildInworldSpeechProvider();
expect(provider.id).toBe("inworld");
expect(provider.label).toBe("Inworld");
expect(provider.autoSelectOrder).toBe(30);
expect(provider.models).toContain("inworld-tts-1.5-max");
expect(provider.models).toContain("inworld-tts-1.5-mini");
});
it("normalizes provider-owned speech config from raw provider config", () => {
const provider = buildInworldSpeechProvider();
const resolved = provider.resolveConfig?.({
cfg: {} as never,
timeoutMs: 30_000,
rawConfig: {
providers: {
inworld: {
apiKey: "basic-key",
baseUrl: "https://custom.inworld.example.com/",
voiceId: "Ashley",
modelId: "inworld-tts-1.5-mini",
temperature: 0.8,
},
},
},
});
expect(resolved).toEqual({
apiKey: "basic-key",
baseUrl: "https://custom.inworld.example.com",
voiceId: "Ashley",
modelId: "inworld-tts-1.5-mini",
temperature: 0.8,
});
});
it("parses Inworld TTS directive overrides", () => {
const provider = buildInworldSpeechProvider();
const policy = {
enabled: true,
allowText: true,
allowProvider: true,
allowVoice: true,
allowModelId: true,
allowVoiceSettings: true,
allowNormalization: true,
allowSeed: true,
};
expect(provider.parseDirectiveToken?.({ key: "voice", value: "Ashley", policy })).toEqual({
handled: true,
overrides: { voiceId: "Ashley" },
});
expect(
provider.parseDirectiveToken?.({
key: "model",
value: "inworld-tts-1.5-mini",
policy,
}),
).toEqual({
handled: true,
overrides: { modelId: "inworld-tts-1.5-mini" },
});
expect(provider.parseDirectiveToken?.({ key: "temperature", value: "0.7", policy })).toEqual({
handled: true,
overrides: { temperature: 0.7 },
});
});
it("warns on invalid directive temperature", () => {
const provider = buildInworldSpeechProvider();
expect(
provider.parseDirectiveToken?.({
key: "temperature",
value: "3",
policy: {
enabled: true,
allowText: true,
allowProvider: true,
allowVoice: true,
allowModelId: true,
allowVoiceSettings: true,
allowNormalization: true,
allowSeed: true,
},
}),
).toEqual({
handled: true,
warnings: ['invalid Inworld temperature "3"'],
});
});
it("synthesizes voice-note targets with native OGG_OPUS output", async () => {
inworldTTSMock.mockResolvedValueOnce(Buffer.from("opus"));
const provider = buildInworldSpeechProvider();
const result = await provider.synthesize?.({
text: "Hello",
cfg: {} as never,
providerConfig: { apiKey: "key", voiceId: "Sarah", modelId: "inworld-tts-1.5-max" },
providerOverrides: { voice: "Ashley", model: "inworld-tts-1.5-mini", temperature: 0.6 },
target: "voice-note",
timeoutMs: 30_000,
});
expect(inworldTTSMock).toHaveBeenCalledWith({
text: "Hello",
apiKey: "key",
baseUrl: "https://api.inworld.ai",
voiceId: "Ashley",
modelId: "inworld-tts-1.5-mini",
audioEncoding: "OGG_OPUS",
temperature: 0.6,
timeoutMs: 30_000,
});
expect(result).toEqual({
audioBuffer: Buffer.from("opus"),
outputFormat: "ogg_opus",
fileExtension: ".ogg",
voiceCompatible: true,
});
});
it("synthesizes telephony PCM at 22050 Hz", async () => {
inworldTTSMock.mockResolvedValueOnce(Buffer.from("pcm"));
const provider = buildInworldSpeechProvider();
const result = await provider.synthesizeTelephony?.({
text: "Hello",
cfg: {} as never,
providerConfig: { apiKey: "key", voiceId: "Sarah", modelId: "inworld-tts-1.5-max" },
providerOverrides: { voice: "Ashley", model: "inworld-tts-1.5-mini", temperature: 0.6 },
timeoutMs: 30_000,
});
expect(inworldTTSMock).toHaveBeenCalledWith({
text: "Hello",
apiKey: "key",
baseUrl: "https://api.inworld.ai",
voiceId: "Ashley",
modelId: "inworld-tts-1.5-mini",
audioEncoding: "PCM",
sampleRateHertz: 22_050,
temperature: 0.6,
timeoutMs: 30_000,
});
expect(result).toEqual({
audioBuffer: Buffer.from("pcm"),
outputFormat: "pcm",
sampleRate: 22_050,
});
});
});