mirror of
https://github.com/openclaw/openclaw.git
synced 2026-05-28 23:06:48 +00:00
* refactor: share talk event metric extraction * refactor: reuse shared coercion helpers * refactor: reuse shared primitive guards * refactor: reuse shared record guard * refactor: reuse shared primitive helpers * refactor: reuse shared string guards * refactor: reuse shared non-empty string guard * refactor: share plugin primitive coercion helpers * refactor: reuse plugin coercion helpers * refactor: reuse plugin coercion helpers in more plugins * refactor: reuse channel coercion helpers * refactor: reuse monitor coercion helpers * refactor: reuse provider coercion helpers * refactor: reuse core coercion helpers * refactor: reuse runtime coercion helpers * refactor: reuse helper coercion in codex paths * refactor: reuse helper coercion in runtime paths * refactor: reuse codex app-server coercion helpers * refactor: reuse codex record helpers * refactor: reuse migration and qa record helpers * refactor: reuse feishu and core helper guards * refactor: reuse browser and policy coercion helpers * refactor: reuse memory wiki record helper * refactor: share boolean coercion helpers * refactor: reuse finite number coercion * refactor: reuse trimmed string list helpers * refactor: reuse string list normalization * refactor: reuse remaining string list helpers * refactor: reuse string entry normalizer * refactor: share sorted string helpers * refactor: share string list normalization * test: preserve command registry browser imports * refactor: reuse trimmed list helpers * refactor: reuse string dedupe helpers * refactor: reuse local dedupe helpers * refactor: reuse more string dedupe helpers * refactor: reuse command string dedupe helpers * refactor: dedupe memory path lists with helper * refactor: expose string dedupe helpers to plugins * refactor: reuse core string dedupe helpers * refactor: reuse shared unique value helpers * refactor: reuse unique helpers in agent utilities * refactor: reuse unique helpers in config plumbing * refactor: reuse unique helpers in 
extensions * refactor: reuse unique helpers in core utilities * refactor: reuse unique helpers in qa plugins * refactor: reuse unique helpers in memory plugins * refactor: reuse unique helpers in channel plugins * refactor: reuse unique helpers in core tails * refactor: reuse unique helper in comfy workflow * refactor: reuse unique helpers in test utilities * refactor: expose unique value helper to plugins * refactor: reuse unique helpers for numeric lists * refactor: replace index dedupe filters * refactor: reuse string entry normalization * refactor: reuse string normalization in plugin helpers * refactor: reuse string normalization in extension helpers * refactor: reuse string normalization in channel parsers * refactor: reuse string normalization in memory search * refactor: reuse string normalization in provider parsers * refactor: reuse string normalization in qa helpers * refactor: reuse string normalization in infra parsers * refactor: reuse string normalization in messaging parsers * refactor: reuse string normalization in core parsers * refactor: reuse string normalization in extension parsers * refactor: reuse string normalization in remaining parsers * refactor: reuse string normalization in final parser spots * refactor: reuse string normalization in qa media helpers * refactor: reuse normalization in provider and media lists * refactor: reuse normalization for remaining set filters * refactor: reuse normalization in policy allowlists * refactor: reuse normalization in session and owner lists * refactor: centralize primitive string lists * refactor: reuse lowercase entry helpers * refactor: reuse sorted string helpers * refactor: reuse unique trimmed helpers * refactor: reuse string normalization helpers * refactor: reuse catalog string helpers * refactor: reuse remaining string helpers * refactor: simplify remaining list normalization * refactor: reuse codex auth order normalization * chore: refresh plugin sdk api baseline * fix: make shared string 
sorting deterministic * chore: refresh plugin sdk api baseline * fix: align host env security ordering
105 lines
3.2 KiB
TypeScript
105 lines
3.2 KiB
TypeScript
import type {
|
|
AudioTranscriptionRequest,
|
|
AudioTranscriptionResult,
|
|
} from "openclaw/plugin-sdk/media-understanding";
|
|
import {
|
|
assertOkOrThrowHttpError,
|
|
postTranscriptionRequest,
|
|
readProviderJsonObjectResponse,
|
|
resolveProviderHttpRequestConfig,
|
|
requireTranscriptionText,
|
|
} from "openclaw/plugin-sdk/provider-http";
|
|
import { asOptionalRecord as asRecord } from "openclaw/plugin-sdk/string-coerce-runtime";
|
|
|
|
/** Base URL handed to `resolveProviderHttpRequestConfig` as `defaultBaseUrl` for Deepgram audio requests. */
export const DEFAULT_DEEPGRAM_AUDIO_BASE_URL = "https://api.deepgram.com/v1";
|
|
/** Model name used when a transcription request supplies no model, or only a blank one. */
export const DEFAULT_DEEPGRAM_AUDIO_MODEL = "nova-3";
|
|
|
|
/**
 * Picks the Deepgram model name to send with a transcription request.
 *
 * @param model - Caller-supplied model name; surrounding whitespace is ignored.
 * @returns The trimmed model name, or `DEFAULT_DEEPGRAM_AUDIO_MODEL` when the
 *   argument is missing, empty, or whitespace-only.
 */
function resolveModel(model?: string): string {
  const trimmed = model?.trim();
  // `||` rather than `??` on purpose: an empty string must also fall back to the default.
  return trimmed || DEFAULT_DEEPGRAM_AUDIO_MODEL;
}
|
|
|
|
/**
 * Reads `results.channels[0].alternatives[0].transcript` out of a parsed
 * Deepgram response payload.
 *
 * @param payload - JSON object returned by the transcription endpoint.
 * @returns The transcript string, or `undefined` when `asRecord` yields nothing
 *   for `results`, the first channel, or the first alternative, or when the
 *   alternative has no `transcript` property.
 * @throws Error with message "Audio transcription failed: malformed JSON response"
 *   when `results.channels` or the channel's `alternatives` is not an array
 *   (including when it is missing), or when `transcript` is defined but is not
 *   a string.
 */
function readDeepgramTranscript(payload: Record<string, unknown>): string | undefined {
  const malformedMessage = "Audio transcription failed: malformed JSON response";

  const results = asRecord(payload.results);
  if (!results) {
    return undefined;
  }

  const channels = results.channels;
  if (!Array.isArray(channels)) {
    throw new Error(malformedMessage);
  }

  // Only the first channel is consulted; an empty array falls through to `undefined`.
  const firstChannel = asRecord(channels[0]);
  if (!firstChannel) {
    return undefined;
  }

  const alternatives = firstChannel.alternatives;
  if (!Array.isArray(alternatives)) {
    throw new Error(malformedMessage);
  }

  // Likewise, only the first alternative is consulted.
  const firstAlternative = asRecord(alternatives[0]);
  if (!firstAlternative) {
    return undefined;
  }

  const transcript = firstAlternative.transcript;
  if (transcript === undefined || typeof transcript === "string") {
    return transcript;
  }
  throw new Error(malformedMessage);
}
|
|
|
|
/**
 * Transcribes an audio buffer by POSTing it to the Deepgram `/listen` endpoint.
 *
 * The request URL is `<baseUrl>/listen` with a `model` query parameter, an
 * optional `language` parameter (sent only when non-blank after trimming), and
 * any defined entries of `params.query` stringified on top. Because
 * `params.query` is applied last with `searchParams.set`, it replaces `model`
 * or `language` if it uses the same key.
 *
 * @param params - Transcription request. Fields read here: `fetchFn`, `model`,
 *   `baseUrl`, `headers`, `request`, `apiKey`, `mime`, `language`, `query`,
 *   `buffer`, and `timeoutMs`.
 * @returns The transcript text together with the model name that was sent.
 * @throws Propagates whatever the HTTP/JSON helpers and `readDeepgramTranscript`
 *   throw. NOTE(review): presumably this covers non-OK responses, non-object
 *   JSON bodies, and a missing transcript — confirm against the
 *   `provider-http` helpers.
 */
export async function transcribeDeepgramAudio(
  params: AudioTranscriptionRequest,
): Promise<AudioTranscriptionResult> {
  const fetchFn = params.fetchFn ?? fetch;
  const model = resolveModel(params.model);
  const { baseUrl, allowPrivateNetwork, headers, dispatcherPolicy } =
    resolveProviderHttpRequestConfig({
      baseUrl: params.baseUrl,
      defaultBaseUrl: DEFAULT_DEEPGRAM_AUDIO_BASE_URL,
      headers: params.headers,
      request: params.request,
      defaultHeaders: {
        authorization: `Token ${params.apiKey}`,
        // Raw audio bytes are sent as the body, so fall back to a generic binary type.
        "content-type": params.mime ?? "application/octet-stream",
      },
      provider: "deepgram",
      capability: "audio",
      transport: "media-understanding",
    });

  const url = new URL(`${baseUrl}/listen`);
  url.searchParams.set("model", model);

  // Trim once and reuse; blank or whitespace-only languages are not sent.
  const language = params.language?.trim();
  if (language) {
    url.searchParams.set("language", language);
  }

  if (params.query) {
    for (const [key, value] of Object.entries(params.query)) {
      if (value === undefined) {
        continue;
      }
      url.searchParams.set(key, String(value));
    }
  }

  const body = new Uint8Array(params.buffer);
  const { response: res, release } = await postTranscriptionRequest({
    url: url.toString(),
    headers,
    body,
    timeoutMs: params.timeoutMs,
    fetchFn,
    allowPrivateNetwork,
    dispatcherPolicy,
  });

  try {
    await assertOkOrThrowHttpError(res, "Audio transcription failed");

    const payload = await readProviderJsonObjectResponse(res, "Audio transcription failed");
    const transcript = requireTranscriptionText(
      readDeepgramTranscript(payload),
      "Audio transcription response missing transcript",
    );
    return { text: transcript, model };
  } finally {
    // Always run the release callback, on success and on any thrown error.
    await release();
  }
}
|