Files
openclaw/src/plugins/document-extractor-public-artifacts.ts
Peter Steinberger 77d9ac30bb refactor: reuse shared coercion helpers (#86419)
* refactor: share talk event metric extraction

* refactor: reuse shared coercion helpers

* refactor: reuse shared primitive guards

* refactor: reuse shared record guard

* refactor: reuse shared primitive helpers

* refactor: reuse shared string guards

* refactor: reuse shared non-empty string guard

* refactor: share plugin primitive coercion helpers

* refactor: reuse plugin coercion helpers

* refactor: reuse plugin coercion helpers in more plugins

* refactor: reuse channel coercion helpers

* refactor: reuse monitor coercion helpers

* refactor: reuse provider coercion helpers

* refactor: reuse core coercion helpers

* refactor: reuse runtime coercion helpers

* refactor: reuse helper coercion in codex paths

* refactor: reuse helper coercion in runtime paths

* refactor: reuse codex app-server coercion helpers

* refactor: reuse codex record helpers

* refactor: reuse migration and qa record helpers

* refactor: reuse feishu and core helper guards

* refactor: reuse browser and policy coercion helpers

* refactor: reuse memory wiki record helper

* refactor: share boolean coercion helpers

* refactor: reuse finite number coercion

* refactor: reuse trimmed string list helpers

* refactor: reuse string list normalization

* refactor: reuse remaining string list helpers

* refactor: reuse string entry normalizer

* refactor: share sorted string helpers

* refactor: share string list normalization

* test: preserve command registry browser imports

* refactor: reuse trimmed list helpers

* refactor: reuse string dedupe helpers

* refactor: reuse local dedupe helpers

* refactor: reuse more string dedupe helpers

* refactor: reuse command string dedupe helpers

* refactor: dedupe memory path lists with helper

* refactor: expose string dedupe helpers to plugins

* refactor: reuse core string dedupe helpers

* refactor: reuse shared unique value helpers

* refactor: reuse unique helpers in agent utilities

* refactor: reuse unique helpers in config plumbing

* refactor: reuse unique helpers in extensions

* refactor: reuse unique helpers in core utilities

* refactor: reuse unique helpers in qa plugins

* refactor: reuse unique helpers in memory plugins

* refactor: reuse unique helpers in channel plugins

* refactor: reuse unique helpers in core tails

* refactor: reuse unique helper in comfy workflow

* refactor: reuse unique helpers in test utilities

* refactor: expose unique value helper to plugins

* refactor: reuse unique helpers for numeric lists

* refactor: replace index dedupe filters

* refactor: reuse string entry normalization

* refactor: reuse string normalization in plugin helpers

* refactor: reuse string normalization in extension helpers

* refactor: reuse string normalization in channel parsers

* refactor: reuse string normalization in memory search

* refactor: reuse string normalization in provider parsers

* refactor: reuse string normalization in qa helpers

* refactor: reuse string normalization in infra parsers

* refactor: reuse string normalization in messaging parsers

* refactor: reuse string normalization in core parsers

* refactor: reuse string normalization in extension parsers

* refactor: reuse string normalization in remaining parsers

* refactor: reuse string normalization in final parser spots

* refactor: reuse string normalization in qa media helpers

* refactor: reuse normalization in provider and media lists

* refactor: reuse normalization for remaining set filters

* refactor: reuse normalization in policy allowlists

* refactor: reuse normalization in session and owner lists

* refactor: centralize primitive string lists

* refactor: reuse lowercase entry helpers

* refactor: reuse sorted string helpers

* refactor: reuse unique trimmed helpers

* refactor: reuse string normalization helpers

* refactor: reuse catalog string helpers

* refactor: reuse remaining string helpers

* refactor: simplify remaining list normalization

* refactor: reuse codex auth order normalization

* chore: refresh plugin sdk api baseline

* fix: make shared string sorting deterministic

* chore: refresh plugin sdk api baseline

* fix: align host env security ordering
2026-05-25 21:20:41 +01:00

97 lines
2.9 KiB
TypeScript

import { isRecord } from "../shared/record-coerce.js";
import type {
DocumentExtractorPlugin,
PluginDocumentExtractorEntry,
} from "./document-extractor-types.js";
import { loadBundledPluginPublicArtifactModuleSync } from "./public-surface-loader.js";
/**
 * Artifact basenames probed, in this order, by
 * `tryLoadBundledPublicArtifactModule` when looking for a bundled plugin's
 * document extractor module. The first basename that loads is used.
 */
const DOCUMENT_EXTRACTOR_ARTIFACT_CANDIDATES = [
"document-extractor.js",
"document-extractor-api.js",
] as const;
/**
 * Runtime type guard for values produced by document extractor factories.
 *
 * A value is accepted when it passes `isRecord` and has:
 * - string `id` and `label`,
 * - a `mimeTypes` array in which every entry is a string that is non-empty
 *   after trimming (an empty array is accepted),
 * - an `autoDetectOrder` that is either `undefined` or a number,
 * - an `extract` function.
 *
 * @param value - Candidate value of unknown shape.
 * @returns `true` when every check above passes, otherwise `false`.
 */
function isDocumentExtractorPlugin(value: unknown): value is DocumentExtractorPlugin {
  if (!isRecord(value)) {
    return false;
  }
  if (typeof value.id !== "string" || typeof value.label !== "string") {
    return false;
  }
  if (!Array.isArray(value.mimeTypes)) {
    return false;
  }
  // Whitespace-only entries are rejected along with non-string ones.
  const hasOnlyUsableMimeTypes = value.mimeTypes.every(
    (entry) => typeof entry === "string" && entry.trim().length > 0,
  );
  if (!hasOnlyUsableMimeTypes) {
    return false;
  }
  if (value.autoDetectOrder !== undefined && typeof value.autoDetectOrder !== "number") {
    return false;
  }
  return typeof value.extract === "function";
}
/**
 * Loads the first document extractor artifact that can be resolved for a
 * bundled plugin directory.
 *
 * Each basename in `DOCUMENT_EXTRACTOR_ARTIFACT_CANDIDATES` is tried in order.
 * An `Error` whose message starts with
 * "Unable to resolve bundled plugin public surface " moves on to the next
 * candidate; anything else thrown by the loader is rethrown unchanged.
 *
 * @param params - `dirName` is forwarded to the public artifact loader.
 * @returns The loaded module, or `null` when no candidate could be resolved.
 */
function tryLoadBundledPublicArtifactModule(params: {
  dirName: string;
}): Record<string, unknown> | null {
  for (const candidateBasename of DOCUMENT_EXTRACTOR_ARTIFACT_CANDIDATES) {
    try {
      return loadBundledPluginPublicArtifactModuleSync<Record<string, unknown>>({
        dirName: params.dirName,
        artifactBasename: candidateBasename,
      });
    } catch (error) {
      const isUnresolvedSurface =
        error instanceof Error &&
        error.message.startsWith("Unable to resolve bundled plugin public surface ");
      if (!isUnresolvedSurface) {
        throw error;
      }
      // Unresolved candidate: fall through to the next basename.
    }
  }
  return null;
}
/**
 * Invokes the document extractor factories exported by a module and gathers
 * their results.
 *
 * An export counts as a factory when it is a function declaring zero
 * parameters whose name starts with "create" and ends with
 * "DocumentExtractor". Exports are visited in `localeCompare` order of their
 * names. A factory that throws contributes its thrown value to `errors`; a
 * factory whose return value fails `isDocumentExtractorPlugin` is ignored.
 *
 * @param mod - Module namespace (or any record of exports) to scan.
 * @returns The valid extractors and the values thrown by failing factories.
 */
function collectExtractorFactories(mod: Record<string, unknown>): {
  extractors: DocumentExtractorPlugin[];
  errors: unknown[];
} {
  const extractors: DocumentExtractorPlugin[] = [];
  const errors: unknown[] = [];
  const exportsByName = Object.entries(mod).toSorted((a, b) => a[0].localeCompare(b[0]));

  for (const [exportName, exportedValue] of exportsByName) {
    if (
      !(
        typeof exportedValue === "function" &&
        exportedValue.length === 0 &&
        exportName.startsWith("create") &&
        exportName.endsWith("DocumentExtractor")
      )
    ) {
      continue;
    }

    let produced: unknown;
    try {
      produced = exportedValue();
    } catch (factoryError) {
      errors.push(factoryError);
      continue;
    }

    // Validation stays outside the try so only factory failures are recorded.
    if (isDocumentExtractorPlugin(produced)) {
      extractors.push(produced);
    }
  }

  return { extractors, errors };
}
/**
 * Loads the document extractors exposed by a bundled plugin directory and
 * tags each one with the owning plugin id.
 *
 * @param params - `dirName` selects the bundled plugin directory to load
 *   from; `pluginId` is copied onto every returned entry and used in the
 *   error message.
 * @returns One entry per valid extractor, or `null` when no artifact module
 *   could be loaded or when the module yields no extractors and no factory
 *   threw.
 * @throws Error when no extractor was produced and at least one factory
 *   threw. The `cause` is the single thrown value, or an `AggregateError`
 *   wrapping all of them when there were several.
 */
export function loadBundledDocumentExtractorEntriesFromDir(params: {
  dirName: string;
  pluginId: string;
}): PluginDocumentExtractorEntry[] | null {
  const artifactModule = tryLoadBundledPublicArtifactModule({ dirName: params.dirName });
  if (!artifactModule) {
    return null;
  }

  const collected = collectExtractorFactories(artifactModule);
  if (collected.extractors.length > 0) {
    // Copy each extractor into a fresh object so the originals are not mutated.
    return collected.extractors.map((extractor) =>
      Object.assign({}, extractor, { pluginId: params.pluginId }),
    );
  }

  if (collected.errors.length === 0) {
    return null;
  }

  const message = `Unable to initialize document extractors for plugin ${params.pluginId}`;
  const cause =
    collected.errors.length === 1 ? collected.errors[0] : new AggregateError(collected.errors);
  throw new Error(message, { cause });
}