Files
openclaw/src/agents/model-catalog.test.ts
Peter Steinberger bb46b79d3c refactor: internalize OpenClaw agent runtime (#85341)
* refactor: extract agent core package

Introduce packages/agent-core as the OpenClaw-owned home for reusable agent loop, harness, session, prompt, and runtime dependency contracts.

* refactor: extract shared llm runtime

Move provider model registries, stream wrappers, OAuth helpers, and LLM utilities into src/llm with plugin-sdk barrels instead of depending on the old embedded runtime layout.

* refactor: remove pi runtime internals

Rename remaining Pi-shaped agent surfaces to OpenClaw agent runtime names, delete obsolete Pi docs and package graph checks, and add the third-party notice for incorporated code.

* refactor: tighten agent session runtime

Make agent-core/runtime dependencies explicit, consolidate compaction and session transcript helpers, and move model/session helpers behind OpenClaw-owned contracts.

* refactor: remove static model and pi auth paths

Drop static model catalogs and Pi auth bridges, move model/provider facts to manifest-owned runtime contracts, and harden internal embedded-agent utilities.

* refactor: remove legacy provider compat paths

* docs: remove agent parity notes

* fix: skip provider wildcard metadata parsing

* refactor: share session extension sdk loading

* refactor: inline acpx proxy error formatter

* refactor: fold edit recovery into edit tool

* fix: accept extension batch separator

* test: align startup provider plugin expectations

* fix: restore provider-scoped release discovery

* test: align static asset packaging expectations

* fix: run static provider catalogs during scoped discovery

* fix: add provider entry catalogs for scoped live discovery

* fix: load lightweight provider catalog entries

* fix: refresh provider-scoped plugin metadata

* fix: keep provider catalog entries on release live path

* fix: keep static manifest models in release live checks

* fix: harden release model discovery

* fix: reduce OpenAI live cache probe reasoning

* fix: disable OpenAI cache probe reasoning

* ci: extend OpenAI gateway live timeout

* fix: extend live gateway model budget

* fix: stabilize release validation regressions

* fix: honor provider aliases in model rows

* fix: stabilize release validation lanes

* fix: stabilize release memory qa

* ci: stabilize release validation lanes

* ci: prefer ipv4 for live docker node calls

* fix: restore shared tool-call stream wrapper

* ci: remove legacy pi test shard alias

* fix: clean up embedded agent test drift

* fix: stabilize runtime alias status

* fix: clean up embedded agent ci drift

* fix: restore release ci invariants

* fix: clean up post-rebase runtime drift

* fix: restore release ci checks

* fix: restore release ci after rebase

* fix: remove stale pi runtime path

* test: align compaction runtime expectations

* test: update plugin prerelease expectations

* fix: handle claude live tool approvals

* fix: stabilize release validation gates

* fix: finish agent runtime import

* test: finish post-rebase agent runtime mocks

* fix: keep codex compaction native

* fix: stabilize codex app-server hook tests

* test: isolate codex diagnostic active run

* test: remove codex diagnostic completion race

# Conflicts:
#	extensions/codex/src/app-server/run-attempt.test.ts

* ci: fix full release manifest performance run id

* refactor: narrow llm plugin sdk boundary

* chore: drop generated google boundary stamps

* fix: repair rebase fallout

* fix: clean up rebased runtime references

* fix: decode codex jwt payloads as base64url

* fix: preserve shipped pi runtime alias

* fix: add scoped sdk virtual modules

* fix: decode llm codex oauth jwt as base64url

* fix: avoid stale vertex adc negative cache

* fix: harden tool arg decoding and codeql path

* fix: keep vertex adc negative checks live

* refactor: consolidate codex jwt and edit helpers

* fix: await codex oauth node runtime imports

* fix: preserve sdk tool and notice contracts

* fix: preserve shipped compat config boundaries

* fix: align codex oauth callback host

* fix: terminate agent-core loop streams on failure

* fix: keep codex oauth callback alive during fallback

* ci: include session tools in critical codeql scans

* fix: keep Cloudflare Anthropic provider auth header

* docs: redirect legacy pi runtime pages

* fix: honor bundled web provider compat discovery

* fix: protect session output spill files

* fix: keep legacy agent dir env blocked

* fix: contain auto-discovered skill symlinks

* fix: harden agent core sdk proxy surfaces

* fix: restore approval reaction sdk compat

* fix: keep live docker runs bounded

* fix: keep codex oauth redirect host aligned

* fix: resolve post-rebase agent runtime drift

* fix: redact anthropic oauth parse failures

* fix: preserve responses strict tool shaping

* fix: repair agent runtime rebase cleanup

* docs: redirect retired parity pages

* fix: bound auto-discovered resources to roots

* fix: repair post-rebase agent test drift

* fix: preserve bundled provider allowlist migration

* fix: preserve manifest-owned provider aliases

* fix: declare photon image dependency

* fix: keep provider headers out of proxy body

* fix: preserve shipped env aliases

* fix: refresh control ui i18n generated state

* fix: quote read fallback paths

* fix: preview edits through configured backend

* test: satisfy core test typecheck

* fix: preserve ZAI usage auth fallback

* test: repair codex diagnostic test

* fix: repair agent runtime rebase drift

* test: finish embedded runner import rename

* fix: repair agent runtime rebase integrations

* test: align compaction oauth fallback expectations

* fix: allow sdk-auth session models

* fix: update doctor tool schema import

* fix: preserve bedrock plugin region

* fix: stream harmony-like prose immediately

* ci: include session runtime in codeql shards

* fix: repair latest rebase integrations

* fix: honor explicit codex websocket transport

* fix: keep openai-compatible credentials provider-scoped

* fix: refresh sdk api baseline after rebase

* fix: route cli runtime aliases through openclaw harness

* test: rename stale harness mock expectation

* test: rename embedded agent overflow calls

* test: clean embedded auth test wording

* test: use openclaw stream types in deepinfra cache test

* fix: refresh sdk api baseline on latest main

* fix: honor bundled discovery compat allowlists

* fix: refresh sdk api baseline after latest rebase

* fix: remove stale rebase imports

* test: rename stale model catalog mock

* test: mock renamed doctor runtime modules

* fix: map canonical kimi env auth

* fix: use internal model registry in bench script

* fix: migrate deepinfra provider catalog entry

* fix: enforce builtin tool suppression

* fix: route compaction auth and proxy payloads safely

* refactor: prune unused llm registry leftovers

* test: update codex hooks session import

* test: fix model picker ci coverage

* test: align model picker auth mock types
2026-05-27 19:24:04 +01:00

1372 lines
42 KiB
TypeScript

import { afterAll, afterEach, beforeAll, beforeEach, describe, expect, it, vi } from "vitest";
import type { OpenClawConfig } from "../config/config.js";
import { resetLogger, setLoggerOverride } from "../logging/logger.js";
// Shape of the agent model discovery module; the discovery test doubles below are cast to it.
type AgentModelDiscoveryModule = typeof import("./agent-model-discovery.js");
// Exports of ./model-catalog.js. They are assigned in `beforeAll` through a dynamic import that
// runs after the `vi.doMock` registrations, which is why they are declared with `let` here.
let setModelCatalogImportForTest: typeof import("./model-catalog.js").setModelCatalogImportForTest;
let findModelCatalogEntry: typeof import("./model-catalog.js").findModelCatalogEntry;
let findModelInCatalog: typeof import("./model-catalog.js").findModelInCatalog;
let loadManifestModelCatalog: typeof import("./model-catalog.js").loadManifestModelCatalog;
let loadModelCatalog: typeof import("./model-catalog.js").loadModelCatalog;
let modelSupportsInput: typeof import("./model-catalog.js").modelSupportsInput;
let resetModelCatalogCacheForTest: typeof import("./model-catalog.js").resetModelCatalogCacheForTest;
// Mock handles shared by the tests; they are created in `beforeAll` and cleared or reset in
// `beforeEach`.
let augmentCatalogMock: ReturnType<typeof vi.fn>;
let ensureOpenClawModelsJsonMock: ReturnType<typeof vi.fn>;
let currentPluginMetadataSnapshotMock: ReturnType<typeof vi.fn<(...args: unknown[]) => unknown>>;
let loadPluginMetadataSnapshotMock: ReturnType<typeof vi.fn<(...args: unknown[]) => unknown>>;
let readFileMock: ReturnType<typeof vi.fn>;
// Swap the model-suppression runtime for the local `isSuppressedModel` predicate so both exported
// entry points answer from the same in-file rule.
vi.mock("./model-suppression.runtime.js", () => {
  const suppress = (params: { provider?: string; id?: string }) =>
    isSuppressedModel(params.provider, params.id);
  return {
    shouldSuppressBuiltInModel: suppress,
    // The builder hands out a fresh predicate on every call.
    buildShouldSuppressBuiltInModel: () => (params: { provider?: string; id?: string }) =>
      suppress(params),
  };
});
/**
 * Test stand-in for the built-in model suppression rule.
 *
 * @param provider Provider id; compared exactly (no trimming or case folding).
 * @param id Model id; trimmed and lower-cased before comparison.
 * @returns `true` only for `gpt-5.3-codex-spark` under the `openai`,
 *   `azure-openai-responses`, or `openai-codex` providers.
 */
function isSuppressedModel(provider?: string, id?: string): boolean {
  const normalizedId = (id ?? "").trim().toLowerCase();
  if (normalizedId !== "gpt-5.3-codex-spark") {
    return false;
  }
  switch (provider) {
    case "openai":
    case "azure-openai-responses":
    case "openai-codex":
      return true;
    default:
      return false;
  }
}
/**
 * Installs a discovery-module importer that throws `Error("boom")` on its first invocation and
 * resolves to a stub module exposing a single OpenAI model on every later invocation.
 *
 * @returns An accessor reporting how many times the importer has been invoked so far.
 */
function mockCatalogImportFailThenRecover() {
  let importAttempts = 0;
  const listModels = () => [{ id: "gpt-4.1", name: "GPT-4.1", provider: "openai" }];
  setModelCatalogImportForTest(async () => {
    importAttempts += 1;
    if (importAttempts === 1) {
      throw new Error("boom");
    }
    const recoveredModule = {
      discoverAuthStorage: () => ({}),
      AuthStorage: function AuthStorage() {},
      discoverModels: () => ({ getAll: listModels }),
      ModelRegistry: class {
        getAll() {
          return listModels();
        }
      },
    };
    return recoveredModule as unknown as AgentModelDiscoveryModule;
  });
  return () => importAttempts;
}
/**
 * Installs a discovery-module importer whose `discoverModels().getAll()` and
 * `new ModelRegistry().getAll()` both return the given array (by reference).
 *
 * @param models Rows the stub registry should report.
 */
function mockAgentDiscoveryModels(models: unknown[]) {
  setModelCatalogImportForTest(async () => {
    // A new stub module object is built for every import call.
    const discoveryModule = {
      discoverAuthStorage: () => ({}),
      AuthStorage: function AuthStorage() {},
      discoverModels: () => ({ getAll: () => models }),
      ModelRegistry: class {
        getAll() {
          return models;
        }
      },
    };
    return discoveryModule as unknown as AgentModelDiscoveryModule;
  });
}
/** Stubs discovery so the registry reports exactly one OpenAI model, `gpt-4.1`. */
function mockSingleOpenAiCatalogModel() {
  const onlyModel = { id: "gpt-4.1", provider: "openai", name: "GPT-4.1" };
  mockAgentDiscoveryModels([onlyModel]);
}
/**
 * Builds a plugin metadata snapshot fixture that lists no plugins.
 *
 * @returns A fresh object on every call, so callers may spread or mutate it freely.
 */
function emptyPluginMetadataSnapshot() {
  const policyHash = "test-policy";
  return {
    policyHash,
    configFingerprint: "test-config",
    index: { policyHash, plugins: [] },
    plugins: [],
  };
}
/**
 * Builds a metadata snapshot fixture with one plugin (`external-normalizer`) that declares a
 * model-id normalization policy for the `custom` provider: an alias `latest` -> `modern-model`,
 * a strippable `legacy/` prefix, and `vendor` as the prefix for bare ids.
 */
function modelIdNormalizationSnapshot() {
  const customProviderPolicy = {
    aliases: {
      latest: "modern-model",
    },
    stripPrefixes: ["legacy/"],
    prefixWhenBare: "vendor",
  };
  const normalizerPlugin = {
    id: "external-normalizer",
    modelIdNormalization: {
      providers: { custom: customProviderPolicy },
    },
  };
  return {
    ...emptyPluginMetadataSnapshot(),
    configFingerprint: "model-id-normalizers",
    plugins: [normalizerPlugin],
  };
}
/**
 * Builds a metadata snapshot fixture in which the enabled global plugin `external-provider`
 * contributes exactly one manifest catalog model under the `external` provider.
 *
 * @param model Catalog row to embed. When `name` is not supplied, the row's name is its `id`.
 * @returns A fresh snapshot object on every call.
 */
function manifestModelCatalogSnapshot(model: {
  id: string;
  name?: string;
  input?: Array<"text" | "image">;
  reasoning?: boolean;
  contextWindow?: number;
}) {
  const policyHash = "policy";
  const pluginId = "external-provider";
  const origin = "global";
  // `name` comes first so that any caller-supplied `name` in `model` overrides the id default.
  const catalogRow = { name: model.id, ...model };
  return {
    policyHash,
    index: {
      policyHash,
      plugins: [{ pluginId, enabled: true, origin }],
    },
    plugins: [
      {
        id: pluginId,
        origin,
        modelCatalog: {
          providers: {
            external: { models: [catalogRow] },
          },
        },
      },
    ],
  };
}
/**
 * Builds a configured-provider model fixture: text-only input, no reasoning, zero cost,
 * a 128,000 token context window, and 8192 max tokens.
 *
 * @param id Used as both the model id and its display name.
 */
function configuredModel(id: string) {
  const textOnly: Array<"text"> = ["text"];
  const zeroCost = { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 };
  return {
    id,
    name: id,
    reasoning: false,
    input: textOnly,
    cost: zeroCost,
    contextWindow: 128_000,
    maxTokens: 8192,
  };
}
// Element type of the array that `loadModelCatalog` resolves to, derived from the module's own
// signature so the lookup helpers below stay in sync with it.
type ModelCatalogEntry = Awaited<
ReturnType<typeof import("./model-catalog.js").loadModelCatalog>
>[number];
/**
 * Looks up the first catalog entry whose `provider` and `id` both match exactly.
 *
 * @returns The matching entry, or `undefined` when there is none.
 */
function findCatalogEntry(
  entries: readonly ModelCatalogEntry[],
  provider: string,
  id: string,
): ModelCatalogEntry | undefined {
  for (const candidate of entries) {
    if (candidate.provider === provider && candidate.id === id) {
      return candidate;
    }
  }
  return undefined;
}
/**
 * Like `findCatalogEntry`, but fails loudly when the entry is absent.
 *
 * @throws Error `expected catalog entry <provider>/<id>` when no entry matches.
 */
function requireCatalogEntry(
  entries: readonly ModelCatalogEntry[],
  provider: string,
  id: string,
): ModelCatalogEntry {
  const match = findCatalogEntry(entries, provider, id);
  if (match) {
    return match;
  }
  throw new Error(`expected catalog entry ${provider}/${id}`);
}
/** Asserts that the catalog holds no entry for the given provider/id pair. */
function expectNoCatalogEntry(entries: readonly ModelCatalogEntry[], provider: string, id: string) {
  const unexpected = findCatalogEntry(entries, provider, id);
  expect(unexpected).toBeUndefined();
}
/**
 * Returns the first argument of the mock's first recorded call as a plain record.
 *
 * @param mock Mock whose call log is inspected.
 * @param label Human-readable name used in the failure message.
 * @throws Error `expected <label>` when there is no such argument, or it is not a non-null,
 *   non-array object.
 */
function requireMockCallParam(
  mock: ReturnType<typeof vi.fn>,
  label: string,
): Record<string, unknown> {
  const firstArg = mock.mock.calls[0]?.[0];
  const isRecord = typeof firstArg === "object" && firstArg !== null && !Array.isArray(firstArg);
  if (isRecord) {
    return firstArg as Record<string, unknown>;
  }
  throw new Error(`expected ${label}`);
}
describe("loadModelCatalog", () => {
// One-time setup: register the module mocks first, then dynamically import ./model-catalog.js so
// the module under test is loaded after those registrations.
beforeAll(async () => {
readFileMock = vi.fn();
// Keep every real node:fs/promises export and replace only `readFile` with the test double.
vi.doMock("node:fs/promises", async (importOriginal) => ({
...(await importOriginal<typeof import("node:fs/promises")>()),
readFile: readFileMock,
}));
ensureOpenClawModelsJsonMock = vi.fn().mockResolvedValue({ agentDir: "/tmp", wrote: false });
vi.doMock("./models-config.js", () => ({
ensureOpenClawModelsJson: ensureOpenClawModelsJsonMock,
}));
vi.doMock("./agent-scope.js", () => ({
resolveDefaultAgentDir: () => "/tmp/openclaw",
}));
// Provider plugins contribute no supplemental rows unless a test overrides this mock.
vi.doMock("../plugins/provider-runtime.runtime.js", () => ({
augmentModelCatalogWithProviderPlugins: vi.fn().mockResolvedValue([]),
}));
currentPluginMetadataSnapshotMock = vi.fn(() => emptyPluginMetadataSnapshot());
loadPluginMetadataSnapshotMock = vi.fn(() => emptyPluginMetadataSnapshot());
vi.doMock("../plugins/current-plugin-metadata-snapshot.js", () => ({
getCurrentPluginMetadataSnapshot: currentPluginMetadataSnapshotMock,
}));
vi.doMock("../plugins/plugin-metadata-snapshot.js", () => ({
loadPluginMetadataSnapshot: loadPluginMetadataSnapshotMock,
// Use the current-snapshot mock's result; call the load mock only when that result is
// null or undefined.
resolvePluginMetadataSnapshot: (...args: unknown[]) =>
currentPluginMetadataSnapshotMock(...args) ?? loadPluginMetadataSnapshotMock(...args),
}));
// Import after the registrations above and bind the exports to the module-level variables.
({
setModelCatalogImportForTest,
findModelCatalogEntry,
findModelInCatalog,
loadManifestModelCatalog,
loadModelCatalog,
modelSupportsInput,
resetModelCatalogCacheForTest,
} = await import("./model-catalog.js"));
// Grab a handle on the mocked augment function so tests can stub and inspect it.
const providerRuntime = await import("../plugins/provider-runtime.runtime.js");
augmentCatalogMock = vi.mocked(providerRuntime.augmentModelCatalogWithProviderPlugins);
});
// Per-test baseline: cleared catalog cache, no models.json on disk, no current metadata snapshot,
// and an empty snapshot from the metadata loader.
beforeEach(() => {
  resetModelCatalogCacheForTest();

  const missingModelsJson = Object.assign(new Error("models.json missing"), { code: "ENOENT" });
  readFileMock.mockReset();
  readFileMock.mockRejectedValue(missingModelsJson);

  // These two keep their implementations; only the recorded calls are dropped.
  ensureOpenClawModelsJsonMock.mockClear();
  augmentCatalogMock.mockClear();

  currentPluginMetadataSnapshotMock.mockReset();
  currentPluginMetadataSnapshotMock.mockReturnValue(undefined);

  loadPluginMetadataSnapshotMock.mockReset();
  loadPluginMetadataSnapshotMock.mockReturnValue(emptyPluginMetadataSnapshot());
});
// Per-test teardown so state installed by one test does not leak into the next.
afterEach(() => {
// Called without an importer; presumably this restores the default discovery import —
// confirm against model-catalog.js.
setModelCatalogImportForTest();
resetModelCatalogCacheForTest();
vi.restoreAllMocks();
});
// Suite teardown: unregister each module mocked with vi.doMock in beforeAll, in the same order.
afterAll(() => {
vi.doUnmock("node:fs/promises");
vi.doUnmock("./models-config.js");
vi.doUnmock("./agent-scope.js");
vi.doUnmock("../plugins/provider-runtime.runtime.js");
vi.doUnmock("../plugins/current-plugin-metadata-snapshot.js");
vi.doUnmock("../plugins/plugin-metadata-snapshot.js");
});
it("retries after import failure without poisoning the cache", async () => {
  // Override logger levels while the failing import runs; always undone in `finally`.
  setLoggerOverride({ level: "silent", consoleLevel: "warn" });
  try {
    const importAttempts = mockCatalogImportFailThenRecover();
    const config = {} as OpenClawConfig;

    // First load hits the throwing import and yields an empty catalog.
    const failedLoad = await loadModelCatalog({ config });
    expect(failedLoad).toStrictEqual([]);

    // Second load must run the import again rather than reuse the failed result.
    const recoveredLoad = await loadModelCatalog({ config });
    expect(recoveredLoad).toEqual([{ id: "gpt-4.1", name: "GPT-4.1", provider: "openai" }]);
    expect(importAttempts()).toBe(2);
  } finally {
    setLoggerOverride(null);
    resetLogger();
  }
});
it("reloads dynamic registry entries after clearing the cache", async () => {
  // Expected row shape: the optional fields are present with explicit `undefined` values.
  const expectedOllamaRow = (id: string, name: string) => ({
    id,
    name,
    provider: "ollama",
    contextWindow: undefined,
    reasoning: undefined,
    input: undefined,
    compat: undefined,
  });

  const registryModels = [{ id: "existing", name: "Existing", provider: "ollama" }];
  mockAgentDiscoveryModels(registryModels);
  const beforeReset = await loadModelCatalog({ config: {} as OpenClawConfig });
  expect(beforeReset).toStrictEqual([expectedOllamaRow("existing", "Existing")]);

  // Grow the registry, drop the cache, and load again: the new row must show up.
  registryModels.push({ id: "glm-5.1:cloud", name: "GLM 5.1 Cloud", provider: "ollama" });
  resetModelCatalogCacheForTest();
  mockAgentDiscoveryModels(registryModels);
  const afterReset = await loadModelCatalog({ config: {} as OpenClawConfig });
  expect(afterReset).toStrictEqual([
    expectedOllamaRow("existing", "Existing"),
    expectedOllamaRow("glm-5.1:cloud", "GLM 5.1 Cloud"),
  ]);
});
it("returns partial results on discovery errors", async () => {
  setLoggerOverride({ level: "silent", consoleLevel: "warn" });
  try {
    // One healthy row followed by a row whose `id` getter throws when read.
    const listModelsWithBrokenRow = () => [
      { id: "gpt-4.1", name: "GPT-4.1", provider: "openai" },
      {
        get id() {
          throw new Error("boom");
        },
        provider: "openai",
        name: "bad",
      },
    ];
    setModelCatalogImportForTest(async () => {
      const discoveryModule = {
        discoverAuthStorage: () => ({}),
        AuthStorage: function AuthStorage() {},
        discoverModels: () => ({ getAll: listModelsWithBrokenRow }),
        ModelRegistry: class {
          getAll() {
            return listModelsWithBrokenRow();
          }
        },
      };
      return discoveryModule as unknown as AgentModelDiscoveryModule;
    });

    const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });
    // Only the healthy row is expected to survive.
    expect(catalog).toEqual([{ id: "gpt-4.1", name: "GPT-4.1", provider: "openai" }]);
  } finally {
    setLoggerOverride(null);
    resetLogger();
  }
});
it("does not prepare models.json or import provider discovery when loading fallback catalog in read-only mode", async () => {
  // Both tripwires throw if the loader touches provider discovery or a metadata scan.
  const discoveryImportSpy = vi.fn(async () => {
    throw new Error("provider discovery should not load");
  });
  setModelCatalogImportForTest(
    discoveryImportSpy as unknown as () => Promise<AgentModelDiscoveryModule>,
  );
  currentPluginMetadataSnapshotMock.mockReturnValueOnce(undefined);
  loadPluginMetadataSnapshotMock.mockImplementationOnce(() => {
    throw new Error("metadata scan should not run");
  });

  const config = {
    models: {
      providers: {
        openai: {
          baseUrl: "https://openai.example.com/v1",
          models: [
            {
              id: "gpt-test",
              name: "GPT Test",
              reasoning: false,
              input: ["text"],
              cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
              contextWindow: 200_000,
              maxTokens: 8192,
            },
          ],
        },
      },
    },
  } as OpenClawConfig;
  const catalog = await loadModelCatalog({ config, readOnly: true });

  // The configured model is served straight from config.
  const configuredEntry = requireCatalogEntry(catalog, "openai", "gpt-test");
  expect(configuredEntry.name).toBe("GPT Test");
  expect(ensureOpenClawModelsJsonMock).not.toHaveBeenCalled();
  expect(discoveryImportSpy).not.toHaveBeenCalled();
  expect(loadPluginMetadataSnapshotMock).not.toHaveBeenCalled();
});
it("filters suppressed built-ins from persisted read-only catalog rows", async () => {
  // Persisted models.json content: the spark model appears under two providers, alongside one
  // model that is not suppressed.
  const persistedCatalog = {
    providers: {
      "openai-codex": {
        models: [
          {
            id: "gpt-5.3-codex-spark",
            name: "GPT-5.3 Codex Spark",
            reasoning: true,
            contextWindow: 128000,
            input: ["text"],
          },
          {
            id: "gpt-5.4",
            name: "GPT-5.4",
            reasoning: true,
            contextWindow: 272000,
            input: ["text", "image"],
          },
        ],
      },
      openai: {
        models: [
          {
            id: "gpt-5.3-codex-spark",
            name: "GPT-5.3 Codex Spark",
          },
        ],
      },
    },
  };
  readFileMock.mockResolvedValueOnce(JSON.stringify(persistedCatalog));

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig, readOnly: true });

  expect(catalog).toEqual([
    {
      provider: "openai-codex",
      id: "gpt-5.4",
      name: "GPT-5.4",
      reasoning: true,
      contextWindow: 272000,
      input: ["text", "image"],
      compat: undefined,
    },
  ]);
  expect(ensureOpenClawModelsJsonMock).not.toHaveBeenCalled();
  expect(augmentCatalogMock).not.toHaveBeenCalled();
});
it("falls back to manifest catalog rows when persisted read-only catalog has no model rows", async () => {
  // Persisted file has provider overrides only, i.e. no `models` rows at all.
  const persistedCatalog = {
    providers: {
      openai: {
        modelOverrides: {
          "gpt-4.1": {
            contextWindow: 128000,
          },
        },
      },
    },
  };
  readFileMock.mockResolvedValueOnce(JSON.stringify(persistedCatalog));

  // The shared fixture builder produces the same single-model manifest snapshot this test needs.
  currentPluginMetadataSnapshotMock.mockReturnValueOnce(
    manifestModelCatalogSnapshot({ id: "external-fast", name: "External Fast" }),
  );

  const discoveryImportSpy = vi.fn(async () => {
    throw new Error("provider discovery should not load");
  });
  setModelCatalogImportForTest(
    discoveryImportSpy as unknown as () => Promise<AgentModelDiscoveryModule>,
  );

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig, readOnly: true });

  expect(catalog).toEqual([
    {
      provider: "external",
      id: "external-fast",
      name: "External Fast",
      input: ["text"],
      reasoning: false,
    },
  ]);
  expect(ensureOpenClawModelsJsonMock).not.toHaveBeenCalled();
  expect(discoveryImportSpy).not.toHaveBeenCalled();
});
it("preserves registry defaults for minimal persisted read-only catalog rows", async () => {
  // A persisted row that carries nothing but an id.
  const persistedCatalog = {
    providers: {
      custom: {
        models: [{ id: "local-tiny" }],
      },
    },
  };
  readFileMock.mockResolvedValueOnce(JSON.stringify(persistedCatalog));

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig, readOnly: true });

  // Name, reasoning, context window, and input are all expected to be filled in.
  expect(catalog).toEqual([
    {
      provider: "custom",
      id: "local-tiny",
      name: "local-tiny",
      reasoning: false,
      contextWindow: 128000,
      input: ["text"],
      compat: undefined,
    },
  ]);
  expect(ensureOpenClawModelsJsonMock).not.toHaveBeenCalled();
  expect(augmentCatalogMock).not.toHaveBeenCalled();
});
it("normalizes persisted read-only catalog rows with manifest model id policies", async () => {
  currentPluginMetadataSnapshotMock.mockReturnValue(modelIdNormalizationSnapshot());
  const persistedCatalog = {
    providers: {
      custom: {
        models: [
          { id: "latest", name: "Latest Alias" },
          { id: "legacy/trimmed" },
          { id: "vendor/already-prefixed" },
        ],
      },
    },
  };
  readFileMock.mockResolvedValueOnce(JSON.stringify(persistedCatalog));

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig, readOnly: true });

  // [normalized id, expected name] for the alias, stripped-prefix, and already-prefixed rows.
  const expectedNames = [
    ["vendor/modern-model", "Latest Alias"],
    ["vendor/trimmed", "vendor/trimmed"],
    ["vendor/already-prefixed", "vendor/already-prefixed"],
  ] as const;
  for (const [normalizedId, expectedName] of expectedNames) {
    expect(requireCatalogEntry(catalog, "custom", normalizedId).name).toBe(expectedName);
  }
  expect(loadPluginMetadataSnapshotMock).not.toHaveBeenCalled();
});
it("reuses injected metadata for persisted read-only catalog normalization", async () => {
  type InjectedSnapshot = NonNullable<Parameters<typeof loadModelCatalog>[0]>["metadataSnapshot"];

  // No current snapshot is available; the policy can only come from the injected one.
  currentPluginMetadataSnapshotMock.mockReturnValue(undefined);
  const persistedCatalog = {
    providers: {
      custom: {
        models: [{ id: "latest", name: "Latest Alias" }],
      },
    },
  };
  readFileMock.mockResolvedValueOnce(JSON.stringify(persistedCatalog));

  const catalog = await loadModelCatalog({
    config: {} as OpenClawConfig,
    readOnly: true,
    metadataSnapshot: modelIdNormalizationSnapshot() as unknown as InjectedSnapshot,
  });

  expect(requireCatalogEntry(catalog, "custom", "vendor/modern-model").name).toBe("Latest Alias");
  expect(loadPluginMetadataSnapshotMock).not.toHaveBeenCalled();
});
it("reuses injected metadata when read-only catalog falls back to manifest rows", async () => {
  type InjectedSnapshot = NonNullable<Parameters<typeof loadModelCatalog>[0]>["metadataSnapshot"];

  currentPluginMetadataSnapshotMock.mockReturnValue(undefined);

  // Injected snapshot: the empty fixture with one enabled global plugin that ships one model.
  const pluginIndexEntry = {
    pluginId: "external-provider",
    enabled: true,
    origin: "global",
  };
  const providerPlugin = {
    id: "external-provider",
    origin: "global",
    modelCatalog: {
      providers: {
        external: {
          models: [{ id: "external-fast", name: "External Fast" }],
        },
      },
    },
  };
  const injectedSnapshot = {
    ...emptyPluginMetadataSnapshot(),
    index: {
      policyHash: "policy",
      plugins: [pluginIndexEntry],
    },
    plugins: [providerPlugin],
  };

  const catalog = await loadModelCatalog({
    config: {} as OpenClawConfig,
    readOnly: true,
    metadataSnapshot: injectedSnapshot as unknown as InjectedSnapshot,
  });

  expect(catalog).toEqual([
    {
      provider: "external",
      id: "external-fast",
      name: "External Fast",
      input: ["text"],
      reasoning: false,
    },
  ]);
  expect(loadPluginMetadataSnapshotMock).not.toHaveBeenCalled();
});
it("loads manifest model id policies once for persisted read-only catalog rows", async () => {
  currentPluginMetadataSnapshotMock.mockReturnValue(undefined);
  loadPluginMetadataSnapshotMock.mockReturnValue(modelIdNormalizationSnapshot());

  // Four persisted rows, so a per-row metadata load would show up as four calls.
  const persistedModels = ["model-a", "model-b", "model-c", "model-d"].map((id) => ({ id }));
  readFileMock.mockResolvedValueOnce(
    JSON.stringify({ providers: { custom: { models: persistedModels } } }),
  );

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig, readOnly: true });

  for (const normalizedId of ["vendor/model-a", "vendor/model-d"]) {
    expect(requireCatalogEntry(catalog, "custom", normalizedId).id).toBe(normalizedId);
  }
  expect(loadPluginMetadataSnapshotMock).toHaveBeenCalledTimes(1);
});
it("loads manifest model id policies once for configured read-only catalog rows", async () => {
  currentPluginMetadataSnapshotMock.mockReturnValue(undefined);
  loadPluginMetadataSnapshotMock.mockReturnValue(modelIdNormalizationSnapshot());

  // Four configured rows, so a per-row metadata load would show up as four calls.
  const customModels = ["model-a", "model-b", "model-c", "model-d"].map((id) =>
    configuredModel(id),
  );
  const config = {
    models: {
      providers: {
        custom: {
          api: "openai-completions",
          baseUrl: "https://custom.example/v1",
          models: customModels,
        },
      },
    },
  } as OpenClawConfig;

  const catalog = await loadModelCatalog({ readOnly: true, config });

  for (const normalizedId of ["vendor/model-a", "vendor/model-d"]) {
    expect(requireCatalogEntry(catalog, "custom", normalizedId).id).toBe(normalizedId);
  }
  expect(loadPluginMetadataSnapshotMock).toHaveBeenCalledTimes(1);
});
it("loads manifest model id policies once for discovered catalog rows", async () => {
  currentPluginMetadataSnapshotMock.mockReturnValue(undefined);
  loadPluginMetadataSnapshotMock.mockReturnValue(modelIdNormalizationSnapshot());

  // Rows model-a..model-d named "Model A".."Model D", all under the `custom` provider.
  const discoveredRows = ["a", "b", "c", "d"].map((suffix) => ({
    provider: "custom",
    id: `model-${suffix}`,
    name: `Model ${suffix.toUpperCase()}`,
  }));
  mockAgentDiscoveryModels(discoveredRows);

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig, useCache: false });

  expect(requireCatalogEntry(catalog, "custom", "vendor/model-a").name).toBe("Model A");
  expect(requireCatalogEntry(catalog, "custom", "vendor/model-d").name).toBe("Model D");
  expect(loadPluginMetadataSnapshotMock).toHaveBeenCalledTimes(1);
});
it("preserves provider context defaults for persisted read-only catalog rows", async () => {
  // Provider-level contextWindow plus one row without and one row with its own value.
  const persistedCatalog = {
    providers: {
      custom: {
        contextWindow: 262144,
        models: [
          { id: "inherits-provider-context" },
          { id: "overrides-context", contextWindow: 65536 },
        ],
      },
    },
  };
  readFileMock.mockResolvedValueOnce(JSON.stringify(persistedCatalog));

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig, readOnly: true });

  const expectedRow = (id: string, contextWindow: number) => ({
    provider: "custom",
    id,
    name: id,
    reasoning: false,
    contextWindow,
    input: ["text"],
    compat: undefined,
  });
  expect(catalog).toEqual([
    expectedRow("inherits-provider-context", 262144),
    expectedRow("overrides-context", 65536),
  ]);
  expect(ensureOpenClawModelsJsonMock).not.toHaveBeenCalled();
  expect(augmentCatalogMock).not.toHaveBeenCalled();
});
it("does not synthesize stale openai-codex/gpt-5.3-codex-spark entries from gpt-5.4", async () => {
  const codexProvider = "openai-codex";
  mockAgentDiscoveryModels([
    {
      id: "gpt-5.4",
      provider: codexProvider,
      name: "GPT-5.3 Codex",
      reasoning: true,
      contextWindow: 200000,
      input: ["text"],
    },
    {
      id: "gpt-5.2-codex",
      provider: codexProvider,
      name: "GPT-5.2 Codex",
    },
  ]);

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });

  // The spark id must not be derived from the discovered rows; gpt-5.4 itself stays as-is.
  expectNoCatalogEntry(catalog, codexProvider, "gpt-5.3-codex-spark");
  const discoveredEntry = requireCatalogEntry(catalog, codexProvider, "gpt-5.4");
  expect(discoveredEntry.name).toBe("GPT-5.3 Codex");
});
it("filters stale gpt-5.3-codex-spark built-ins from the catalog", async () => {
  const sparkId = "gpt-5.3-codex-spark";
  // The same spark model reported under each provider the suppression mock covers.
  const sparkRow = (provider: string, input: string[]) => ({
    id: sparkId,
    provider,
    name: "GPT-5.3 Codex Spark",
    reasoning: true,
    contextWindow: 128000,
    input,
  });
  mockAgentDiscoveryModels([
    sparkRow("openai", ["text", "image"]),
    sparkRow("azure-openai-responses", ["text", "image"]),
    sparkRow("openai-codex", ["text"]),
  ]);

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });

  for (const provider of ["openai", "azure-openai-responses", "openai-codex"]) {
    expectNoCatalogEntry(catalog, provider, sparkId);
  }
});
it("keeps available openai-codex 5.1/5.2/5.3 built-ins in the catalog", async () => {
  // [id, display name] for every codex row that must survive catalog loading.
  const keptModels = [
    ["gpt-5.1-codex-mini", "GPT-5.1 Codex Mini"],
    ["gpt-5.2-codex", "GPT-5.2 Codex"],
    ["gpt-5.3-codex", "GPT-5.3 Codex"],
    ["gpt-5.5", "GPT-5.5"],
  ] as const;
  mockAgentDiscoveryModels(
    keptModels.map(([id, name]) => ({
      id,
      provider: "openai-codex",
      name,
      reasoning: true,
      contextWindow: 400000,
      input: ["text", "image"],
    })),
  );

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });

  for (const [id, name] of keptModels) {
    expect(requireCatalogEntry(catalog, "openai-codex", id).name).toBe(name);
  }
});
it("does not synthesize gpt-5.4 OpenAI forward-compat entries from template models", async () => {
  // OpenAI rows share everything but id, name, and context window.
  const openAiRow = (id: string, name: string, contextWindow: number) => ({
    id,
    provider: "openai",
    name,
    reasoning: true,
    contextWindow,
    input: ["text", "image"],
  });
  mockAgentDiscoveryModels([
    openAiRow("gpt-5.2", "GPT-5.2", 1_050_000),
    openAiRow("gpt-5.2-pro", "GPT-5.2 Pro", 1_050_000),
    openAiRow("gpt-5-mini", "GPT-5 mini", 400_000),
    openAiRow("gpt-5-nano", "GPT-5 nano", 400_000),
    {
      id: "gpt-5.4",
      provider: "openai-codex",
      name: "GPT-5.3 Codex",
      reasoning: true,
      contextWindow: 272000,
      input: ["text", "image"],
    },
  ]);

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });

  // No gpt-5.4* row may appear under `openai`.
  const hasOpenAiGpt54 = catalog.some(
    (row) => row.provider === "openai" && row.id.startsWith("gpt-5.4"),
  );
  expect(hasOpenAiGpt54).toBe(false);

  // The discovered codex row is kept untouched.
  const codexEntry = requireCatalogEntry(catalog, "openai-codex", "gpt-5.4");
  expect(codexEntry.name).toBe("GPT-5.3 Codex");

  // And no codex mini variant is invented.
  const hasCodexMini = catalog.some(
    (row) => row.provider === "openai-codex" && row.id === "gpt-5.4-mini",
  );
  expect(hasCodexMini).toBe(false);
});
// Verifies that rows returned by the provider-plugin augmentation mock end up in the catalog
// next to the single discovered OpenAI model.
it("merges provider-owned supplemental catalog entries", async () => {
mockSingleOpenAiCatalogModel();
augmentCatalogMock.mockResolvedValueOnce([
{
provider: "kilocode",
id: "google/gemini-3-pro-preview",
name: "Gemini 3 Pro Preview",
input: ["text", "image"],
reasoning: true,
contextWindow: 1048576,
},
]);
const result = await loadModelCatalog({ config: {} as OpenClawConfig });
// NOTE(review): the supplemental row above uses id "google/gemini-3-pro-preview", but the lookup
// below expects "google/gemini-3.1-pro-preview". Presumably loadModelCatalog rewrites the id;
// confirm this is intentional normalization and not a typo in either literal.
const entry = requireCatalogEntry(result, "kilocode", "google/gemini-3.1-pro-preview");
expect(entry.name).toBe("Gemini 3 Pro Preview");
});
it("loads manifest catalog rows from the current metadata snapshot without provider runtime", () => {
  currentPluginMetadataSnapshotMock.mockReturnValue(
    manifestModelCatalogSnapshot({
      id: "external-fast",
      name: "External Fast",
      input: ["text", "image"],
      reasoning: true,
      contextWindow: 32000,
    }),
  );

  const manifestRows = loadManifestModelCatalog({ config: {} as OpenClawConfig });

  // Neither a metadata scan nor the provider runtime may be involved.
  expect(loadPluginMetadataSnapshotMock).not.toHaveBeenCalled();
  expect(augmentCatalogMock).not.toHaveBeenCalled();
  expect(manifestRows).toEqual([
    {
      provider: "external",
      id: "external-fast",
      name: "External Fast",
      input: ["text", "image"],
      reasoning: true,
      contextWindow: 32000,
    },
  ]);
});
it("reuses planned manifest catalog rows for the same config and metadata snapshot", () => {
  const config = {} as OpenClawConfig;
  // The same snapshot object is returned for both loads.
  const sharedSnapshot = manifestModelCatalogSnapshot({ id: "external-fast" });
  currentPluginMetadataSnapshotMock.mockReturnValue(sharedSnapshot);

  const firstRows = loadManifestModelCatalog({ config });
  const secondRows = loadManifestModelCatalog({ config });

  // Identity, not just equality: the second load must hand back the first result.
  expect(secondRows).toBe(firstRows);
  expect(firstRows).toEqual([
    {
      provider: "external",
      id: "external-fast",
      name: "external-fast",
      input: ["text"],
      reasoning: false,
    },
  ]);
  expect(loadPluginMetadataSnapshotMock).not.toHaveBeenCalled();
});
it("refreshes manifest catalog rows when the metadata snapshot changes", () => {
  const config = {} as OpenClawConfig;
  // First lookup sees the "fast" snapshot; every later lookup sees "slow".
  currentPluginMetadataSnapshotMock.mockReturnValueOnce(
    manifestModelCatalogSnapshot({ id: "external-fast" }),
  );
  currentPluginMetadataSnapshotMock.mockReturnValue(
    manifestModelCatalogSnapshot({ id: "external-slow" }),
  );

  const beforeChange = loadManifestModelCatalog({ config });
  const afterChange = loadManifestModelCatalog({ config });

  // A different snapshot must produce a fresh result, not the earlier array.
  expect(afterChange).not.toBe(beforeChange);
  expect(beforeChange[0]?.id).toBe("external-fast");
  expect(afterChange[0]?.id).toBe("external-slow");
});
it("lets read-only manifest catalog reuse the current workspace-scoped snapshot", () => {
  const config = {} as OpenClawConfig;
  loadManifestModelCatalog({ config, fallbackToMetadataScan: false });

  // Inspect the params handed to the current-snapshot lookup.
  const snapshotParams = requireMockCallParam(
    currentPluginMetadataSnapshotMock,
    "current snapshot params",
  );
  expect(snapshotParams.allowWorkspaceScopedSnapshot).toBe(true);
  expect(loadPluginMetadataSnapshotMock).not.toHaveBeenCalled();
});
it("passes explicit env when checking current manifest catalog snapshot compatibility", () => {
  const config = {} as OpenClawConfig;
  const env = { HOME: "/tmp/openclaw-model-catalog-env" } as NodeJS.ProcessEnv;
  loadManifestModelCatalog({ config, env, fallbackToMetadataScan: false });

  const snapshotParams = requireMockCallParam(
    currentPluginMetadataSnapshotMock,
    "current snapshot params",
  );
  // The exact env object (by identity) must be forwarded to the snapshot lookup.
  expect(snapshotParams.env).toBe(env);
  expect(snapshotParams.allowWorkspaceScopedSnapshot).toBe(true);
  expect(loadPluginMetadataSnapshotMock).not.toHaveBeenCalled();
});
it("dedupes supplemental models against registry entries", async () => {
  mockSingleOpenAiCatalogModel();
  // One genuinely new row (ollama) plus one row that repeats openai/gpt-4.1.
  augmentCatalogMock.mockResolvedValueOnce([
    {
      provider: "ollama",
      id: "llama3.2",
      name: "Llama 3.2",
      reasoning: true,
      input: ["text"],
      contextWindow: 1_048_576,
    },
    {
      provider: "openai",
      id: "gpt-4.1",
      name: "Duplicate GPT-4.1",
    },
  ]);

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });

  const ollamaEntry = requireCatalogEntry(catalog, "ollama", "llama3.2");
  expect(ollamaEntry.name).toBe("Llama 3.2");
  // The repeated openai/gpt-4.1 row must collapse into a single entry.
  const gpt41Rows = catalog.filter((row) => row.provider === "openai" && row.id === "gpt-4.1");
  expect(gpt41Rows).toHaveLength(1);
});
it("includes configured provider models missing from discovery", async () => {
  mockSingleOpenAiCatalogModel();
  // The modelscope model exists only in user config for this test.
  const config = {
    models: {
      providers: {
        modelscope: {
          baseUrl: "https://api-inference.modelscope.cn/v1",
          models: [
            {
              id: "Qwen/Qwen3.5-35B-A3B",
              name: "Qwen3.5 35B",
              input: ["text", "image"],
              reasoning: true,
              contextWindow: 128_000,
              maxTokens: 8192,
              cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
            },
          ],
        },
      },
    },
  } as OpenClawConfig;

  const catalog = await loadModelCatalog({ config });

  // The configured metadata should surface unchanged on the catalog row.
  const configured = requireCatalogEntry(catalog, "modelscope", "Qwen/Qwen3.5-35B-A3B");
  expect(configured.name).toBe("Qwen3.5 35B");
  expect(configured.input).toEqual(["text", "image"]);
  expect(configured.reasoning).toBe(true);
  expect(configured.contextWindow).toBe(128_000);
});
it("overlays configured model compat onto discovered catalog rows", async () => {
  // Discovery reports the bare model id with its own compat flags.
  mockAgentDiscoveryModels([
    {
      id: "Qwen/Qwen3-8B",
      name: "Qwen3 8B",
      provider: "vllm",
      reasoning: false,
      compat: { supportsStrictMode: false },
    },
  ]);
  // Config references the same model with a provider-prefixed id and extra compat.
  const config = {
    models: {
      providers: {
        vllm: {
          baseUrl: "http://localhost:9000/v1",
          api: "openai-completions",
          models: [
            {
              id: "vllm/Qwen/Qwen3-8B",
              name: "Configured Qwen3 8B",
              compat: { thinkingFormat: "qwen-chat-template" },
            },
          ],
        },
      },
    },
  } as unknown as OpenClawConfig;

  const catalog = await loadModelCatalog({ config });

  const merged = requireCatalogEntry(catalog, "vllm", "Qwen/Qwen3-8B");
  // Both spellings of the id must resolve to one row, not two.
  const vllmRows = catalog.filter((row) => row.provider === "vllm");
  expect(vllmRows).toHaveLength(1);
  // The discovered display name is kept over the configured one.
  expect(merged.name).toBe("Qwen3 8B");
  // NOTE(review): discovery says reasoning: false and config omits it, yet the
  // merged row is expected to be true — presumably implied by the configured
  // thinkingFormat; confirm against the overlay logic.
  expect(merged.reasoning).toBe(true);
  expect(merged.compat).toEqual(
    expect.objectContaining({
      supportsStrictMode: false,
      thinkingFormat: "qwen-chat-template",
    }),
  );
});
it("overlays configured model compat onto persisted read-only catalog rows", async () => {
  // Persisted catalog payload served through the mocked file read.
  const persistedCatalog = {
    providers: {
      vllm: {
        models: [
          {
            id: "Qwen/Qwen3-8B",
            name: "Qwen3 8B",
            reasoning: false,
            compat: { supportsStrictMode: false },
          },
        ],
      },
    },
  };
  readFileMock.mockResolvedValue(JSON.stringify(persistedCatalog));
  // Config references the same model with a provider-prefixed id and extra compat.
  const config = {
    models: {
      providers: {
        vllm: {
          baseUrl: "http://localhost:9000/v1",
          api: "openai-completions",
          models: [
            {
              id: "vllm/Qwen/Qwen3-8B",
              name: "Configured Qwen3 8B",
              compat: { thinkingFormat: "qwen-chat-template" },
            },
          ],
        },
      },
    },
  } as unknown as OpenClawConfig;

  const catalog = await loadModelCatalog({ config, readOnly: true });

  const merged = requireCatalogEntry(catalog, "vllm", "Qwen/Qwen3-8B");
  // Both spellings of the id must resolve to one row, not two.
  const vllmRows = catalog.filter((row) => row.provider === "vllm");
  expect(vllmRows).toHaveLength(1);
  // The persisted display name is kept over the configured one.
  expect(merged.name).toBe("Qwen3 8B");
  // NOTE(review): the persisted row says reasoning: false and config omits it,
  // yet the merged row is expected to be true — presumably implied by the
  // configured thinkingFormat; confirm against the overlay logic.
  expect(merged.reasoning).toBe(true);
  expect(merged.compat).toEqual(
    expect.objectContaining({
      supportsStrictMode: false,
      thinkingFormat: "qwen-chat-template",
    }),
  );
});
it("merges manifest model catalog rows on the normal catalog path", async () => {
  mockSingleOpenAiCatalogModel();
  // Current snapshot: an otherwise empty snapshot plus one bundled plugin that
  // declares a byteplus model in its manifest catalog.
  currentPluginMetadataSnapshotMock.mockReturnValue({
    ...emptyPluginMetadataSnapshot(),
    plugins: [
      {
        id: "byteplus",
        origin: "bundled",
        providers: ["byteplus"],
        modelCatalog: {
          providers: {
            byteplus: {
              baseUrl: "https://ark.ap-southeast.bytepluses.com/api/v3",
              api: "openai-completions",
              models: [
                {
                  id: "seed-1-8-251228",
                  name: "Doubao Seed 1.8",
                  input: ["text", "image"],
                  contextWindow: 256_000,
                },
              ],
            },
          },
        },
      },
    ],
  });

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });

  // The manifest-declared row must be present with its declared metadata.
  const manifestEntry = requireCatalogEntry(catalog, "byteplus", "seed-1-8-251228");
  expect(manifestEntry.name).toBe("Doubao Seed 1.8");
  expect(manifestEntry.input).toEqual(["text", "image"]);
  expect(manifestEntry.contextWindow).toBe(256_000);
});
it("keeps configured LM Studio models visible without runtime catalog augmentation", async () => {
  mockSingleOpenAiCatalogModel();
  // The augmentation hook contributes nothing for this load.
  augmentCatalogMock.mockResolvedValueOnce([]);
  const config = {
    models: {
      providers: {
        lmstudio: {
          baseUrl: "http://127.0.0.1:1234/v1",
          models: [
            {
              id: "qwen3.6-27b@iq3_xxs",
              name: "Qwen 3.6 27B",
              input: ["text"],
              reasoning: false,
              contextWindow: 128_000,
              maxTokens: 8192,
              cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
            },
          ],
        },
      },
    },
  } as OpenClawConfig;

  const catalog = await loadModelCatalog({ config });

  // The configured model must still be listed with its configured metadata.
  const lmStudioEntry = requireCatalogEntry(catalog, "lmstudio", "qwen3.6-27b@iq3_xxs");
  expect(lmStudioEntry.name).toBe("Qwen 3.6 27B");
  expect(lmStudioEntry.contextWindow).toBe(128_000);
});
it("dedupes configured models without rewriting provider ids", async () => {
  // Discovery spells the provider "z.ai"; the config below spells it "z-ai".
  mockAgentDiscoveryModels([{ id: "glm-5", provider: "z.ai", name: "GLM-5" }]);
  const config = {
    models: {
      providers: {
        "z-ai": {
          baseUrl: "https://api.z.ai/v1",
          models: [
            {
              id: "glm-5",
              name: "Configured GLM-5",
              input: ["text", "image"],
              reasoning: false,
              contextWindow: 128_000,
              maxTokens: 8192,
              cost: { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 },
            },
          ],
        },
      },
    },
  } as OpenClawConfig;

  const catalog = await loadModelCatalog({ config });

  // Probe each row on its own so only rows matching "z-ai"/"glm-5" are counted.
  const zAiRows = catalog.filter((row) => findModelInCatalog([row], "z-ai", "glm-5"));
  expect(zAiRows).toHaveLength(1);
  // The surviving row keeps the configured provider spelling and display name.
  const [configuredRow] = zAiRows;
  expect(configuredRow?.provider).toBe("z-ai");
  expect(configuredRow?.id).toBe("glm-5");
  expect(configuredRow?.name).toBe("Configured GLM-5");
});
it("does not add unrelated models when provider plugins return nothing", async () => {
  mockSingleOpenAiCatalogModel();

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });

  // No qianfan/deepseek-v3.2 row may appear when nothing supplied one.
  const hasQianfanDeepseek = catalog.some(
    (row) => row.provider === "qianfan" && row.id === "deepseek-v3.2",
  );
  expect(hasQianfanDeepseek).toBe(false);
});
it("does not duplicate provider-owned supplemental models already present in ModelRegistry", async () => {
  // Discovery already knows kilocode's "kilo/auto" ...
  mockAgentDiscoveryModels([
    {
      id: "kilo/auto",
      provider: "kilocode",
      name: "Kilo Auto",
    },
  ]);
  // ... and the augmentation hook offers the same provider/id under another name.
  augmentCatalogMock.mockResolvedValueOnce([
    {
      provider: "kilocode",
      id: "kilo/auto",
      name: "Configured Kilo Auto",
      reasoning: true,
      input: ["text", "image"],
      contextWindow: 1_000_000,
    },
  ]);

  const catalog = await loadModelCatalog({ config: {} as OpenClawConfig });

  const kiloAutoRows = catalog.filter(
    (row) => row.provider === "kilocode" && row.id === "kilo/auto",
  );
  // Exactly one row survives, carrying the discovered name.
  expect(kiloAutoRows).toHaveLength(1);
  expect(kiloAutoRows[0]?.name).toBe("Kilo Auto");
});
it("does not match models across provider id variants", () => {
  // The catalog row is spelled "z.ai"; looking it up as "z-ai" must find nothing.
  const lookup = findModelInCatalog(
    [{ provider: "z.ai", id: "glm-5", name: "GLM-5" }],
    "z-ai",
    "glm-5",
  );
  expect(lookup).toBeUndefined();
});
it("resolves catalog entries with explicit providers and unique providerless matches", () => {
  // Two providers share the id "shared"; the modelscope id is unique.
  const catalog = [
    { provider: "first", id: "shared", name: "First", input: ["text"] },
    { provider: "second", id: "shared", name: "Second", input: ["text", "image"] },
    { provider: "modelscope", id: "qwen/qwen3.5-35b-a3b", name: "Qwen", input: ["text"] },
  ] satisfies Awaited<ReturnType<typeof loadModelCatalog>>;
  const secondShared = catalog[1];
  const modelscopeQwen = catalog[2];

  // Explicit provider: the model id is looked up with different letter casing.
  const byProviderUpper = findModelCatalogEntry(catalog, { provider: "second", modelId: "SHARED" });
  expect(byProviderUpper).toEqual(secondShared);
  const byProviderMixed = findModelCatalogEntry(catalog, {
    provider: "modelscope",
    modelId: "Qwen/Qwen3.5-35B-A3B",
  });
  expect(byProviderMixed).toEqual(modelscopeQwen);

  // No provider: an id shared by two providers resolves to nothing,
  // while an id that occurs once resolves to that row.
  expect(findModelCatalogEntry(catalog, { modelId: "shared" })).toBeUndefined();
  expect(findModelCatalogEntry(catalog, { modelId: "Qwen/Qwen3.5-35B-A3B" })).toEqual(
    modelscopeQwen,
  );

  // Input capability follows each row's `input` list.
  expect(modelSupportsInput(secondShared, "image")).toBe(true);
  expect(modelSupportsInput(modelscopeQwen, "image")).toBe(false);
});
});