mirror of
https://github.com/openclaw/openclaw.git
synced 2026-06-25 05:29:34 +00:00
Summary: - Add a shared live provider catalog runtime for SDK-backed providers. - Route OpenAI, xAI, OpenCode Go, Chutes, DeepInfra, Venice, NVIDIA, and Vercel AI Gateway live model discovery through the shared helper. - Remove duplicated provider-local live catalog caching and harden auth marker stripping, empty live-result retries, and OpenAI custom-base-url handling. Verification: - node scripts/run-vitest.mjs extensions/openai/openai-provider.test.ts src/plugin-sdk/provider-catalog-live-runtime.test.ts src/commands/models/list.source-plan.test.ts extensions/opencode-go/index.test.ts extensions/nvidia/provider-catalog.test.ts - pnpm plugin-sdk:api:check - pnpm lint --threads=8 - pnpm run lint:extensions:bundled - pnpm run test:extensions:package-boundary:compile - pnpm check:import-cycles - pnpm exec oxfmt --check extensions/openai/openai-provider.ts extensions/openai/openai-provider.test.ts - git diff --check origin/main...HEAD - autoreview clean: no accepted/actionable findings reported - AWS Crabbox focused remote proof: run_364680d1bff8 / cbx_2456fffafe01 - Earlier same-PR AWS Crabbox live proof: run_1f05ccab368e / cbx_7375c79fcf9b Known proof gap: - Final current-code true live-provider smoke was blocked by Crabbox secret hydration, documented in the PR proof comment.
347 lines
11 KiB
TypeScript
347 lines
11 KiB
TypeScript
// Chutes tests cover models plugin behavior.
|
|
import { beforeEach, describe, expect, it, vi } from "vitest";
|
|
import {
|
|
buildChutesModelDefinition,
|
|
CHUTES_MODEL_CATALOG,
|
|
clearChutesModelCacheForTests,
|
|
discoverChutesModels,
|
|
} from "./models.js";
|
|
|
|
function restoreEnvVar(name: string, value: string | undefined): void {
|
|
if (value === undefined) {
|
|
delete process.env[name];
|
|
} else {
|
|
process.env[name] = value;
|
|
}
|
|
}
|
|
|
|
async function withLiveChutesDiscovery<T>(
|
|
fetchMock: ReturnType<typeof vi.fn>,
|
|
run: () => Promise<T>,
|
|
options?: { now?: string },
|
|
): Promise<T> {
|
|
const oldNodeEnv = process.env.NODE_ENV;
|
|
const oldVitest = process.env.VITEST;
|
|
delete process.env.NODE_ENV;
|
|
delete process.env.VITEST;
|
|
if (options?.now) {
|
|
vi.useFakeTimers();
|
|
vi.setSystemTime(new Date(options.now));
|
|
}
|
|
vi.stubGlobal("fetch", fetchMock);
|
|
|
|
try {
|
|
return await run();
|
|
} finally {
|
|
restoreEnvVar("NODE_ENV", oldNodeEnv);
|
|
restoreEnvVar("VITEST", oldVitest);
|
|
vi.unstubAllGlobals();
|
|
if (options?.now) {
|
|
vi.useRealTimers();
|
|
}
|
|
}
|
|
}
|
|
|
|
function createAuthEchoFetchMock() {
|
|
return vi.fn().mockImplementation((_url, init?: { headers?: HeadersInit }) => {
|
|
const auth = readAuthorizationHeader(init);
|
|
return Promise.resolve({
|
|
ok: true,
|
|
json: async () => ({
|
|
data: [{ id: auth ? `${auth}-model` : "public-model" }],
|
|
}),
|
|
});
|
|
});
|
|
}
|
|
|
|
function readAuthorizationHeader(init?: { headers?: HeadersInit }): string {
|
|
const headers = init?.headers;
|
|
if (headers instanceof Headers) {
|
|
return headers.get("Authorization") ?? "";
|
|
}
|
|
if (Array.isArray(headers)) {
|
|
return headers.find(([key]) => key.toLowerCase() === "authorization")?.[1] ?? "";
|
|
}
|
|
return headers?.Authorization ?? headers?.authorization ?? "";
|
|
}
|
|
|
|
function requireChutesModel(
|
|
models: Awaited<ReturnType<typeof discoverChutesModels>>,
|
|
index: number,
|
|
): Awaited<ReturnType<typeof discoverChutesModels>>[number] {
|
|
const model = models[index];
|
|
if (!model) {
|
|
throw new Error(`expected Chutes model at index ${index}`);
|
|
}
|
|
return model;
|
|
}
|
|
|
|
describe("chutes-models", () => {
|
|
beforeEach(() => {
|
|
clearChutesModelCacheForTests();
|
|
});
|
|
|
|
it("buildChutesModelDefinition returns config with required fields", () => {
|
|
const entry = CHUTES_MODEL_CATALOG[0];
|
|
const def = buildChutesModelDefinition(entry);
|
|
expect(def.id).toBe(entry.id);
|
|
expect(def.name).toBe(entry.name);
|
|
expect(def.reasoning).toBe(entry.reasoning);
|
|
expect(def.input).toEqual(entry.input);
|
|
expect(def.cost).toEqual(entry.cost);
|
|
expect(def.contextWindow).toBe(entry.contextWindow);
|
|
expect(def.maxTokens).toBe(entry.maxTokens);
|
|
if (!def.compat) {
|
|
throw new Error("expected Chutes model compat");
|
|
}
|
|
expect(def.compat.supportsUsageInStreaming).toBe(false);
|
|
});
|
|
|
|
it("keeps Qwen VL image limits in the runtime catalog", () => {
|
|
const visionModelIds = ["Qwen/Qwen2.5-VL-32B-Instruct", "Qwen/Qwen3-VL-235B-A22B-Instruct"];
|
|
for (const id of visionModelIds) {
|
|
const model = CHUTES_MODEL_CATALOG.find((candidate) => candidate.id === id);
|
|
expect(model).toBeDefined();
|
|
if (!model) {
|
|
throw new Error(`expected ${id}`);
|
|
}
|
|
expect(buildChutesModelDefinition(model).mediaInput).toEqual({
|
|
image: { maxPixels: 12845056, preferredSidePx: 2048, tokenMode: "provider" },
|
|
});
|
|
}
|
|
});
|
|
|
|
it("discoverChutesModels returns static catalog when accessToken is empty", async () => {
|
|
const models = await discoverChutesModels("");
|
|
expect(models).toHaveLength(CHUTES_MODEL_CATALOG.length);
|
|
expect(models.map((m) => m.id)).toEqual(CHUTES_MODEL_CATALOG.map((m) => m.id));
|
|
});
|
|
|
|
it("discoverChutesModels returns static catalog in test env by default", async () => {
|
|
const models = await discoverChutesModels("test-token");
|
|
expect(models).toHaveLength(CHUTES_MODEL_CATALOG.length);
|
|
expect(requireChutesModel(models, 0).id).toBe("Qwen/Qwen3-32B");
|
|
});
|
|
|
|
it("discoverChutesModels correctly maps API response when not in test env", async () => {
|
|
const mockFetch = vi.fn().mockResolvedValue({
|
|
ok: true,
|
|
json: async () => ({
|
|
data: [
|
|
{ id: "zai-org/GLM-4.7-TEE" },
|
|
{
|
|
id: "new-provider/new-model-r1",
|
|
supported_features: ["reasoning"],
|
|
input_modalities: ["text", "image"],
|
|
context_length: 200000,
|
|
max_output_length: 16384,
|
|
pricing: { prompt: 0.1, completion: 0.2 },
|
|
},
|
|
{ id: "new-provider/simple-model" },
|
|
],
|
|
}),
|
|
});
|
|
await withLiveChutesDiscovery(mockFetch, async () => {
|
|
const models = await discoverChutesModels("test-token-real-fetch");
|
|
expect(models.length).toBeGreaterThan(0);
|
|
if (models.length === 3) {
|
|
const firstModel = requireChutesModel(models, 0);
|
|
const secondModel = requireChutesModel(models, 1);
|
|
expect(firstModel.id).toBe("zai-org/GLM-4.7-TEE");
|
|
expect(secondModel.reasoning).toBe(true);
|
|
if (!secondModel.compat) {
|
|
throw new Error("expected Chutes API model compat");
|
|
}
|
|
expect(secondModel.compat.supportsUsageInStreaming).toBe(false);
|
|
}
|
|
});
|
|
});
|
|
|
|
it("falls back from malformed live token metadata", async () => {
|
|
const mockFetch = vi.fn().mockResolvedValue({
|
|
ok: true,
|
|
json: async () => ({
|
|
data: [
|
|
{
|
|
id: "provider/bad-window",
|
|
context_length: -1,
|
|
max_output_length: 16384.5,
|
|
},
|
|
{
|
|
id: "provider/bad-max-output",
|
|
context_length: Number.POSITIVE_INFINITY,
|
|
max_output_length: 0,
|
|
},
|
|
],
|
|
}),
|
|
});
|
|
|
|
await withLiveChutesDiscovery(mockFetch, async () => {
|
|
const models = await discoverChutesModels("malformed-token-metadata");
|
|
|
|
expect(requireChutesModel(models, 0)).toMatchObject({
|
|
id: "provider/bad-window",
|
|
contextWindow: 128000,
|
|
maxTokens: 4096,
|
|
});
|
|
expect(requireChutesModel(models, 1)).toMatchObject({
|
|
id: "provider/bad-max-output",
|
|
contextWindow: 128000,
|
|
maxTokens: 4096,
|
|
});
|
|
});
|
|
});
|
|
|
|
it("discoverChutesModels retries without auth on 401", async () => {
|
|
const mockFetch = vi.fn().mockImplementation((_url, init?: { headers?: HeadersInit }) => {
|
|
if (readAuthorizationHeader(init) === "Bearer test-token-error") {
|
|
return Promise.resolve({
|
|
ok: false,
|
|
status: 401,
|
|
});
|
|
}
|
|
return Promise.resolve({
|
|
ok: true,
|
|
json: async () => ({
|
|
data: [
|
|
{
|
|
id: "Qwen/Qwen3-32B",
|
|
name: "Qwen/Qwen3-32B",
|
|
supported_features: ["reasoning"],
|
|
input_modalities: ["text"],
|
|
context_length: 40960,
|
|
max_output_length: 40960,
|
|
pricing: { prompt: 0.08, completion: 0.24 },
|
|
},
|
|
{
|
|
id: "unsloth/Mistral-Nemo-Instruct-2407",
|
|
name: "unsloth/Mistral-Nemo-Instruct-2407",
|
|
input_modalities: ["text"],
|
|
context_length: 131072,
|
|
max_output_length: 131072,
|
|
pricing: { prompt: 0.02, completion: 0.04 },
|
|
},
|
|
{
|
|
id: "deepseek-ai/DeepSeek-V3-0324-TEE",
|
|
name: "deepseek-ai/DeepSeek-V3-0324-TEE",
|
|
supported_features: ["reasoning"],
|
|
input_modalities: ["text"],
|
|
context_length: 131072,
|
|
max_output_length: 65536,
|
|
pricing: { prompt: 0.28, completion: 0.42 },
|
|
},
|
|
],
|
|
}),
|
|
});
|
|
});
|
|
await withLiveChutesDiscovery(mockFetch, async () => {
|
|
const models = await discoverChutesModels("test-token-error");
|
|
expect(models.length).toBeGreaterThan(0);
|
|
expect(mockFetch).toHaveBeenCalled();
|
|
});
|
|
});
|
|
|
|
it("does not cache fallback static catalog for non-OK responses", async () => {
|
|
const mockFetch = vi.fn().mockResolvedValue({
|
|
ok: false,
|
|
status: 503,
|
|
});
|
|
|
|
await withLiveChutesDiscovery(mockFetch, async () => {
|
|
const first = await discoverChutesModels("chutes-fallback-token");
|
|
const second = await discoverChutesModels("chutes-fallback-token");
|
|
expect(first.map((m) => m.id)).toEqual(CHUTES_MODEL_CATALOG.map((m) => m.id));
|
|
expect(second.map((m) => m.id)).toEqual(CHUTES_MODEL_CATALOG.map((m) => m.id));
|
|
expect(mockFetch).toHaveBeenCalledTimes(2);
|
|
});
|
|
});
|
|
|
|
it("scopes discovery cache by access token", async () => {
|
|
const mockFetch = vi.fn().mockImplementation((_url, init?: { headers?: HeadersInit }) => {
|
|
const auth = readAuthorizationHeader(init);
|
|
if (auth === "Bearer chutes-token-a") {
|
|
return Promise.resolve({
|
|
ok: true,
|
|
json: async () => ({
|
|
data: [{ id: "private/model-a" }],
|
|
}),
|
|
});
|
|
}
|
|
if (auth === "Bearer chutes-token-b") {
|
|
return Promise.resolve({
|
|
ok: true,
|
|
json: async () => ({
|
|
data: [{ id: "private/model-b" }],
|
|
}),
|
|
});
|
|
}
|
|
return Promise.resolve({
|
|
ok: true,
|
|
json: async () => ({
|
|
data: [{ id: "public/model" }],
|
|
}),
|
|
});
|
|
});
|
|
await withLiveChutesDiscovery(mockFetch, async () => {
|
|
const modelsA = await discoverChutesModels("chutes-token-a");
|
|
const modelsB = await discoverChutesModels("chutes-token-b");
|
|
const modelsASecond = await discoverChutesModels("chutes-token-a");
|
|
expect(requireChutesModel(modelsA, 0).id).toBe("private/model-a");
|
|
expect(requireChutesModel(modelsB, 0).id).toBe("private/model-b");
|
|
expect(requireChutesModel(modelsASecond, 0).id).toBe("private/model-a");
|
|
expect(mockFetch).toHaveBeenCalledTimes(2);
|
|
});
|
|
});
|
|
|
|
it("evicts oldest token entries when cache reaches max size", async () => {
|
|
const mockFetch = createAuthEchoFetchMock();
|
|
|
|
await withLiveChutesDiscovery(mockFetch, async () => {
|
|
for (let i = 0; i < 150; i += 1) {
|
|
await discoverChutesModels(`cache-token-${i}`);
|
|
}
|
|
|
|
await discoverChutesModels("cache-token-0");
|
|
expect(mockFetch).toHaveBeenCalledTimes(151);
|
|
});
|
|
});
|
|
|
|
it("prunes expired token cache entries during subsequent discovery", async () => {
|
|
const mockFetch = createAuthEchoFetchMock();
|
|
|
|
await withLiveChutesDiscovery(
|
|
mockFetch,
|
|
async () => {
|
|
await discoverChutesModels("token-a");
|
|
vi.advanceTimersByTime(5 * 60 * 1000 + 1);
|
|
await discoverChutesModels("token-b");
|
|
await discoverChutesModels("token-a");
|
|
expect(mockFetch).toHaveBeenCalledTimes(3);
|
|
},
|
|
{ now: "2026-03-01T00:00:00.000Z" },
|
|
);
|
|
});
|
|
|
|
it("does not cache 401 fallback under the failed token key", async () => {
|
|
const mockFetch = vi.fn().mockImplementation((_url, init?: { headers?: HeadersInit }) => {
|
|
if (readAuthorizationHeader(init) === "Bearer failed-token") {
|
|
return Promise.resolve({
|
|
ok: false,
|
|
status: 401,
|
|
});
|
|
}
|
|
return Promise.resolve({
|
|
ok: true,
|
|
json: async () => ({
|
|
data: [{ id: "public/model" }],
|
|
}),
|
|
});
|
|
});
|
|
await withLiveChutesDiscovery(mockFetch, async () => {
|
|
await discoverChutesModels("failed-token");
|
|
await discoverChutesModels("failed-token");
|
|
expect(mockFetch).toHaveBeenCalledTimes(3);
|
|
});
|
|
});
|
|
});
|