Files
openclaw/extensions/nvidia/provider-catalog.ts
Agustin Rivera 6fd4aa8a27 fix(nvidia): load featured model catalog (#80775)
* fix(nvidia): load featured model catalog

Co-authored-by: CaptainTimon <CaptainTimon@users.noreply.github.com>

* fix(nvidia): widen catalog fetch timeout

* fix(nvidia): cover catalog registration

* fix(picker): include provider catalog loader

* fix(nvidia): guard featured catalog fetch

* fix(nvidia): sync bundled catalog with live API

Replace minimaxai/minimax-m2.5 (MiniMax M2.5) with minimaxai/minimax-m2.7 (Minimax M2.7) and z-ai/glm5 (GLM-5) with z-ai/glm-5.1 (GLM 5.1) in the bundled fallback catalog to match NVIDIA's public featured-models endpoint.

Update docs table and all extension test expectations.

* fix(nvidia): retain shipped catalog refs

* fix(picker): keep alias catalog rows

* fix(nvidia): restore live catalog priority

---------

Co-authored-by: CaptainTimon <CaptainTimon@users.noreply.github.com>
2026-05-28 12:59:55 -07:00

251 lines
7.0 KiB
TypeScript

import { lookup as dnsLookup } from "node:dns/promises";
import { buildManifestModelProviderConfig } from "openclaw/plugin-sdk/provider-catalog-shared";
import type {
ModelDefinitionConfig,
ModelProviderConfig,
} from "openclaw/plugin-sdk/provider-model-shared";
import {
fetchWithSsrFGuard,
type LookupFn,
ssrfPolicyFromHttpBaseUrlAllowedHostname,
} from "openclaw/plugin-sdk/ssrf-runtime";
import manifest from "./openclaw.plugin.json" with { type: "json" };
export const NVIDIA_DEFAULT_MODEL_ID = "nvidia/nemotron-3-super-120b-a12b";
export const NVIDIA_FEATURED_MODELS_URL =
"https://assets.ngc.nvidia.com/products/api-catalog/featured-models.json";
const FEATURED_MODEL_CACHE_TTL_MS = 24 * 60 * 60 * 1000;
const FEATURED_MODEL_FETCH_TIMEOUT_MS = 10_000;
const FEATURED_MODEL_MAX_ROWS = 32;
const FEATURED_MODEL_MAX_ID_LENGTH = 200;
const FEATURED_MODEL_MAX_NAME_LENGTH = 200;
const FEATURED_MODEL_MAX_CONTEXT_WINDOW = 10_000_000;
const FEATURED_MODEL_MAX_OUTPUT_TOKENS = 1_000_000;
const FEATURED_MODEL_COST = {
input: 0,
output: 0,
cacheRead: 0,
cacheWrite: 0,
} as const;
type NvidiaFeaturedModel = {
model: string;
"model-name": string;
context: number;
"max-output": number;
};
let featuredModelCache:
| {
expiresAtMs: number;
models: ModelDefinitionConfig[];
}
| undefined;
let featuredModelRequest: Promise<ModelDefinitionConfig[] | null> | undefined;
type DnsLookupOptions = {
all?: boolean;
family?: number;
hints?: number;
order?: "ipv4first" | "ipv6first" | "verbatim";
verbatim?: boolean;
};
const lookupNvidiaFeaturedModelHostname = (async (
hostname: string,
options?: number | DnsLookupOptions,
) => {
if (typeof options === "object" && options !== null) {
return await dnsLookup(hostname, { ...options, family: 4 });
}
return await dnsLookup(hostname, { family: 4 });
}) as LookupFn;
export function buildNvidiaProvider(): ModelProviderConfig {
return {
...buildManifestModelProviderConfig({
providerId: "nvidia",
catalog: manifest.modelCatalog.providers.nvidia,
}),
apiKey: "NVIDIA_API_KEY",
};
}
export async function buildLiveNvidiaProvider(): Promise<ModelProviderConfig> {
const provider = buildNvidiaProvider();
const featuredModels = await loadNvidiaFeaturedModels();
if (!featuredModels || featuredModels.length === 0) {
return provider;
}
return {
...provider,
models: featuredModels,
};
}
export async function buildSelectableLiveNvidiaProvider(): Promise<ModelProviderConfig> {
const provider = buildNvidiaProvider();
const featuredModels = await loadNvidiaFeaturedModels();
if (!featuredModels || featuredModels.length === 0) {
return {
...provider,
models: [],
};
}
return {
...provider,
models: featuredModels,
};
}
export function clearNvidiaFeaturedModelCacheForTests() {
featuredModelCache = undefined;
featuredModelRequest = undefined;
}
async function loadNvidiaFeaturedModels(): Promise<ModelDefinitionConfig[] | null> {
const now = Date.now();
if (featuredModelCache && featuredModelCache.expiresAtMs > now) {
return featuredModelCache.models;
}
featuredModelRequest ??= fetchNvidiaFeaturedModels();
try {
const models = await featuredModelRequest;
if (models && models.length > 0) {
featuredModelCache = {
expiresAtMs: now + FEATURED_MODEL_CACHE_TTL_MS,
models,
};
}
return models;
} finally {
featuredModelRequest = undefined;
}
}
async function fetchNvidiaFeaturedModels(): Promise<ModelDefinitionConfig[] | null> {
try {
const { response, release } = await fetchWithSsrFGuard({
url: NVIDIA_FEATURED_MODELS_URL,
timeoutMs: FEATURED_MODEL_FETCH_TIMEOUT_MS,
requireHttps: true,
policy: ssrfPolicyFromHttpBaseUrlAllowedHostname(NVIDIA_FEATURED_MODELS_URL),
// The featured catalog is an NVIDIA-owned CloudFront URL. Some resolvers
// stall for seconds on the default all-family lookup; IPv4 pinning keeps
// the guarded fixed-host fetch on the fast path.
lookupFn: lookupNvidiaFeaturedModelHostname,
auditContext: "nvidia-featured-model-catalog",
});
try {
if (!response.ok) {
return null;
}
return parseNvidiaFeaturedModels(await response.json());
} finally {
await release();
}
} catch {
return null;
}
}
function parseNvidiaFeaturedModels(payload: unknown): ModelDefinitionConfig[] | null {
if (!payload || typeof payload !== "object") {
return null;
}
const rows = (payload as { "featured-models"?: unknown })["featured-models"];
if (!Array.isArray(rows)) {
return null;
}
const models = rows
.slice(0, FEATURED_MODEL_MAX_ROWS)
.map(parseNvidiaFeaturedModel)
.filter((model) => model !== null);
return models.length > 0 ? models : null;
}
function parseNvidiaFeaturedModel(row: unknown): ModelDefinitionConfig | null {
if (!row || typeof row !== "object") {
return null;
}
const entry = row as Partial<NvidiaFeaturedModel>;
if (
typeof entry.model !== "string" ||
typeof entry["model-name"] !== "string" ||
!isBoundedPositiveInteger(entry.context, FEATURED_MODEL_MAX_CONTEXT_WINDOW) ||
!isBoundedPositiveInteger(entry["max-output"], FEATURED_MODEL_MAX_OUTPUT_TOKENS)
) {
return null;
}
const id = normalizeNvidiaFeaturedModelId(entry.model);
const name = normalizeFeaturedModelName(entry["model-name"]);
if (!id || !name) {
return null;
}
return {
id,
name,
reasoning: false,
input: ["text"],
contextWindow: entry.context,
maxTokens: entry["max-output"],
cost: { ...FEATURED_MODEL_COST },
compat: {
requiresStringContent: true,
},
};
}
function normalizeNvidiaFeaturedModelId(model: string): string {
const trimmed = model.trim();
if (
!trimmed ||
trimmed.length > FEATURED_MODEL_MAX_ID_LENGTH ||
hasWhitespaceOrControlCharacter(trimmed)
) {
return "";
}
return trimmed.includes("/") ? trimmed : `nvidia/${trimmed}`;
}
function normalizeFeaturedModelName(name: string): string {
const trimmed = name.trim();
if (!trimmed || trimmed.length > FEATURED_MODEL_MAX_NAME_LENGTH || hasControlCharacter(trimmed)) {
return "";
}
return trimmed;
}
function isBoundedPositiveInteger(value: unknown, max: number): value is number {
return typeof value === "number" && Number.isInteger(value) && value > 0 && value <= max;
}
function hasWhitespaceOrControlCharacter(value: string): boolean {
for (const char of value) {
if (isAsciiWhitespaceOrControlCharacter(char)) {
return true;
}
}
return false;
}
function hasControlCharacter(value: string): boolean {
for (const char of value) {
if (isControlCharacter(char)) {
return true;
}
}
return false;
}
function isControlCharacter(char: string): boolean {
const code = char.charCodeAt(0);
return code <= 31 || code === 127;
}
function isAsciiWhitespaceOrControlCharacter(char: string): boolean {
const code = char.charCodeAt(0);
return code <= 32 || code === 127;
}