mirror of
https://github.com/openclaw/openclaw.git
synced 2026-04-12 09:41:11 +00:00
Mistral: enable reasoning_effort for mistral-small-latest
Made-with: Cursor
This commit is contained in:
committed by
Ayaan Zaidi
parent
de2182877a
commit
68bfc6fcf5
@@ -60,6 +60,7 @@ Docs: https://docs.openclaw.ai
|
||||
- Docker/plugins: stop forcing bundled plugin discovery to `/app/extensions` in runtime images so packaged installs use compiled `dist/extensions` artifacts again and Node 24 containers do not boot through source-only plugin entry paths. Fixes #62044. (#62316) Thanks @gumadeiras.
|
||||
- Cron: load `jobId` into `id` when the on-disk store omits `id`, matching doctor migration and fixing `unknown cron job id` for hand-edited `jobs.json`. (#62246) Thanks @neeravmakwana.
|
||||
- Agents/model fallback: classify minimal HTTP 404 API errors (for example `404 status code (no body)`) as `model_not_found` so assistant failures throw into the fallback chain instead of stopping at the first fallback candidate. (#62119) Thanks @neeravmakwana.
|
||||
- Providers/Mistral: send `reasoning_effort` for `mistral/mistral-small-latest` (Mistral Small 4) with thinking-level mapping, and mark the catalog entry as reasoning-capable so adjustable reasoning matches Mistral’s Chat Completions API. (#62162) Thanks @neeravmakwana.
|
||||
|
||||
## 2026.4.5
|
||||
|
||||
|
||||
@@ -33,15 +33,15 @@ openclaw onboard --mistral-api-key "$MISTRAL_API_KEY"
|
||||
|
||||
OpenClaw currently ships this bundled Mistral catalog:
|
||||
|
||||
| Model ref | Input | Context | Max output | Notes |
|
||||
| -------------------------------- | ----------- | ------- | ---------- | ------------------------ |
|
||||
| `mistral/mistral-large-latest` | text, image | 262,144 | 16,384 | Default model |
|
||||
| `mistral/mistral-medium-2508` | text, image | 262,144 | 8,192 | Mistral Medium 3.1 |
|
||||
| `mistral/mistral-small-latest` | text, image | 128,000 | 16,384 | Smaller multimodal model |
|
||||
| `mistral/pixtral-large-latest` | text, image | 128,000 | 32,768 | Pixtral |
|
||||
| `mistral/codestral-latest` | text | 256,000 | 4,096 | Coding |
|
||||
| `mistral/devstral-medium-latest` | text | 262,144 | 32,768 | Devstral 2 |
|
||||
| `mistral/magistral-small` | text | 128,000 | 40,000 | Reasoning-enabled |
|
||||
| Model ref | Input | Context | Max output | Notes |
|
||||
| -------------------------------- | ----------- | ------- | ---------- | ---------------------------------------------------------------- |
|
||||
| `mistral/mistral-large-latest` | text, image | 262,144 | 16,384 | Default model |
|
||||
| `mistral/mistral-medium-2508` | text, image | 262,144 | 8,192 | Mistral Medium 3.1 |
|
||||
| `mistral/mistral-small-latest` | text, image | 128,000 | 16,384 | Mistral Small 4; adjustable reasoning via API `reasoning_effort` |
|
||||
| `mistral/pixtral-large-latest` | text, image | 128,000 | 32,768 | Pixtral |
|
||||
| `mistral/codestral-latest` | text | 256,000 | 4,096 | Coding |
|
||||
| `mistral/devstral-medium-latest` | text | 262,144 | 32,768 | Devstral 2 |
|
||||
| `mistral/magistral-small` | text | 128,000 | 40,000 | Reasoning-enabled |
|
||||
|
||||
## Config snippet (audio transcription with Voxtral)
|
||||
|
||||
@@ -58,6 +58,17 @@ OpenClaw currently ships this bundled Mistral catalog:
|
||||
}
|
||||
```
|
||||
|
||||
## Adjustable reasoning (`mistral-small-latest`)
|
||||
|
||||
`mistral/mistral-small-latest` maps to Mistral Small 4 and supports [adjustable reasoning](https://docs.mistral.ai/capabilities/reasoning/adjustable) on the Chat Completions API via `reasoning_effort` (`none` minimizes extra thinking in the output; `high` surfaces full thinking traces before the final answer).
|
||||
|
||||
OpenClaw maps the session **thinking** level to Mistral’s API:
|
||||
|
||||
- **off** / **minimal** → `none`
|
||||
- **low** / **medium** / **high** / **xhigh** / **adaptive** → `high`
|
||||
|
||||
Other bundled Mistral catalog models do not use this parameter; keep using `magistral-*` models (for example `magistral-small`) when you want Mistral’s native reasoning-first behavior.
|
||||
|
||||
## Notes
|
||||
|
||||
- Mistral auth uses `MISTRAL_API_KEY`.
|
||||
|
||||
@@ -1,29 +1,65 @@
|
||||
import { describe, expect, it } from "vitest";
|
||||
import { applyMistralModelCompat } from "./api.js";
|
||||
import {
|
||||
applyMistralModelCompat,
|
||||
MISTRAL_MODEL_TRANSPORT_PATCH,
|
||||
MISTRAL_SMALL_LATEST_ID,
|
||||
resolveMistralCompatPatch,
|
||||
} from "./api.js";
|
||||
import { default as mistralPlugin } from "./index.js";
|
||||
|
||||
function supportsStore(model: { compat?: unknown }): boolean | undefined {
|
||||
return (model.compat as { supportsStore?: boolean } | undefined)?.supportsStore;
|
||||
function readCompat<T>(model: unknown): T | undefined {
|
||||
return (model as { compat?: T }).compat;
|
||||
}
|
||||
|
||||
function supportsReasoningEffort(model: { compat?: unknown }): boolean | undefined {
|
||||
return (model.compat as { supportsReasoningEffort?: boolean } | undefined)
|
||||
?.supportsReasoningEffort;
|
||||
function supportsStore(model: unknown): boolean | undefined {
|
||||
return readCompat<{ supportsStore?: boolean }>(model)?.supportsStore;
|
||||
}
|
||||
|
||||
function maxTokensField(model: {
|
||||
compat?: unknown;
|
||||
}): "max_completion_tokens" | "max_tokens" | undefined {
|
||||
return (model.compat as { maxTokensField?: "max_completion_tokens" | "max_tokens" } | undefined)
|
||||
function supportsReasoningEffort(model: unknown): boolean | undefined {
|
||||
return readCompat<{ supportsReasoningEffort?: boolean }>(model)?.supportsReasoningEffort;
|
||||
}
|
||||
|
||||
function maxTokensField(model: unknown): "max_completion_tokens" | "max_tokens" | undefined {
|
||||
return readCompat<{ maxTokensField?: "max_completion_tokens" | "max_tokens" }>(model)
|
||||
?.maxTokensField;
|
||||
}
|
||||
|
||||
function reasoningEffortMap(model: unknown): Record<string, string> | undefined {
|
||||
return readCompat<{ reasoningEffortMap?: Record<string, string> }>(model)?.reasoningEffortMap;
|
||||
}
|
||||
|
||||
describe("resolveMistralCompatPatch", () => {
|
||||
it("enables reasoning_effort mapping for mistral-small-latest", () => {
|
||||
expect(resolveMistralCompatPatch({ id: MISTRAL_SMALL_LATEST_ID })).toMatchObject({
|
||||
supportsStore: false,
|
||||
supportsReasoningEffort: true,
|
||||
maxTokensField: "max_tokens",
|
||||
reasoningEffortMap: expect.objectContaining({ high: "high", off: "none" }),
|
||||
});
|
||||
});
|
||||
|
||||
it("disables reasoning_effort for other Mistral model ids", () => {
|
||||
expect(resolveMistralCompatPatch({ id: "mistral-large-latest" })).toEqual({
|
||||
...MISTRAL_MODEL_TRANSPORT_PATCH,
|
||||
supportsReasoningEffort: false,
|
||||
});
|
||||
});
|
||||
});
|
||||
|
||||
describe("applyMistralModelCompat", () => {
|
||||
it("applies the Mistral request-shape compat flags", () => {
|
||||
const normalized = applyMistralModelCompat({});
|
||||
expect(supportsStore(normalized)).toBe(false);
|
||||
expect(supportsReasoningEffort(normalized)).toBe(false);
|
||||
expect(maxTokensField(normalized)).toBe("max_tokens");
|
||||
expect(reasoningEffortMap(normalized)).toBeUndefined();
|
||||
});
|
||||
|
||||
it("applies reasoning compat for mistral-small-latest", () => {
|
||||
const normalized = applyMistralModelCompat({ id: MISTRAL_SMALL_LATEST_ID });
|
||||
expect(supportsReasoningEffort(normalized)).toBe(true);
|
||||
expect(reasoningEffortMap(normalized)?.high).toBe("high");
|
||||
expect(reasoningEffortMap(normalized)?.off).toBe("none");
|
||||
});
|
||||
|
||||
it("overrides explicit compat values that would trigger 422s", () => {
|
||||
@@ -39,6 +75,20 @@ describe("applyMistralModelCompat", () => {
|
||||
expect(maxTokensField(normalized)).toBe("max_tokens");
|
||||
});
|
||||
|
||||
it("overrides explicit compat on mistral-small-latest except reasoning enablement", () => {
|
||||
const normalized = applyMistralModelCompat({
|
||||
id: MISTRAL_SMALL_LATEST_ID,
|
||||
compat: {
|
||||
supportsStore: true,
|
||||
supportsReasoningEffort: false,
|
||||
maxTokensField: "max_completion_tokens" as const,
|
||||
},
|
||||
});
|
||||
expect(supportsStore(normalized)).toBe(false);
|
||||
expect(supportsReasoningEffort(normalized)).toBe(true);
|
||||
expect(maxTokensField(normalized)).toBe("max_tokens");
|
||||
});
|
||||
|
||||
it("returns the same object when the compat patch is already present", () => {
|
||||
const model = {
|
||||
compat: {
|
||||
@@ -50,7 +100,15 @@ describe("applyMistralModelCompat", () => {
|
||||
expect(applyMistralModelCompat(model)).toBe(model);
|
||||
});
|
||||
|
||||
it("contributes Mistral compat for native, provider-family, and hinted custom routes", () => {
|
||||
it("returns the same object when mistral-small-latest compat is fully normalized", () => {
|
||||
const model = {
|
||||
id: MISTRAL_SMALL_LATEST_ID,
|
||||
compat: resolveMistralCompatPatch({ id: MISTRAL_SMALL_LATEST_ID }),
|
||||
};
|
||||
expect(applyMistralModelCompat(model)).toBe(model);
|
||||
});
|
||||
|
||||
it("contributes Mistral transport compat for native, provider-family, and hinted custom routes", () => {
|
||||
const registerProvider = (mistralPlugin as { register?: (api: unknown) => void }).register;
|
||||
let contributeResolvedModelCompat:
|
||||
| ((params: { modelId: string; model: Record<string, unknown> }) => unknown)
|
||||
@@ -74,7 +132,7 @@ describe("applyMistralModelCompat", () => {
|
||||
baseUrl: "https://proxy.example/v1",
|
||||
},
|
||||
}),
|
||||
).toBeDefined();
|
||||
).toEqual(MISTRAL_MODEL_TRANSPORT_PATCH);
|
||||
|
||||
expect(
|
||||
contributeResolvedModelCompat?.({
|
||||
@@ -85,7 +143,7 @@ describe("applyMistralModelCompat", () => {
|
||||
baseUrl: "https://api.mistral.ai/v1",
|
||||
},
|
||||
}),
|
||||
).toBeDefined();
|
||||
).toEqual(MISTRAL_MODEL_TRANSPORT_PATCH);
|
||||
|
||||
expect(
|
||||
contributeResolvedModelCompat?.({
|
||||
@@ -96,6 +154,6 @@ describe("applyMistralModelCompat", () => {
|
||||
baseUrl: "https://openrouter.ai/api/v1",
|
||||
},
|
||||
}),
|
||||
).toBeDefined();
|
||||
).toEqual(MISTRAL_MODEL_TRANSPORT_PATCH);
|
||||
});
|
||||
});
|
||||
|
||||
@@ -12,32 +12,97 @@ export {
|
||||
|
||||
const MISTRAL_MAX_TOKENS_FIELD = "max_tokens";
|
||||
|
||||
export const MISTRAL_MODEL_COMPAT_PATCH = {
|
||||
/** Transport-only flags merged for hinted Mistral routes; omits reasoning so `mistral-small-latest` is not clobbered after normalization. */
|
||||
export const MISTRAL_MODEL_TRANSPORT_PATCH = {
|
||||
supportsStore: false,
|
||||
supportsReasoningEffort: false,
|
||||
maxTokensField: MISTRAL_MAX_TOKENS_FIELD,
|
||||
} as const satisfies {
|
||||
supportsStore: boolean;
|
||||
supportsReasoningEffort: boolean;
|
||||
maxTokensField: "max_tokens";
|
||||
};
|
||||
|
||||
export function applyMistralModelCompat<T extends { compat?: unknown }>(model: T): T {
|
||||
/** Resolves to Mistral Chat Completions `reasoning_effort` (`none` | `high`). */
|
||||
export const MISTRAL_SMALL_LATEST_REASONING_EFFORT_MAP: Record<string, string> = {
|
||||
off: "none",
|
||||
minimal: "none",
|
||||
low: "high",
|
||||
medium: "high",
|
||||
high: "high",
|
||||
xhigh: "high",
|
||||
adaptive: "high",
|
||||
};
|
||||
|
||||
export const MISTRAL_SMALL_LATEST_ID = "mistral-small-latest";
|
||||
|
||||
function mistralReasoningCompatForModelId(modelId: string | undefined): {
|
||||
supportsReasoningEffort: boolean;
|
||||
reasoningEffortMap?: Record<string, string>;
|
||||
} {
|
||||
if (modelId === MISTRAL_SMALL_LATEST_ID) {
|
||||
return {
|
||||
supportsReasoningEffort: true,
|
||||
reasoningEffortMap: MISTRAL_SMALL_LATEST_REASONING_EFFORT_MAP,
|
||||
};
|
||||
}
|
||||
return { supportsReasoningEffort: false };
|
||||
}
|
||||
|
||||
export function resolveMistralCompatPatch(model: { id?: string }): {
|
||||
supportsStore: boolean;
|
||||
supportsReasoningEffort: boolean;
|
||||
maxTokensField: "max_tokens";
|
||||
reasoningEffortMap?: Record<string, string>;
|
||||
} {
|
||||
return {
|
||||
...MISTRAL_MODEL_TRANSPORT_PATCH,
|
||||
...mistralReasoningCompatForModelId(model.id),
|
||||
};
|
||||
}
|
||||
|
||||
function compatMatchesResolved(
|
||||
compat: Record<string, unknown> | undefined,
|
||||
modelId: string | undefined,
|
||||
): boolean {
|
||||
const expected = resolveMistralCompatPatch({ id: modelId });
|
||||
for (const [key, value] of Object.entries(expected)) {
|
||||
if (key === "reasoningEffortMap") {
|
||||
const a = compat?.[key];
|
||||
const b = value;
|
||||
if (a === b) {
|
||||
continue;
|
||||
}
|
||||
if (
|
||||
a &&
|
||||
b &&
|
||||
typeof a === "object" &&
|
||||
typeof b === "object" &&
|
||||
JSON.stringify(a) === JSON.stringify(b)
|
||||
) {
|
||||
continue;
|
||||
}
|
||||
return false;
|
||||
}
|
||||
if (compat?.[key] !== value) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
export function applyMistralModelCompat<T extends { compat?: unknown; id?: string }>(model: T): T {
|
||||
const compat =
|
||||
model.compat && typeof model.compat === "object"
|
||||
? (model.compat as Record<string, unknown>)
|
||||
: undefined;
|
||||
if (
|
||||
compat &&
|
||||
Object.entries(MISTRAL_MODEL_COMPAT_PATCH).every(([key, value]) => compat[key] === value)
|
||||
) {
|
||||
if (compatMatchesResolved(compat, model.id)) {
|
||||
return model;
|
||||
}
|
||||
const patch = resolveMistralCompatPatch(model);
|
||||
return {
|
||||
...model,
|
||||
compat: {
|
||||
...compat,
|
||||
...MISTRAL_MODEL_COMPAT_PATCH,
|
||||
...patch,
|
||||
} as T extends { compat?: infer TCompat } ? TCompat : never,
|
||||
} as T;
|
||||
}
|
||||
|
||||
@@ -1,7 +1,7 @@
|
||||
import { defineSingleProviderPluginEntry } from "openclaw/plugin-sdk/provider-entry";
|
||||
import { resolveProviderRequestCapabilities } from "openclaw/plugin-sdk/provider-http";
|
||||
import { readStringValue } from "openclaw/plugin-sdk/text-runtime";
|
||||
import { applyMistralModelCompat, MISTRAL_MODEL_COMPAT_PATCH } from "./api.js";
|
||||
import { applyMistralModelCompat, MISTRAL_MODEL_TRANSPORT_PATCH } from "./api.js";
|
||||
import { mistralMediaUnderstandingProvider } from "./media-understanding-provider.js";
|
||||
import { applyMistralConfig, MISTRAL_DEFAULT_MODEL_REF } from "./onboard.js";
|
||||
import { buildMistralProvider } from "./provider-catalog.js";
|
||||
@@ -94,7 +94,7 @@ export default defineSingleProviderPluginEntry({
|
||||
/\bmistral\b.*(?:input.*too long|token limit.*exceeded)/i.test(errorMessage),
|
||||
normalizeResolvedModel: ({ model }) => applyMistralModelCompat(model),
|
||||
contributeResolvedModelCompat: ({ modelId, model }) =>
|
||||
shouldContributeMistralCompat({ modelId, model }) ? MISTRAL_MODEL_COMPAT_PATCH : undefined,
|
||||
shouldContributeMistralCompat({ modelId, model }) ? MISTRAL_MODEL_TRANSPORT_PATCH : undefined,
|
||||
buildReplayPolicy: () => buildMistralReplayPolicy(),
|
||||
},
|
||||
register(api) {
|
||||
|
||||
@@ -41,6 +41,13 @@ describe("mistral model definitions", () => {
|
||||
contextWindow: 128000,
|
||||
maxTokens: 40000,
|
||||
}),
|
||||
expect.objectContaining({
|
||||
id: "mistral-small-latest",
|
||||
reasoning: true,
|
||||
input: ["text", "image"],
|
||||
contextWindow: 128000,
|
||||
maxTokens: 16384,
|
||||
}),
|
||||
expect.objectContaining({
|
||||
id: "pixtral-large-latest",
|
||||
input: ["text", "image"],
|
||||
|
||||
@@ -61,7 +61,7 @@ const MISTRAL_MODEL_CATALOG = [
|
||||
{
|
||||
id: "mistral-small-latest",
|
||||
name: "Mistral Small (latest)",
|
||||
reasoning: false,
|
||||
reasoning: true,
|
||||
input: ["text", "image"],
|
||||
cost: { input: 0.1, output: 0.3, cacheRead: 0, cacheWrite: 0 },
|
||||
contextWindow: 128000,
|
||||
|
||||
Reference in New Issue
Block a user