mirror of
https://github.com/openclaw/openclaw.git
synced 2026-04-12 01:31:08 +00:00
docs(inferrs): fix Gemma model id from gg-hf-gg to google (#62586)
This commit is contained in:
@@ -23,7 +23,7 @@ backend, not a dedicated OpenClaw provider plugin.
|
||||
Example:
|
||||
|
||||
```bash
|
||||
- inferrs serve gg-hf-gg/gemma-4-E2B-it \
|
||||
+ inferrs serve google/gemma-4-E2B-it \
|
||||
--host 127.0.0.1 \
|
||||
--port 8080 \
|
||||
--device metal
|
||||
@@ -46,9 +46,9 @@ This example uses Gemma 4 on a local `inferrs` server.
|
||||
{
|
||||
agents: {
|
||||
defaults: {
|
||||
- model: { primary: "inferrs/gg-hf-gg/gemma-4-E2B-it" },
|
||||
+ model: { primary: "inferrs/google/gemma-4-E2B-it" },
|
||||
models: {
|
||||
- "inferrs/gg-hf-gg/gemma-4-E2B-it": {
|
||||
+ "inferrs/google/gemma-4-E2B-it": {
|
||||
alias: "Gemma 4 (inferrs)",
|
||||
},
|
||||
},
|
||||
@@ -63,7 +63,7 @@ This example uses Gemma 4 on a local `inferrs` server.
|
||||
api: "openai-completions",
|
||||
models: [
|
||||
{
|
||||
- id: "gg-hf-gg/gemma-4-E2B-it",
|
||||
+ id: "google/gemma-4-E2B-it",
|
||||
name: "Gemma 4 E2B (inferrs)",
|
||||
reasoning: false,
|
||||
input: ["text"],
|
||||
@@ -132,10 +132,10 @@ Once configured, test both layers:
|
||||
```bash
|
||||
curl http://127.0.0.1:8080/v1/chat/completions \
|
||||
-H 'content-type: application/json' \
|
||||
- -d '{"model":"gg-hf-gg/gemma-4-E2B-it","messages":[{"role":"user","content":"What is 2 + 2?"}],"stream":false}'
|
||||
+ -d '{"model":"google/gemma-4-E2B-it","messages":[{"role":"user","content":"What is 2 + 2?"}],"stream":false}'
|
||||
|
||||
openclaw infer model run \
|
||||
- --model inferrs/gg-hf-gg/gemma-4-E2B-it \
|
||||
+ --model inferrs/google/gemma-4-E2B-it \
|
||||
--prompt "What is 2 + 2? Reply with one short sentence." \
|
||||
--json
|
||||
```
|
||||
|
||||
@@ -1082,7 +1082,7 @@ describe("openai transport stream", () => {
|
||||
it("flattens pure text content arrays for string-only completions backends when opted in", () => {
|
||||
const params = buildOpenAICompletionsParams(
|
||||
{
|
||||
- id: "gg-hf-gg/gemma-4-E2B-it",
|
||||
+ id: "google/gemma-4-E2B-it",
|
||||
name: "Gemma 4 E2B",
|
||||
api: "openai-completions",
|
||||
provider: "inferrs",
|
||||
|
||||
@@ -567,11 +567,11 @@ describe("applyExtraParamsToAgent", () => {
|
||||
it("flattens pure text OpenAI completions message arrays for string-only compat models", () => {
|
||||
const payload = runResponsesPayloadMutationCase({
|
||||
applyProvider: "inferrs",
|
||||
- applyModelId: "gg-hf-gg/gemma-4-E2B-it",
|
||||
+ applyModelId: "google/gemma-4-E2B-it",
|
||||
model: {
|
||||
api: "openai-completions",
|
||||
|
||||
provider: "inferrs",
|
||||
- id: "gg-hf-gg/gemma-4-E2B-it",
|
||||
+ id: "google/gemma-4-E2B-it",
|
||||
name: "Gemma 4 E2B (inferrs)",
|
||||
baseUrl: "http://127.0.0.1:8080/v1",
|
||||
reasoning: false,
|
||||
|
||||
Reference in New Issue
Block a user