{ "id": "cerebras", "activation": { "onStartup": false }, "enabledByDefault": true, "providers": ["cerebras"], "providerEndpoints": [ { "endpointClass": "cerebras-native", "hosts": ["api.cerebras.ai"] } ], "providerRequest": { "providers": { "cerebras": { "family": "cerebras" } } }, "modelCatalog": { "providers": { "cerebras": { "baseUrl": "https://api.cerebras.ai/v1", "api": "openai-completions", "models": [ { "id": "zai-glm-4.7", "name": "Z.ai GLM 4.7", "input": ["text"], "reasoning": true, "contextWindow": 128000, "maxTokens": 8192, "cost": { "input": 2.25, "output": 2.75, "cacheRead": 2.25, "cacheWrite": 2.75 } }, { "id": "gpt-oss-120b", "name": "GPT OSS 120B", "input": ["text"], "reasoning": true, "contextWindow": 128000, "maxTokens": 8192, "cost": { "input": 0.35, "output": 0.75, "cacheRead": 0.35, "cacheWrite": 0.75 } }, { "id": "qwen-3-235b-a22b-instruct-2507", "name": "Qwen 3 235B Instruct", "input": ["text"], "contextWindow": 128000, "maxTokens": 8192, "cost": { "input": 0.6, "output": 1.2, "cacheRead": 0.6, "cacheWrite": 1.2 } }, { "id": "llama3.1-8b", "name": "Llama 3.1 8B", "input": ["text"], "contextWindow": 128000, "maxTokens": 8192, "cost": { "input": 0.1, "output": 0.1, "cacheRead": 0.1, "cacheWrite": 0.1 } } ] } }, "discovery": { "cerebras": "static" } }, "providerAuthEnvVars": { "cerebras": ["CEREBRAS_API_KEY"] }, "providerAuthChoices": [ { "provider": "cerebras", "method": "api-key", "choiceId": "cerebras-api-key", "choiceLabel": "Cerebras API key", "groupId": "cerebras", "groupLabel": "Cerebras", "groupHint": "Fast OpenAI-compatible inference", "optionKey": "cerebrasApiKey", "cliFlag": "--cerebras-api-key", "cliOption": "--cerebras-api-key <key>", "cliDescription": "Cerebras API key" } ], "configSchema": { "type": "object", "additionalProperties": false, "properties": {} } }