import type { ModelDefinitionConfig } from
"openclaw/plugin-sdk/provider-model-shared" ;
import { createSubsystemLogger, retryAsync } from "openclaw/plugin-sdk/runtime-env" ;
import { fetchWithSsrFGuard } from "openclaw/plugin-sdk/ssrf-runtime" ;
import { normalizeLowercaseStringOrEmpty } from "openclaw/plugin-sdk/text-runtime" ;
/** Subsystem logger for this module, registered under the "venice-models" name. */
const log = createSubsystemLogger("venice-models");
/**
 * Base URL of the Venice API. Endpoint paths such as `/models` are appended
 * directly, so the value must not carry trailing whitespace or a trailing slash.
 */
export const VENICE_BASE_URL = "https://api.venice.ai/api/v1";

/** Id of the default Venice model; the static catalog contains an entry with this id. */
export const VENICE_DEFAULT_MODEL_ID = "kimi-k2-5";

/** Default model reference: the default model id prefixed with `venice/`. */
export const VENICE_DEFAULT_MODEL_REF = `venice/${VENICE_DEFAULT_MODEL_ID}`;

/** Hostnames passed as `allowedHostnames` in the SSRF guard policy for discovery requests. */
const VENICE_ALLOWED_HOSTNAMES = ["api.venice.ai"];
/** Cost table assigned to every model definition built in this module; all rates are zero. */
export const VENICE_DEFAULT_COST = { input: 0, output: 0, cacheRead: 0, cacheWrite: 0 };
/** Context window used when the API does not report a usable `availableContextTokens`. */
const VENICE_DEFAULT_CONTEXT_WINDOW = 128_000;

/** Max output tokens used for discovered models when the API reports no usable limit. */
const VENICE_DEFAULT_MAX_TOKENS = 4096;

/** Upper bound applied to API-reported completion limits for models missing from the catalog. */
const VENICE_DISCOVERY_HARD_MAX_TOKENS = 131_072;

/** Timeout, in milliseconds, applied to each discovery request attempt. */
const VENICE_DISCOVERY_TIMEOUT_MS = 10_000;

/** HTTP status codes that make a discovery attempt eligible for a retry. */
const VENICE_DISCOVERY_RETRYABLE_HTTP_STATUS = new Set([408, 425, 429, 500, 502, 503, 504]);

/** Error `code`/`errno` strings that mark a network failure as retryable. */
const VENICE_DISCOVERY_RETRYABLE_NETWORK_CODES = new Set([
  "ECONNABORTED",
  "ECONNREFUSED",
  "ECONNRESET",
  "EAI_AGAIN",
  "ENETDOWN",
  "ENETUNREACH",
  "ENOTFOUND",
  "ETIMEDOUT",
  "UND_ERR_BODY_TIMEOUT",
  "UND_ERR_CONNECT_TIMEOUT",
  "UND_ERR_CONNECT_ERROR",
  "UND_ERR_HEADERS_TIMEOUT",
  "UND_ERR_SOCKET",
]);
/**
 * Static catalog of Venice models. It is the fallback whenever live discovery
 * is skipped or fails, and the source of metadata for discovered models whose
 * id matches an entry here.
 *
 * Entries tagged `privacy: "private"` come first, followed by the
 * `privacy: "anonymized"` ones. `supportsTools` is present only on entries that
 * set it to `false`.
 */
export const VENICE_MODEL_CATALOG = [
  // ---- privacy: "private" ----
  {
    id: "llama-3.3-70b",
    name: "Llama 3.3 70B",
    reasoning: false,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 4_096,
    privacy: "private",
  },
  {
    id: "llama-3.2-3b",
    name: "Llama 3.2 3B",
    reasoning: false,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 4_096,
    privacy: "private",
  },
  {
    id: "hermes-3-llama-3.1-405b",
    name: "Hermes 3 Llama 3.1 405B",
    reasoning: false,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 16_384,
    supportsTools: false,
    privacy: "private",
  },
  {
    id: "qwen3-235b-a22b-thinking-2507",
    name: "Qwen3 235B Thinking",
    reasoning: true,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "qwen3-235b-a22b-instruct-2507",
    name: "Qwen3 235B Instruct",
    reasoning: false,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "qwen3-coder-480b-a35b-instruct",
    name: "Qwen3 Coder 480B",
    reasoning: false,
    input: ["text"],
    contextWindow: 256_000,
    maxTokens: 65_536,
    privacy: "private",
  },
  {
    id: "qwen3-coder-480b-a35b-instruct-turbo",
    name: "Qwen3 Coder 480B Turbo",
    reasoning: false,
    input: ["text"],
    contextWindow: 256_000,
    maxTokens: 65_536,
    privacy: "private",
  },
  {
    id: "qwen3-5-35b-a3b",
    name: "Qwen3.5 35B A3B",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 256_000,
    maxTokens: 65_536,
    privacy: "private",
  },
  {
    id: "qwen3-next-80b",
    name: "Qwen3 Next 80B",
    reasoning: false,
    input: ["text"],
    contextWindow: 256_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "qwen3-vl-235b-a22b",
    name: "Qwen3 VL 235B (Vision)",
    reasoning: false,
    input: ["text", "image"],
    contextWindow: 256_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "qwen3-4b",
    name: "Venice Small (Qwen3 4B)",
    reasoning: true,
    input: ["text"],
    contextWindow: 32_000,
    maxTokens: 4_096,
    privacy: "private",
  },
  {
    id: "deepseek-v3.2",
    name: "DeepSeek V3.2",
    reasoning: true,
    input: ["text"],
    contextWindow: 160_000,
    maxTokens: 32_768,
    supportsTools: false,
    privacy: "private",
  },
  {
    id: "venice-uncensored",
    name: "Venice Uncensored (Dolphin-Mistral)",
    reasoning: false,
    input: ["text"],
    contextWindow: 32_000,
    maxTokens: 4_096,
    supportsTools: false,
    privacy: "private",
  },
  {
    id: "mistral-31-24b",
    name: "Venice Medium (Mistral)",
    reasoning: false,
    input: ["text", "image"],
    contextWindow: 128_000,
    maxTokens: 4_096,
    privacy: "private",
  },
  {
    id: "google-gemma-3-27b-it",
    name: "Google Gemma 3 27B Instruct",
    reasoning: false,
    input: ["text", "image"],
    contextWindow: 198_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "openai-gpt-oss-120b",
    name: "OpenAI GPT OSS 120B",
    reasoning: false,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "nvidia-nemotron-3-nano-30b-a3b",
    name: "NVIDIA Nemotron 3 Nano 30B",
    reasoning: false,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "olafangensan-glm-4.7-flash-heretic",
    name: "GLM 4.7 Flash Heretic",
    reasoning: true,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 24_000,
    privacy: "private",
  },
  {
    id: "zai-org-glm-4.6",
    name: "GLM 4.6",
    reasoning: false,
    input: ["text"],
    contextWindow: 198_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "zai-org-glm-4.7",
    name: "GLM 4.7",
    reasoning: true,
    input: ["text"],
    contextWindow: 198_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "zai-org-glm-4.7-flash",
    name: "GLM 4.7 Flash",
    reasoning: true,
    input: ["text"],
    contextWindow: 128_000,
    maxTokens: 16_384,
    privacy: "private",
  },
  {
    id: "zai-org-glm-5",
    name: "GLM 5",
    reasoning: true,
    input: ["text"],
    contextWindow: 198_000,
    maxTokens: 32_000,
    privacy: "private",
  },
  {
    id: "kimi-k2-5",
    name: "Kimi K2.5",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 256_000,
    maxTokens: 65_536,
    privacy: "private",
  },
  {
    id: "kimi-k2-thinking",
    name: "Kimi K2 Thinking",
    reasoning: true,
    input: ["text"],
    contextWindow: 256_000,
    maxTokens: 65_536,
    privacy: "private",
  },
  {
    id: "minimax-m21",
    name: "MiniMax M2.1",
    reasoning: true,
    input: ["text"],
    contextWindow: 198_000,
    maxTokens: 32_768,
    privacy: "private",
  },
  {
    id: "minimax-m25",
    name: "MiniMax M2.5",
    reasoning: true,
    input: ["text"],
    contextWindow: 198_000,
    maxTokens: 32_768,
    privacy: "private",
  },

  // ---- privacy: "anonymized" ----
  {
    id: "claude-opus-4-5",
    name: "Claude Opus 4.5 (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 198_000,
    maxTokens: 32_768,
    privacy: "anonymized",
  },
  {
    id: "claude-opus-4-6",
    name: "Claude Opus 4.6 (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 1_000_000,
    maxTokens: 128_000,
    privacy: "anonymized",
  },
  {
    id: "claude-sonnet-4-5",
    name: "Claude Sonnet 4.5 (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 198_000,
    maxTokens: 64_000,
    privacy: "anonymized",
  },
  {
    id: "claude-sonnet-4-6",
    name: "Claude Sonnet 4.6 (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 1_000_000,
    maxTokens: 64_000,
    privacy: "anonymized",
  },
  {
    id: "openai-gpt-52",
    name: "GPT-5.2 (via Venice)",
    reasoning: true,
    input: ["text"],
    contextWindow: 256_000,
    maxTokens: 65_536,
    privacy: "anonymized",
  },
  {
    id: "openai-gpt-52-codex",
    name: "GPT-5.2 Codex (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 256_000,
    maxTokens: 65_536,
    privacy: "anonymized",
  },
  {
    id: "openai-gpt-53-codex",
    name: "GPT-5.3 Codex (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 400_000,
    maxTokens: 128_000,
    privacy: "anonymized",
  },
  {
    id: "openai-gpt-54",
    name: "GPT-5.4 (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 1_000_000,
    maxTokens: 131_072,
    privacy: "anonymized",
  },
  {
    id: "openai-gpt-4o-2024-11-20",
    name: "GPT-4o (via Venice)",
    reasoning: false,
    input: ["text", "image"],
    contextWindow: 128_000,
    maxTokens: 16_384,
    privacy: "anonymized",
  },
  {
    id: "openai-gpt-4o-mini-2024-07-18",
    name: "GPT-4o Mini (via Venice)",
    reasoning: false,
    input: ["text", "image"],
    contextWindow: 128_000,
    maxTokens: 16_384,
    privacy: "anonymized",
  },
  {
    id: "gemini-3-pro-preview",
    name: "Gemini 3 Pro (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 198_000,
    maxTokens: 32_768,
    privacy: "anonymized",
  },
  {
    id: "gemini-3-1-pro-preview",
    name: "Gemini 3.1 Pro (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 1_000_000,
    maxTokens: 32_768,
    privacy: "anonymized",
  },
  {
    id: "gemini-3-flash-preview",
    name: "Gemini 3 Flash (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 256_000,
    maxTokens: 65_536,
    privacy: "anonymized",
  },
  {
    id: "grok-41-fast",
    name: "Grok 4.1 Fast (via Venice)",
    reasoning: true,
    input: ["text", "image"],
    contextWindow: 1_000_000,
    maxTokens: 30_000,
    privacy: "anonymized",
  },
  {
    id: "grok-code-fast-1",
    name: "Grok Code Fast 1 (via Venice)",
    reasoning: true,
    input: ["text"],
    contextWindow: 256_000,
    maxTokens: 10_000,
    privacy: "anonymized",
  },
] as const;

/** Union of the literal entry types held by {@link VENICE_MODEL_CATALOG}. */
export type VeniceCatalogEntry = (typeof VENICE_MODEL_CATALOG)[number];
/**
 * Converts a static catalog entry into a model definition.
 *
 * The result always uses the shared zero-cost table and reports
 * `supportsUsageInStreaming: false`. `supportsTools: false` is added only when
 * the entry carries a falsy `supportsTools` property.
 *
 * @param entry - Catalog entry to convert.
 * @returns A new definition; `input` is a fresh array copied from the entry.
 */
export function buildVeniceModelDefinition(entry: VeniceCatalogEntry): ModelDefinitionConfig {
  const { id, name, reasoning, contextWindow, maxTokens } = entry;
  const toolsDisabled = "supportsTools" in entry && !entry.supportsTools;

  return {
    id,
    name,
    reasoning,
    input: [...entry.input],
    cost: VENICE_DEFAULT_COST,
    contextWindow,
    maxTokens,
    compat: toolsDisabled
      ? { supportsUsageInStreaming: false, supportsTools: false }
      : { supportsUsageInStreaming: false },
  };
}
/** `model_spec` object attached to a model in the Venice `/models` response, as read by this module. */
interface VeniceModelSpec {
  /** Display name; discovery falls back to the model id when it is missing. */
  name: string;
  privacy: "private" | "anonymized";
  /** Context window reported by the API, if any. */
  availableContextTokens?: number;
  /** Completion-token limit reported by the API, if any. */
  maxCompletionTokens?: number;
  /** Optional capability flags; each flag may be absent. */
  capabilities?: {
    supportsReasoning?: boolean;
    supportsVision?: boolean;
    supportsFunctionCalling?: boolean;
  };
}
/** One element of the `data` array in the Venice `/models` response. */
interface VeniceModel {
  /** Model id; matched against the static catalog ids during discovery. */
  id: string;
  /** Optional model metadata. */
  model_spec?: VeniceModelSpec;
}
/** Top-level JSON body expected from the Venice `/models` endpoint. */
interface VeniceModelsResponse {
  /** Models listed by the API. */
  data: VeniceModel[];
}
/**
 * Error describing a non-OK HTTP response received during discovery.
 * The message has the form `HTTP <status>`.
 */
class VeniceDiscoveryHttpError extends Error {
  /**
   * @param status - HTTP status code of the failed response, exposed as `status`.
   */
  constructor(readonly status: number) {
    super(`HTTP ${status}`);
    this.name = "VeniceDiscoveryHttpError";
  }
}
/** Builds a fresh list of model definitions from every entry of the static catalog. */
function staticVeniceModelDefinitions(): ModelDefinitionConfig[] {
  return VENICE_MODEL_CATALOG.map((entry) => buildVeniceModelDefinition(entry));
}
/**
 * Reports whether an error, or anything reachable from it through `cause` or
 * an `errors` array, carries a retryable network code.
 *
 * Traversal is breadth-first. Each object is inspected at most once, so cyclic
 * error chains terminate. A node's code is its string `code`, otherwise its
 * string `errno`.
 *
 * @param err - Value to inspect; non-object values never match.
 * @returns `true` as soon as a retryable code is found, otherwise `false`.
 */
function hasRetryableNetworkCode(err: unknown): boolean {
  const pending: unknown[] = [err];
  const visited = new Set<unknown>();

  // The list only grows, so a cursor visits nodes in insertion (breadth-first) order.
  for (let cursor = 0; cursor < pending.length; cursor += 1) {
    const node = pending[cursor];
    if (typeof node !== "object" || node === null || visited.has(node)) {
      continue;
    }
    visited.add(node);

    const record = node as {
      cause?: unknown;
      errors?: unknown;
      code?: unknown;
      errno?: unknown;
    };

    let networkCode: string | undefined;
    if (typeof record.code === "string") {
      networkCode = record.code;
    } else if (typeof record.errno === "string") {
      networkCode = record.errno;
    }
    if (networkCode && VENICE_DISCOVERY_RETRYABLE_NETWORK_CODES.has(networkCode)) {
      return true;
    }

    if (record.cause) {
      pending.push(record.cause);
    }
    if (Array.isArray(record.errors)) {
      for (const nested of record.errors) {
        pending.push(nested);
      }
    }
  }

  return false;
}
/**
 * Decides whether a failed discovery attempt should be retried.
 *
 * Retryable failures are:
 * - a `VeniceDiscoveryHttpError`;
 * - an aborted or timed-out request (`AbortError` or `TimeoutError`);
 * - a `TypeError` whose message is "fetch failed" (compared after normalization);
 * - any error carrying a retryable network code, directly or via `cause`/`errors`.
 *
 * @param err - The value thrown by a discovery attempt.
 * @returns `true` when another attempt is worthwhile.
 */
function isRetryableVeniceDiscoveryError(err: unknown): boolean {
  if (err instanceof VeniceDiscoveryHttpError) {
    return true;
  }
  // A signal created by AbortSignal.timeout() aborts with a "TimeoutError"
  // DOMException rather than "AbortError", so both names must be accepted for
  // request timeouts to be retried.
  if (err instanceof Error && (err.name === "AbortError" || err.name === "TimeoutError")) {
    return true;
  }
  if (err instanceof TypeError && normalizeLowercaseStringOrEmpty(err.message) === "fetch failed") {
    return true;
  }
  return hasRetryableNetworkCode(err);
}
/**
 * Normalizes an untrusted value to a positive integer.
 *
 * The value is floored before the positivity check, so fractions in (0, 1) are
 * rejected instead of being returned as `0`.
 *
 * @param value - Candidate value, typically taken from parsed JSON.
 * @returns The floored value when it is a finite number of at least 1, otherwise `undefined`.
 */
function normalizePositiveInt(value: unknown): number | undefined {
  if (typeof value !== "number" || !Number.isFinite(value)) {
    return undefined;
  }
  const floored = Math.floor(value);
  return floored >= 1 ? floored : undefined;
}
/**
 * Derives the max-output-token value to use for a model from the API response.
 *
 * The API-reported completion limit is clamped by the smallest of:
 * - the API-reported context window, or, when that is unusable, the known
 *   catalog limit, or, failing both, the default context window;
 * - the known catalog limit, or the discovery hard cap when no catalog limit is known.
 *
 * @param params.apiModel - Model entry from the API response.
 * @param params.knownMaxTokens - Max tokens from the static catalog, when the model is listed there.
 * @returns The clamped limit, or `undefined` when the API reports no usable completion limit.
 */
function resolveApiMaxCompletionTokens(params: {
  apiModel: VeniceModel;
  knownMaxTokens?: number;
}): number | undefined {
  const spec = params.apiModel.model_spec;

  const apiLimit = normalizePositiveInt(spec?.maxCompletionTokens);
  if (!apiLimit) {
    return undefined;
  }

  const apiContextWindow = normalizePositiveInt(spec?.availableContextTokens);

  let catalogLimit: number | undefined;
  if (typeof params.knownMaxTokens === "number" && Number.isFinite(params.knownMaxTokens)) {
    catalogLimit = Math.floor(params.knownMaxTokens);
  }

  const contextCeiling = apiContextWindow ?? catalogLimit ?? VENICE_DEFAULT_CONTEXT_WINDOW;
  const outputCeiling = catalogLimit ?? VENICE_DISCOVERY_HARD_MAX_TOKENS;
  return Math.min(apiLimit, contextCeiling, outputCeiling);
}
/**
 * Reads the function-calling capability flag from an API model entry.
 *
 * @param apiModel - Model entry from the API response.
 * @returns The flag when it is a boolean; `undefined` when it is missing or of another type.
 */
function resolveApiSupportsTools(apiModel: VeniceModel): boolean | undefined {
  const flag = apiModel.model_spec?.capabilities?.supportsFunctionCalling;
  if (typeof flag === "boolean") {
    return flag;
  }
  return undefined;
}
/** Options accepted by `discoverVeniceModels`. */
type VeniceModelDiscoveryOptions = {
  /**
   * Fixed delay between retry attempts, in milliseconds. When set, it is used
   * as both the minimum and maximum delay and jitter is disabled.
   */
  retryDelayMs?: number;
};
/**
 * Discovers the models offered by the Venice API.
 *
 * Behavior:
 * - When `NODE_ENV` is "test" or `VITEST` is set, no request is made and the
 *   static catalog is returned.
 * - Otherwise `GET {VENICE_BASE_URL}/models` is issued through the SSRF guard
 *   with a per-attempt timeout, for up to 3 attempts on retryable failures.
 * - Models whose id matches a catalog entry reuse the catalog metadata; the API
 *   may only override `maxTokens` and disable tool support.
 * - Unknown models are described from the API metadata, with defaults for
 *   missing values.
 * - Entries that are not objects with a non-empty string `id` are skipped.
 *
 * This function does not throw. Any failure (HTTP error, network error,
 * malformed body, empty result) is logged and the static catalog is returned.
 *
 * @param options - Optional retry tuning; see `retryDelayMs`.
 * @returns The discovered model definitions, or the static catalog as a fallback.
 */
export async function discoverVeniceModels(
  options: VeniceModelDiscoveryOptions = {},
): Promise<ModelDefinitionConfig[]> {
  if (process.env.NODE_ENV === "test" || process.env.VITEST) {
    return staticVeniceModelDefinitions();
  }

  try {
    const { response, release } = await retryAsync(
      async () => {
        const result = await fetchWithSsrFGuard({
          url: `${VENICE_BASE_URL}/models`,
          signal: AbortSignal.timeout(VENICE_DISCOVERY_TIMEOUT_MS),
          init: {
            headers: {
              Accept: "application/json",
            },
          },
          policy: { allowedHostnames: VENICE_ALLOWED_HOSTNAMES },
          auditContext: "venice-model-discovery",
        });
        const currentResponse = result.response;
        if (
          !currentResponse.ok &&
          VENICE_DISCOVERY_RETRYABLE_HTTP_STATUS.has(currentResponse.status)
        ) {
          // Release this attempt's resources before signalling a retry.
          await result.release();
          throw new VeniceDiscoveryHttpError(currentResponse.status);
        }
        return result;
      },
      {
        attempts: 3,
        minDelayMs: options.retryDelayMs ?? 300,
        maxDelayMs: options.retryDelayMs ?? 2000,
        // An explicit retry delay is used verbatim, so jitter is disabled for it.
        jitter: options.retryDelayMs === undefined ? 0.2 : 0,
        label: "venice-model-discovery",
        shouldRetry: isRetryableVeniceDiscoveryError,
      },
    );

    try {
      if (!response.ok) {
        log.warn(`Failed to discover models: HTTP ${response.status}, using static catalog`);
        return staticVeniceModelDefinitions();
      }

      // The body is untrusted JSON: validate its shape instead of relying on the cast.
      const payload = (await response.json()) as Partial<VeniceModelsResponse> | null;
      const entries: unknown = payload?.data;
      if (!Array.isArray(entries) || entries.length === 0) {
        log.warn("No models found from API, using static catalog");
        return staticVeniceModelDefinitions();
      }

      const catalogById = new Map<string, VeniceCatalogEntry>(
        VENICE_MODEL_CATALOG.map((m) => [m.id, m]),
      );
      const models: ModelDefinitionConfig[] = [];
      let skippedEntries = 0;

      for (const candidate of entries as unknown[]) {
        const candidateId =
          typeof candidate === "object" && candidate !== null
            ? (candidate as { id?: unknown }).id
            : undefined;
        if (typeof candidateId !== "string" || candidateId.length === 0) {
          // One malformed entry must not discard the rest of the response.
          skippedEntries += 1;
          continue;
        }
        const apiModel = candidate as VeniceModel;

        const catalogEntry = catalogById.get(apiModel.id);
        const apiMaxTokens = resolveApiMaxCompletionTokens({
          apiModel,
          knownMaxTokens: catalogEntry?.maxTokens,
        });
        const apiSupportsTools = resolveApiSupportsTools(apiModel);

        if (catalogEntry) {
          // Known model: keep the catalog metadata and apply API overrides.
          const definition = buildVeniceModelDefinition(catalogEntry);
          if (apiMaxTokens !== undefined) {
            definition.maxTokens = apiMaxTokens;
          }
          if (apiSupportsTools === false) {
            definition.compat = {
              ...definition.compat,
              supportsTools: false,
            };
          }
          models.push(definition);
          continue;
        }

        // Unknown model: describe it from API metadata, with defaults for gaps.
        const apiSpec = apiModel.model_spec;
        const lowerModelId = normalizeLowercaseStringOrEmpty(apiModel.id);
        const isReasoning =
          apiSpec?.capabilities?.supportsReasoning === true ||
          lowerModelId.includes("thinking") ||
          lowerModelId.includes("reason") ||
          lowerModelId.includes("r1");
        const hasVision = apiSpec?.capabilities?.supportsVision === true;
        const displayName =
          typeof apiSpec?.name === "string" && apiSpec.name.length > 0
            ? apiSpec.name
            : apiModel.id;

        models.push({
          id: apiModel.id,
          name: displayName,
          reasoning: isReasoning,
          input: hasVision ? ["text", "image"] : ["text"],
          cost: VENICE_DEFAULT_COST,
          contextWindow:
            normalizePositiveInt(apiSpec?.availableContextTokens) ??
            VENICE_DEFAULT_CONTEXT_WINDOW,
          maxTokens: apiMaxTokens ?? VENICE_DEFAULT_MAX_TOKENS,
          compat: {
            supportsUsageInStreaming: false,
            ...(apiSupportsTools === false ? { supportsTools: false } : {}),
          },
        });
      }

      if (skippedEntries > 0) {
        log.warn(`Skipped ${skippedEntries} malformed model entries from API`);
      }
      return models.length > 0 ? models : staticVeniceModelDefinitions();
    } finally {
      await release();
    }
  } catch (error) {
    if (error instanceof VeniceDiscoveryHttpError) {
      log.warn(`Failed to discover models: HTTP ${error.status}, using static catalog`);
      return staticVeniceModelDefinitions();
    }
    log.warn(`Discovery failed: ${String(error)}, using static catalog`);
    return staticVeniceModelDefinitions();
  }
}
Messung V0.5 in Prozent C=100 H=98 G=98
¤ Dauer der Verarbeitung: 0.10 Sekunden
(vorverarbeitet am 2026-06-05)
¤
*© Formatika GbR, Deutschland