@mastra/core
Version:
Mastra is a framework for building AI-powered applications and agents with a modern TypeScript stack.
1,519 lines (1,514 loc) • 104 kB
JavaScript
'use strict';
var fs = require('fs');
var module$1 = require('module');
var os = require('os');
var path = require('path');
var _documentCurrentScript = typeof document !== 'undefined' ? document.currentScript : null;
function _interopDefault (e) { return e && e.__esModule ? e : { default: e }; }
var fs__default = /*#__PURE__*/_interopDefault(fs);
var os__default = /*#__PURE__*/_interopDefault(os);
var path__default = /*#__PURE__*/_interopDefault(path);
// src/llm/model/provider-registry.ts
// src/llm/model/provider-registry.json
var provider_registry_default = {
providers: {
"moonshotai-cn": {
url: "https://api.moonshot.cn/v1",
apiKeyEnvVar: "MOONSHOT_API_KEY",
apiKeyHeader: "Authorization",
name: "Moonshot AI (China)",
models: [
"kimi-k2-0711-preview",
"kimi-k2-0905-preview",
"kimi-k2-thinking",
"kimi-k2-thinking-turbo",
"kimi-k2-turbo-preview"
],
docUrl: "https://platform.moonshot.cn/docs/api/chat",
gateway: "models.dev"
},
lucidquery: {
url: "https://lucidquery.com/api/v1",
apiKeyEnvVar: "LUCIDQUERY_API_KEY",
apiKeyHeader: "Authorization",
name: "LucidQuery AI",
models: ["lucidnova-rf1-100b", "lucidquery-nexus-coder"],
docUrl: "https://lucidquery.com/api/docs",
gateway: "models.dev"
},
moonshotai: {
url: "https://api.moonshot.ai/v1",
apiKeyEnvVar: "MOONSHOT_API_KEY",
apiKeyHeader: "Authorization",
name: "Moonshot AI",
models: [
"kimi-k2-0711-preview",
"kimi-k2-0905-preview",
"kimi-k2-thinking",
"kimi-k2-thinking-turbo",
"kimi-k2-turbo-preview"
],
docUrl: "https://platform.moonshot.ai/docs/api/chat",
gateway: "models.dev"
},
"zai-coding-plan": {
url: "https://api.z.ai/api/coding/paas/v4",
apiKeyEnvVar: "ZHIPU_API_KEY",
apiKeyHeader: "Authorization",
name: "Z.AI Coding Plan",
models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
docUrl: "https://docs.z.ai/devpack/overview",
gateway: "models.dev"
},
alibaba: {
url: "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
apiKeyEnvVar: "DASHSCOPE_API_KEY",
apiKeyHeader: "Authorization",
name: "Alibaba",
models: [
"qvq-max",
"qwen-flash",
"qwen-max",
"qwen-mt-plus",
"qwen-mt-turbo",
"qwen-omni-turbo",
"qwen-omni-turbo-realtime",
"qwen-plus",
"qwen-plus-character-ja",
"qwen-turbo",
"qwen-vl-max",
"qwen-vl-ocr",
"qwen-vl-plus",
"qwen2-5-14b-instruct",
"qwen2-5-32b-instruct",
"qwen2-5-72b-instruct",
"qwen2-5-7b-instruct",
"qwen2-5-omni-7b",
"qwen2-5-vl-72b-instruct",
"qwen2-5-vl-7b-instruct",
"qwen3-14b",
"qwen3-235b-a22b",
"qwen3-32b",
"qwen3-8b",
"qwen3-asr-flash",
"qwen3-coder-30b-a3b-instruct",
"qwen3-coder-480b-a35b-instruct",
"qwen3-coder-flash",
"qwen3-coder-plus",
"qwen3-livetranslate-flash-realtime",
"qwen3-max",
"qwen3-next-80b-a3b-instruct",
"qwen3-next-80b-a3b-thinking",
"qwen3-omni-flash",
"qwen3-omni-flash-realtime",
"qwen3-vl-235b-a22b",
"qwen3-vl-30b-a3b",
"qwen3-vl-plus",
"qwq-plus"
],
docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
gateway: "models.dev"
},
xai: {
apiKeyEnvVar: "XAI_API_KEY",
name: "xAI",
models: [
"grok-2",
"grok-2-1212",
"grok-2-latest",
"grok-2-vision",
"grok-2-vision-1212",
"grok-2-vision-latest",
"grok-3",
"grok-3-fast",
"grok-3-fast-latest",
"grok-3-latest",
"grok-3-mini",
"grok-3-mini-fast",
"grok-3-mini-fast-latest",
"grok-3-mini-latest",
"grok-4",
"grok-4-1-fast",
"grok-4-1-fast-non-reasoning",
"grok-4-fast",
"grok-4-fast-non-reasoning",
"grok-beta",
"grok-code-fast-1",
"grok-vision-beta"
],
docUrl: "https://docs.x.ai/docs/models",
gateway: "models.dev"
},
vultr: {
url: "https://api.vultrinference.com/v1",
apiKeyEnvVar: "VULTR_API_KEY",
apiKeyHeader: "Authorization",
name: "Vultr",
models: [
"deepseek-r1-distill-llama-70b",
"deepseek-r1-distill-qwen-32b",
"gpt-oss-120b",
"kimi-k2-instruct",
"qwen2.5-coder-32b-instruct"
],
docUrl: "https://api.vultrinference.com/",
gateway: "models.dev"
},
nvidia: {
url: "https://integrate.api.nvidia.com/v1",
apiKeyEnvVar: "NVIDIA_API_KEY",
apiKeyHeader: "Authorization",
name: "Nvidia",
models: [
"black-forest-labs/flux.1-dev",
"deepseek-ai/deepseek-v3.1",
"deepseek-ai/deepseek-v3.1-terminus",
"google/gemma-3-27b-it",
"microsoft/phi-4-mini-instruct",
"minimaxai/minimax-m2",
"moonshotai/kimi-k2-instruct",
"moonshotai/kimi-k2-instruct-0905",
"nvidia/cosmos-nemotron-34b",
"nvidia/llama-3.1-nemotron-ultra-253b-v1",
"nvidia/llama-embed-nemotron-8b",
"nvidia/nemoretriever-ocr-v1",
"nvidia/nvidia-nemotron-nano-9b-v2",
"nvidia/parakeet-tdt-0.6b-v2",
"openai/gpt-oss-120b",
"openai/whisper-large-v3",
"qwen/qwen3-235b-a22b",
"qwen/qwen3-coder-480b-a35b-instruct",
"qwen/qwen3-next-80b-a3b-instruct",
"qwen/qwen3-next-80b-a3b-thinking"
],
docUrl: "https://docs.api.nvidia.com/nim/",
gateway: "models.dev"
},
upstage: {
url: "https://api.upstage.ai",
apiKeyEnvVar: "UPSTAGE_API_KEY",
apiKeyHeader: "Authorization",
name: "Upstage",
models: ["solar-mini", "solar-pro2"],
docUrl: "https://developers.upstage.ai/docs/apis/chat",
gateway: "models.dev"
},
groq: {
url: "https://api.groq.com/openai/v1",
apiKeyEnvVar: "GROQ_API_KEY",
apiKeyHeader: "Authorization",
name: "Groq",
models: [
"deepseek-r1-distill-llama-70b",
"gemma2-9b-it",
"llama-3.1-8b-instant",
"llama-3.3-70b-versatile",
"llama-guard-3-8b",
"llama3-70b-8192",
"llama3-8b-8192",
"meta-llama/llama-4-maverick-17b-128e-instruct",
"meta-llama/llama-4-scout-17b-16e-instruct",
"meta-llama/llama-guard-4-12b",
"mistral-saba-24b",
"moonshotai/kimi-k2-instruct",
"moonshotai/kimi-k2-instruct-0905",
"openai/gpt-oss-120b",
"openai/gpt-oss-20b",
"qwen-qwq-32b",
"qwen/qwen3-32b"
],
docUrl: "https://console.groq.com/docs/models",
gateway: "models.dev"
},
mistral: {
url: "https://api.mistral.ai/v1",
apiKeyEnvVar: "MISTRAL_API_KEY",
name: "Mistral",
models: [
"codestral-latest",
"devstral-medium-2507",
"devstral-small-2505",
"devstral-small-2507",
"magistral-medium-latest",
"magistral-small",
"ministral-3b-latest",
"ministral-8b-latest",
"mistral-large-latest",
"mistral-medium-2505",
"mistral-medium-2508",
"mistral-medium-latest",
"mistral-nemo",
"mistral-small-latest",
"open-mistral-7b",
"open-mixtral-8x22b",
"open-mixtral-8x7b",
"pixtral-12b",
"pixtral-large-latest"
],
docUrl: "https://docs.mistral.ai/getting-started/models/",
gateway: "models.dev"
},
vercel: {
url: "https://ai-gateway.vercel.sh/v1",
apiKeyEnvVar: "AI_GATEWAY_API_KEY",
apiKeyHeader: "Authorization",
name: "Vercel AI Gateway",
models: [
"alibaba/qwen3-coder-plus",
"alibaba/qwen3-max",
"alibaba/qwen3-next-80b-a3b-instruct",
"alibaba/qwen3-next-80b-a3b-thinking",
"alibaba/qwen3-vl-instruct",
"alibaba/qwen3-vl-thinking",
"amazon/nova-lite",
"amazon/nova-micro",
"amazon/nova-pro",
"anthropic/claude-3-haiku",
"anthropic/claude-3-opus",
"anthropic/claude-3.5-haiku",
"anthropic/claude-3.5-sonnet",
"anthropic/claude-3.7-sonnet",
"anthropic/claude-4-1-opus",
"anthropic/claude-4-opus",
"anthropic/claude-4-sonnet",
"anthropic/claude-4.5-sonnet",
"anthropic/claude-haiku-4.5",
"anthropic/claude-opus-4.5",
"deepseek/deepseek-r1",
"deepseek/deepseek-r1-distill-llama-70b",
"deepseek/deepseek-v3.1-terminus",
"deepseek/deepseek-v3.2-exp",
"deepseek/deepseek-v3.2-exp-thinking",
"google/gemini-2.0-flash",
"google/gemini-2.0-flash-lite",
"google/gemini-2.5-flash",
"google/gemini-2.5-flash-lite",
"google/gemini-2.5-flash-lite-preview-09-2025",
"google/gemini-2.5-flash-preview-09-2025",
"google/gemini-2.5-pro",
"google/gemini-3-pro-preview",
"meta/llama-3.3-70b",
"meta/llama-4-maverick",
"meta/llama-4-scout",
"minimax/minimax-m2",
"mistral/codestral",
"mistral/magistral-medium",
"mistral/magistral-small",
"mistral/ministral-3b",
"mistral/ministral-8b",
"mistral/mistral-large",
"mistral/mistral-small",
"mistral/mixtral-8x22b-instruct",
"mistral/pixtral-12b",
"mistral/pixtral-large",
"moonshotai/kimi-k2",
"morph/morph-v3-fast",
"morph/morph-v3-large",
"openai/gpt-4-turbo",
"openai/gpt-4.1",
"openai/gpt-4.1-mini",
"openai/gpt-4.1-nano",
"openai/gpt-4o",
"openai/gpt-4o-mini",
"openai/gpt-5",
"openai/gpt-5-codex",
"openai/gpt-5-mini",
"openai/gpt-5-nano",
"openai/gpt-oss-120b",
"openai/gpt-oss-20b",
"openai/o1",
"openai/o3",
"openai/o3-mini",
"openai/o4-mini",
"perplexity/sonar",
"perplexity/sonar-pro",
"perplexity/sonar-reasoning",
"perplexity/sonar-reasoning-pro",
"vercel/v0-1.0-md",
"vercel/v0-1.5-md",
"xai/grok-2",
"xai/grok-2-vision",
"xai/grok-3",
"xai/grok-3-fast",
"xai/grok-3-mini",
"xai/grok-3-mini-fast",
"xai/grok-4",
"xai/grok-4-fast",
"xai/grok-4-fast-non-reasoning",
"xai/grok-code-fast-1",
"zai/glm-4.5",
"zai/glm-4.5-air",
"zai/glm-4.5v",
"zai/glm-4.6"
],
docUrl: "https://github.com/vercel/ai/tree/5eb85cc45a259553501f535b8ac79a77d0e79223/packages/gateway",
gateway: "models.dev"
},
nebius: {
url: "https://api.tokenfactory.nebius.com/v1",
apiKeyEnvVar: "NEBIUS_API_KEY",
apiKeyHeader: "Authorization",
name: "Nebius Token Factory",
models: [
"NousResearch/hermes-4-405b",
"NousResearch/hermes-4-70b",
"deepseek-ai/deepseek-v3",
"meta-llama/llama-3.3-70b-instruct-base",
"meta-llama/llama-3.3-70b-instruct-fast",
"meta-llama/llama-3_1-405b-instruct",
"moonshotai/kimi-k2-instruct",
"nvidia/llama-3_1-nemotron-ultra-253b-v1",
"openai/gpt-oss-120b",
"openai/gpt-oss-20b",
"qwen/qwen3-235b-a22b-instruct-2507",
"qwen/qwen3-235b-a22b-thinking-2507",
"qwen/qwen3-coder-480b-a35b-instruct",
"zai-org/glm-4.5",
"zai-org/glm-4.5-air"
],
docUrl: "https://docs.tokenfactory.nebius.com/",
gateway: "models.dev"
},
deepseek: {
url: "https://api.deepseek.com",
apiKeyEnvVar: "DEEPSEEK_API_KEY",
apiKeyHeader: "Authorization",
name: "DeepSeek",
models: ["deepseek-chat", "deepseek-reasoner"],
docUrl: "https://platform.deepseek.com/api-docs/pricing",
gateway: "models.dev"
},
"alibaba-cn": {
url: "https://dashscope.aliyuncs.com/compatible-mode/v1",
apiKeyEnvVar: "DASHSCOPE_API_KEY",
apiKeyHeader: "Authorization",
name: "Alibaba (China)",
models: [
"deepseek-r1",
"deepseek-r1-0528",
"deepseek-r1-distill-llama-70b",
"deepseek-r1-distill-llama-8b",
"deepseek-r1-distill-qwen-1-5b",
"deepseek-r1-distill-qwen-14b",
"deepseek-r1-distill-qwen-32b",
"deepseek-r1-distill-qwen-7b",
"deepseek-v3",
"deepseek-v3-1",
"deepseek-v3-2-exp",
"moonshot-kimi-k2-instruct",
"qvq-max",
"qwen-deep-research",
"qwen-doc-turbo",
"qwen-flash",
"qwen-long",
"qwen-math-plus",
"qwen-math-turbo",
"qwen-max",
"qwen-mt-plus",
"qwen-mt-turbo",
"qwen-omni-turbo",
"qwen-omni-turbo-realtime",
"qwen-plus",
"qwen-plus-character",
"qwen-turbo",
"qwen-vl-max",
"qwen-vl-ocr",
"qwen-vl-plus",
"qwen2-5-14b-instruct",
"qwen2-5-32b-instruct",
"qwen2-5-72b-instruct",
"qwen2-5-7b-instruct",
"qwen2-5-coder-32b-instruct",
"qwen2-5-coder-7b-instruct",
"qwen2-5-math-72b-instruct",
"qwen2-5-math-7b-instruct",
"qwen2-5-omni-7b",
"qwen2-5-vl-72b-instruct",
"qwen2-5-vl-7b-instruct",
"qwen3-14b",
"qwen3-235b-a22b",
"qwen3-32b",
"qwen3-8b",
"qwen3-asr-flash",
"qwen3-coder-30b-a3b-instruct",
"qwen3-coder-480b-a35b-instruct",
"qwen3-coder-flash",
"qwen3-coder-plus",
"qwen3-max",
"qwen3-next-80b-a3b-instruct",
"qwen3-next-80b-a3b-thinking",
"qwen3-omni-flash",
"qwen3-omni-flash-realtime",
"qwen3-vl-235b-a22b",
"qwen3-vl-30b-a3b",
"qwen3-vl-plus",
"qwq-32b",
"qwq-plus",
"tongyi-intent-detect-v3"
],
docUrl: "https://www.alibabacloud.com/help/en/model-studio/models",
gateway: "models.dev"
},
venice: {
url: "https://api.venice.ai/api/v1",
apiKeyEnvVar: "VENICE_API_KEY",
apiKeyHeader: "Authorization",
name: "Venice AI",
models: [
"deepseek-coder-v2-lite",
"deepseek-r1-671b",
"dolphin-2.9.2-qwen2-72b",
"llama-3.1-405b",
"llama-3.2-3b",
"llama-3.3-70b",
"mistral-31-24b",
"qwen-2.5-coder-32b",
"qwen-2.5-qwq-32b",
"qwen-2.5-vl",
"qwen3-235b",
"qwen3-4b",
"venice-uncensored",
"zai-org-glm-4.6"
],
docUrl: "https://docs.venice.ai",
gateway: "models.dev"
},
chutes: {
url: "https://llm.chutes.ai/v1",
apiKeyEnvVar: "CHUTES_API_KEY",
apiKeyHeader: "Authorization",
name: "Chutes",
models: [
"Alibaba-NLP/Tongyi-DeepResearch-30B-A3B",
"ArliAI/QwQ-32B-ArliAI-RpR-v1",
"MiniMaxAI/MiniMax-M2",
"NousResearch/DeepHermes-3-Mistral-24B-Preview",
"NousResearch/Hermes-4-14B",
"NousResearch/Hermes-4-405B-FP8",
"NousResearch/Hermes-4-70B",
"OpenGVLab/InternVL3-78B",
"Qwen/Qwen2.5-72B-Instruct",
"Qwen/Qwen2.5-Coder-32B-Instruct",
"Qwen/Qwen2.5-VL-32B-Instruct",
"Qwen/Qwen2.5-VL-72B-Instruct",
"Qwen/Qwen3-14B",
"Qwen/Qwen3-235B-A22B",
"Qwen/Qwen3-235B-A22B-Instruct-2507",
"Qwen/Qwen3-235B-A22B-Thinking-2507",
"Qwen/Qwen3-30B-A3B",
"Qwen/Qwen3-30B-A3B-Instruct-2507",
"Qwen/Qwen3-32B",
"Qwen/Qwen3-Coder-30B-A3B-Instruct",
"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
"Qwen/Qwen3-Next-80B-A3B-Instruct",
"Qwen/Qwen3-VL-235B-A22B-Instruct",
"Qwen/Qwen3-VL-235B-A22B-Thinking",
"chutesai/Mistral-Small-3.1-24B-Instruct-2503",
"chutesai/Mistral-Small-3.2-24B-Instruct-2506",
"deepseek-ai/DeepSeek-R1",
"deepseek-ai/DeepSeek-R1-0528",
"deepseek-ai/DeepSeek-R1-0528-Qwen3-8B",
"deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
"deepseek-ai/DeepSeek-V3",
"deepseek-ai/DeepSeek-V3-0324",
"deepseek-ai/DeepSeek-V3.1",
"deepseek-ai/DeepSeek-V3.1-Terminus",
"deepseek-ai/DeepSeek-V3.2-Exp",
"meituan-longcat/LongCat-Flash-Chat-FP8",
"microsoft/MAI-DS-R1-FP8",
"moonshotai/Kimi-K2-Instruct-0905",
"moonshotai/Kimi-K2-Thinking",
"openai/gpt-oss-120b",
"openai/gpt-oss-20b",
"rednote-hilab/dots.ocr",
"tngtech/DeepSeek-R1T-Chimera",
"tngtech/DeepSeek-TNG-R1T2-Chimera",
"unsloth/Mistral-Nemo-Instruct-2407",
"unsloth/Mistral-Small-24B-Instruct-2501",
"unsloth/gemma-3-12b-it",
"unsloth/gemma-3-27b-it",
"unsloth/gemma-3-4b-it",
"zai-org/GLM-4.5",
"zai-org/GLM-4.5-Air",
"zai-org/GLM-4.6"
],
docUrl: "https://llm.chutes.ai/v1/models",
gateway: "models.dev"
},
cortecs: {
url: "https://api.cortecs.ai/v1",
apiKeyEnvVar: "CORTECS_API_KEY",
apiKeyHeader: "Authorization",
name: "Cortecs",
models: [
"claude-4-5-sonnet",
"claude-sonnet-4",
"deepseek-v3-0324",
"gemini-2.5-pro",
"gpt-4.1",
"gpt-oss-120b",
"kimi-k2-instruct",
"llama-3.1-405b-instruct",
"nova-pro-v1",
"qwen3-32b",
"qwen3-coder-480b-a35b-instruct"
],
docUrl: "https://api.cortecs.ai/v1/models",
gateway: "models.dev"
},
"github-models": {
url: "https://models.github.ai/inference",
apiKeyEnvVar: "GITHUB_TOKEN",
apiKeyHeader: "Authorization",
name: "GitHub Models",
models: [
"ai21-labs/ai21-jamba-1.5-large",
"ai21-labs/ai21-jamba-1.5-mini",
"cohere/cohere-command-a",
"cohere/cohere-command-r",
"cohere/cohere-command-r-08-2024",
"cohere/cohere-command-r-plus",
"cohere/cohere-command-r-plus-08-2024",
"core42/jais-30b-chat",
"deepseek/deepseek-r1",
"deepseek/deepseek-r1-0528",
"deepseek/deepseek-v3-0324",
"meta/llama-3.2-11b-vision-instruct",
"meta/llama-3.2-90b-vision-instruct",
"meta/llama-3.3-70b-instruct",
"meta/llama-4-maverick-17b-128e-instruct-fp8",
"meta/llama-4-scout-17b-16e-instruct",
"meta/meta-llama-3-70b-instruct",
"meta/meta-llama-3-8b-instruct",
"meta/meta-llama-3.1-405b-instruct",
"meta/meta-llama-3.1-70b-instruct",
"meta/meta-llama-3.1-8b-instruct",
"microsoft/mai-ds-r1",
"microsoft/phi-3-medium-128k-instruct",
"microsoft/phi-3-medium-4k-instruct",
"microsoft/phi-3-mini-128k-instruct",
"microsoft/phi-3-mini-4k-instruct",
"microsoft/phi-3-small-128k-instruct",
"microsoft/phi-3-small-8k-instruct",
"microsoft/phi-3.5-mini-instruct",
"microsoft/phi-3.5-moe-instruct",
"microsoft/phi-3.5-vision-instruct",
"microsoft/phi-4",
"microsoft/phi-4-mini-instruct",
"microsoft/phi-4-mini-reasoning",
"microsoft/phi-4-multimodal-instruct",
"microsoft/phi-4-reasoning",
"mistral-ai/codestral-2501",
"mistral-ai/ministral-3b",
"mistral-ai/mistral-large-2411",
"mistral-ai/mistral-medium-2505",
"mistral-ai/mistral-nemo",
"mistral-ai/mistral-small-2503",
"openai/gpt-4.1",
"openai/gpt-4.1-mini",
"openai/gpt-4.1-nano",
"openai/gpt-4o",
"openai/gpt-4o-mini",
"openai/o1",
"openai/o1-mini",
"openai/o1-preview",
"openai/o3",
"openai/o3-mini",
"openai/o4-mini",
"xai/grok-3",
"xai/grok-3-mini"
],
docUrl: "https://docs.github.com/en/github-models",
gateway: "models.dev"
},
togetherai: {
url: "https://api.together.xyz/v1",
apiKeyEnvVar: "TOGETHER_API_KEY",
apiKeyHeader: "Authorization",
name: "Together AI",
models: [
"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
"deepseek-ai/DeepSeek-R1",
"deepseek-ai/DeepSeek-V3",
"meta-llama/Llama-3.3-70B-Instruct-Turbo",
"moonshotai/Kimi-K2-Instruct",
"openai/gpt-oss-120b"
],
docUrl: "https://docs.together.ai/docs/serverless-models",
gateway: "models.dev"
},
baseten: {
url: "https://inference.baseten.co/v1",
apiKeyEnvVar: "BASETEN_API_KEY",
apiKeyHeader: "Authorization",
name: "Baseten",
models: [
"Qwen/Qwen3-Coder-480B-A35B-Instruct",
"moonshotai/Kimi-K2-Instruct-0905",
"moonshotai/Kimi-K2-Thinking",
"zai-org/GLM-4.6"
],
docUrl: "https://docs.baseten.co/development/model-apis/overview",
gateway: "models.dev"
},
siliconflow: {
url: "https://api.siliconflow.com/v1",
apiKeyEnvVar: "SILICONFLOW_API_KEY",
apiKeyHeader: "Authorization",
name: "SiliconFlow",
models: [
"baidu-ernie-4.5-300b-a47b",
"bytedance-seed-seed-oss-36b-instruct",
"deepseek-ai-deepseek-r1",
"deepseek-ai-deepseek-r1-distill-qwen-14b",
"deepseek-ai-deepseek-r1-distill-qwen-32b",
"deepseek-ai-deepseek-r1-distill-qwen-7b",
"deepseek-ai-deepseek-v3",
"deepseek-ai-deepseek-v3.1",
"deepseek-ai-deepseek-v3.1-terminus",
"deepseek-ai-deepseek-v3.2-exp",
"deepseek-ai-deepseek-vl2",
"inclusionai-ling-flash-2.0",
"inclusionai-ling-mini-2.0",
"inclusionai-ring-flash-2.0",
"meta-llama-meta-llama-3.1-8b-instruct",
"minimaxai-minimax-m1-80k",
"minimaxai-minimax-m2",
"moonshotai-kimi-dev-72b",
"moonshotai-kimi-k2-instruct",
"moonshotai-kimi-k2-instruct-0905",
"moonshotai-kimi-k2-thinking",
"nex-agi-deepseek-v3.1-nex-n1",
"openai-gpt-oss-120b",
"openai-gpt-oss-20b",
"qwen-qwen2.5-14b-instruct",
"qwen-qwen2.5-32b-instruct",
"qwen-qwen2.5-72b-instruct",
"qwen-qwen2.5-72b-instruct-128k",
"qwen-qwen2.5-7b-instruct",
"qwen-qwen2.5-coder-32b-instruct",
"qwen-qwen2.5-vl-32b-instruct",
"qwen-qwen2.5-vl-72b-instruct",
"qwen-qwen2.5-vl-7b-instruct",
"qwen-qwen3-14b",
"qwen-qwen3-235b-a22b",
"qwen-qwen3-235b-a22b-instruct-2507",
"qwen-qwen3-235b-a22b-thinking-2507",
"qwen-qwen3-30b-a3b",
"qwen-qwen3-30b-a3b-instruct-2507",
"qwen-qwen3-30b-a3b-thinking-2507",
"qwen-qwen3-32b",
"qwen-qwen3-8b",
"qwen-qwen3-coder-30b-a3b-instruct",
"qwen-qwen3-coder-480b-a35b-instruct",
"qwen-qwen3-next-80b-a3b-instruct",
"qwen-qwen3-next-80b-a3b-thinking",
"qwen-qwen3-omni-30b-a3b-captioner",
"qwen-qwen3-omni-30b-a3b-instruct",
"qwen-qwen3-omni-30b-a3b-thinking",
"qwen-qwen3-vl-235b-a22b-instruct",
"qwen-qwen3-vl-235b-a22b-thinking",
"qwen-qwen3-vl-30b-a3b-instruct",
"qwen-qwen3-vl-30b-a3b-thinking",
"qwen-qwen3-vl-32b-instruct",
"qwen-qwen3-vl-32b-thinking",
"qwen-qwen3-vl-8b-instruct",
"qwen-qwen3-vl-8b-thinking",
"qwen-qwq-32b",
"stepfun-ai-step3",
"tencent-hunyuan-a13b-instruct",
"tencent-hunyuan-mt-7b",
"thudm-glm-4-32b-0414",
"thudm-glm-4-9b-0414",
"thudm-glm-4.1v-9b-thinking",
"thudm-glm-z1-32b-0414",
"thudm-glm-z1-9b-0414",
"z-ai-glm-4.5",
"z-ai-glm-4.5-air",
"zai-org-glm-4.5",
"zai-org-glm-4.5-air",
"zai-org-glm-4.5v",
"zai-org-glm-4.6"
],
docUrl: "https://cloud.siliconflow.com/models",
gateway: "models.dev"
},
huggingface: {
url: "https://router.huggingface.co/v1",
apiKeyEnvVar: "HF_TOKEN",
apiKeyHeader: "Authorization",
name: "Hugging Face",
models: [
"MiniMaxAI/MiniMax-M2",
"Qwen/Qwen3-235B-A22B-Thinking-2507",
"Qwen/Qwen3-Coder-480B-A35B-Instruct",
"Qwen/Qwen3-Embedding-4B",
"Qwen/Qwen3-Embedding-8B",
"Qwen/Qwen3-Next-80B-A3B-Instruct",
"Qwen/Qwen3-Next-80B-A3B-Thinking",
"deepseek-ai/DeepSeek-R1-0528",
"deepseek-ai/Deepseek-V3-0324",
"moonshotai/Kimi-K2-Instruct",
"moonshotai/Kimi-K2-Instruct-0905",
"zai-org/GLM-4.5",
"zai-org/GLM-4.5-Air",
"zai-org/GLM-4.6"
],
docUrl: "https://huggingface.co/docs/inference-providers",
gateway: "models.dev"
},
opencode: {
url: "https://opencode.ai/zen/v1",
apiKeyEnvVar: "OPENCODE_API_KEY",
apiKeyHeader: "Authorization",
name: "OpenCode Zen",
models: [
"alpha-doubao-seed-code",
"alpha-gd4",
"alpha-minimax-m2",
"big-pickle",
"claude-3-5-haiku",
"claude-haiku-4-5",
"claude-opus-4-1",
"claude-opus-4-5",
"claude-sonnet-4",
"claude-sonnet-4-5",
"gemini-3-pro",
"glm-4.6",
"gpt-5",
"gpt-5-codex",
"gpt-5-nano",
"gpt-5.1",
"gpt-5.1-codex",
"grok-code",
"kimi-k2",
"kimi-k2-thinking",
"qwen3-coder"
],
docUrl: "https://opencode.ai/docs/zen",
gateway: "models.dev"
},
fastrouter: {
url: "https://go.fastrouter.ai/api/v1",
apiKeyEnvVar: "FASTROUTER_API_KEY",
apiKeyHeader: "Authorization",
name: "FastRouter",
models: [
"anthropic/claude-opus-4.1",
"anthropic/claude-sonnet-4",
"deepseek-ai/deepseek-r1-distill-llama-70b",
"google/gemini-2.5-flash",
"google/gemini-2.5-pro",
"moonshotai/kimi-k2",
"openai/gpt-4.1",
"openai/gpt-5",
"openai/gpt-5-mini",
"openai/gpt-5-nano",
"openai/gpt-oss-120b",
"openai/gpt-oss-20b",
"qwen/qwen3-coder",
"x-ai/grok-4"
],
docUrl: "https://fastrouter.ai/models",
gateway: "models.dev"
},
minimax: {
url: "https://api.minimax.io/anthropic/v1",
apiKeyEnvVar: "MINIMAX_API_KEY",
apiKeyHeader: "Authorization",
name: "Minimax",
models: ["MiniMax-M2"],
docUrl: "https://platform.minimax.io/docs/guides/quickstart",
gateway: "models.dev"
},
google: {
apiKeyEnvVar: "GOOGLE_GENERATIVE_AI_API_KEY",
name: "Google",
models: [
"gemini-1.5-flash",
"gemini-1.5-flash-8b",
"gemini-1.5-pro",
"gemini-2.0-flash",
"gemini-2.0-flash-lite",
"gemini-2.5-flash",
"gemini-2.5-flash-image",
"gemini-2.5-flash-image-preview",
"gemini-2.5-flash-lite",
"gemini-2.5-flash-lite-preview-06-17",
"gemini-2.5-flash-lite-preview-09-2025",
"gemini-2.5-flash-preview-04-17",
"gemini-2.5-flash-preview-05-20",
"gemini-2.5-flash-preview-09-2025",
"gemini-2.5-flash-preview-tts",
"gemini-2.5-pro",
"gemini-2.5-pro-preview-05-06",
"gemini-2.5-pro-preview-06-05",
"gemini-2.5-pro-preview-tts",
"gemini-3-pro-preview",
"gemini-embedding-001",
"gemini-flash-latest",
"gemini-flash-lite-latest",
"gemini-live-2.5-flash",
"gemini-live-2.5-flash-preview-native-audio"
],
docUrl: "https://ai.google.dev/gemini-api/docs/pricing",
gateway: "models.dev"
},
inception: {
url: "https://api.inceptionlabs.ai/v1/",
apiKeyEnvVar: "INCEPTION_API_KEY",
apiKeyHeader: "Authorization",
name: "Inception",
models: ["mercury", "mercury-coder"],
docUrl: "https://platform.inceptionlabs.ai/docs",
gateway: "models.dev"
},
wandb: {
url: "https://api.inference.wandb.ai/v1",
apiKeyEnvVar: "WANDB_API_KEY",
apiKeyHeader: "Authorization",
name: "Weights & Biases",
models: [
"Qwen/Qwen3-235B-A22B-Instruct-2507",
"Qwen/Qwen3-235B-A22B-Thinking-2507",
"Qwen/Qwen3-Coder-480B-A35B-Instruct",
"deepseek-ai/DeepSeek-R1-0528",
"deepseek-ai/DeepSeek-V3-0324",
"meta-llama/Llama-3.1-8B-Instruct",
"meta-llama/Llama-3.3-70B-Instruct",
"meta-llama/Llama-4-Scout-17B-16E-Instruct",
"microsoft/Phi-4-mini-instruct",
"moonshotai/Kimi-K2-Instruct"
],
docUrl: "https://weave-docs.wandb.ai/guides/integrations/inference/",
gateway: "models.dev"
},
openai: {
apiKeyEnvVar: "OPENAI_API_KEY",
name: "OpenAI",
models: [
"codex-mini-latest",
"gpt-3.5-turbo",
"gpt-4",
"gpt-4-turbo",
"gpt-4.1",
"gpt-4.1-mini",
"gpt-4.1-nano",
"gpt-4o",
"gpt-4o-2024-05-13",
"gpt-4o-2024-08-06",
"gpt-4o-2024-11-20",
"gpt-4o-mini",
"gpt-5",
"gpt-5-chat-latest",
"gpt-5-codex",
"gpt-5-mini",
"gpt-5-nano",
"gpt-5-pro",
"gpt-5.1",
"gpt-5.1-chat-latest",
"gpt-5.1-codex",
"gpt-5.1-codex-mini",
"o1",
"o1-mini",
"o1-preview",
"o1-pro",
"o3",
"o3-deep-research",
"o3-mini",
"o3-pro",
"o4-mini",
"o4-mini-deep-research",
"text-embedding-3-large",
"text-embedding-3-small",
"text-embedding-ada-002"
],
docUrl: "https://platform.openai.com/docs/models",
gateway: "models.dev"
},
"zhipuai-coding-plan": {
url: "https://open.bigmodel.cn/api/coding/paas/v4",
apiKeyEnvVar: "ZHIPU_API_KEY",
apiKeyHeader: "Authorization",
name: "Zhipu AI Coding Plan",
models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
docUrl: "https://docs.bigmodel.cn/cn/coding-plan/overview",
gateway: "models.dev"
},
perplexity: {
url: "https://api.perplexity.ai",
apiKeyEnvVar: "PERPLEXITY_API_KEY",
apiKeyHeader: "Authorization",
name: "Perplexity",
models: ["sonar", "sonar-pro", "sonar-reasoning", "sonar-reasoning-pro"],
docUrl: "https://docs.perplexity.ai",
gateway: "models.dev"
},
openrouter: {
url: "https://openrouter.ai/api/v1",
apiKeyEnvVar: "OPENROUTER_API_KEY",
name: "OpenRouter",
models: [
"anthropic/claude-3.5-haiku",
"anthropic/claude-3.7-sonnet",
"anthropic/claude-haiku-4.5",
"anthropic/claude-opus-4",
"anthropic/claude-opus-4.1",
"anthropic/claude-opus-4.5",
"anthropic/claude-sonnet-4",
"anthropic/claude-sonnet-4.5",
"cognitivecomputations/dolphin3.0-mistral-24b",
"cognitivecomputations/dolphin3.0-r1-mistral-24b",
"deepseek/deepseek-chat-v3-0324",
"deepseek/deepseek-chat-v3.1",
"deepseek/deepseek-r1-0528-qwen3-8b:free",
"deepseek/deepseek-r1-0528:free",
"deepseek/deepseek-r1-distill-llama-70b",
"deepseek/deepseek-r1-distill-qwen-14b",
"deepseek/deepseek-r1:free",
"deepseek/deepseek-v3-base:free",
"deepseek/deepseek-v3.1-terminus",
"deepseek/deepseek-v3.1-terminus:exacto",
"featherless/qwerky-72b",
"google/gemini-2.0-flash-001",
"google/gemini-2.0-flash-exp:free",
"google/gemini-2.5-flash",
"google/gemini-2.5-flash-lite",
"google/gemini-2.5-flash-lite-preview-09-2025",
"google/gemini-2.5-flash-preview-09-2025",
"google/gemini-2.5-pro",
"google/gemini-2.5-pro-preview-05-06",
"google/gemini-2.5-pro-preview-06-05",
"google/gemini-3-pro-preview",
"google/gemma-2-9b-it:free",
"google/gemma-3-12b-it",
"google/gemma-3-27b-it",
"google/gemma-3n-e4b-it",
"google/gemma-3n-e4b-it:free",
"kwaipilot/kat-coder-pro:free",
"meta-llama/llama-3.2-11b-vision-instruct",
"meta-llama/llama-3.3-70b-instruct:free",
"meta-llama/llama-4-scout:free",
"microsoft/mai-ds-r1:free",
"minimax/minimax-01",
"minimax/minimax-m1",
"minimax/minimax-m2",
"mistralai/codestral-2508",
"mistralai/devstral-medium-2507",
"mistralai/devstral-small-2505",
"mistralai/devstral-small-2505:free",
"mistralai/devstral-small-2507",
"mistralai/mistral-7b-instruct:free",
"mistralai/mistral-medium-3",
"mistralai/mistral-medium-3.1",
"mistralai/mistral-nemo:free",
"mistralai/mistral-small-3.1-24b-instruct",
"mistralai/mistral-small-3.2-24b-instruct",
"mistralai/mistral-small-3.2-24b-instruct:free",
"moonshotai/kimi-dev-72b:free",
"moonshotai/kimi-k2",
"moonshotai/kimi-k2-0905",
"moonshotai/kimi-k2-0905:exacto",
"moonshotai/kimi-k2-thinking",
"moonshotai/kimi-k2:free",
"nousresearch/deephermes-3-llama-3-8b-preview",
"nousresearch/hermes-4-405b",
"nousresearch/hermes-4-70b",
"nvidia/nemotron-nano-9b-v2",
"openai/gpt-4.1",
"openai/gpt-4.1-mini",
"openai/gpt-4o-mini",
"openai/gpt-5",
"openai/gpt-5-chat",
"openai/gpt-5-codex",
"openai/gpt-5-image",
"openai/gpt-5-mini",
"openai/gpt-5-nano",
"openai/gpt-5-pro",
"openai/gpt-5.1",
"openai/gpt-5.1-chat",
"openai/gpt-5.1-codex",
"openai/gpt-5.1-codex-mini",
"openai/gpt-oss-120b",
"openai/gpt-oss-120b:exacto",
"openai/gpt-oss-20b",
"openai/gpt-oss-safeguard-20b",
"openai/o4-mini",
"qwen/qwen-2.5-coder-32b-instruct",
"qwen/qwen2.5-vl-32b-instruct:free",
"qwen/qwen2.5-vl-72b-instruct",
"qwen/qwen2.5-vl-72b-instruct:free",
"qwen/qwen3-14b:free",
"qwen/qwen3-235b-a22b-07-25",
"qwen/qwen3-235b-a22b-07-25:free",
"qwen/qwen3-235b-a22b-thinking-2507",
"qwen/qwen3-235b-a22b:free",
"qwen/qwen3-30b-a3b-instruct-2507",
"qwen/qwen3-30b-a3b-thinking-2507",
"qwen/qwen3-30b-a3b:free",
"qwen/qwen3-32b:free",
"qwen/qwen3-8b:free",
"qwen/qwen3-coder",
"qwen/qwen3-coder-flash",
"qwen/qwen3-coder:exacto",
"qwen/qwen3-coder:free",
"qwen/qwen3-max",
"qwen/qwen3-next-80b-a3b-instruct",
"qwen/qwen3-next-80b-a3b-thinking",
"qwen/qwq-32b:free",
"rekaai/reka-flash-3",
"sarvamai/sarvam-m:free",
"thudm/glm-z1-32b:free",
"tngtech/deepseek-r1t2-chimera:free",
"x-ai/grok-3",
"x-ai/grok-3-beta",
"x-ai/grok-3-mini",
"x-ai/grok-3-mini-beta",
"x-ai/grok-4",
"x-ai/grok-4-fast",
"x-ai/grok-4.1-fast",
"x-ai/grok-code-fast-1",
"z-ai/glm-4.5",
"z-ai/glm-4.5-air",
"z-ai/glm-4.5-air:free",
"z-ai/glm-4.5v",
"z-ai/glm-4.6",
"z-ai/glm-4.6:exacto"
],
docUrl: "https://openrouter.ai/models",
gateway: "models.dev"
},
zenmux: {
url: "https://zenmux.ai/api/v1",
apiKeyEnvVar: "ZENMUX_API_KEY",
apiKeyHeader: "Authorization",
name: "ZenMux",
models: [
"anthropic/claude-haiku-4.5",
"anthropic/claude-opus-4.1",
"anthropic/claude-sonnet-4.5",
"deepseek/deepseek-chat",
"google/gemini-2.5-pro",
"inclusionai/lint-1t",
"inclusionai/ring-1t",
"kuaishou/kat-coder-pro-v1",
"minimax/minimax-m2",
"moonshotai/kimi-k2-0905",
"moonshotai/kimi-k2-thinking",
"moonshotai/kimi-k2-thinking-turbo",
"openai/gpt-5",
"openai/gpt-5-codex",
"qwen/qwen3-coder-plus",
"x-ai/grok-4",
"x-ai/grok-4-fast",
"x-ai/grok-4-fast-non-reasoning",
"x-ai/grok-code-fast-1",
"z-ai/glm-4.5-air",
"z-ai/glm-4.6"
],
docUrl: "https://docs.zenmux.ai",
gateway: "models.dev"
},
ovhcloud: {
url: "https://oai.endpoints.kepler.ai.cloud.ovh.net/v1",
apiKeyEnvVar: "OVHCLOUD_API_KEY",
apiKeyHeader: "Authorization",
name: "OVHcloud AI Endpoints",
models: [
"deepseek-r1-distill-llama-70b",
"gpt-oss-120b",
"gpt-oss-20b",
"llama-3.1-8b-instruct",
"llava-next-mistral-7b",
"meta-llama-3_1-70b-instruct",
"meta-llama-3_3-70b-instruct",
"mistral-7b-instruct-v0.3",
"mistral-nemo-instruct-2407",
"mistral-small-3.2-24b-instruct-2506",
"mixtral-8x7b-instruct-v0.1",
"qwen2.5-coder-32b-instruct",
"qwen2.5-vl-72b-instruct",
"qwen3-32b",
"qwen3-coder-30b-a3b-instruct"
],
docUrl: "https://www.ovhcloud.com/en/public-cloud/ai-endpoints/catalog//",
gateway: "models.dev"
},
iflowcn: {
url: "https://apis.iflow.cn/v1",
apiKeyEnvVar: "IFLOW_API_KEY",
apiKeyHeader: "Authorization",
name: "iFlow",
models: [
"deepseek-r1",
"deepseek-v3",
"deepseek-v3.1",
"deepseek-v3.2",
"glm-4.6",
"kimi-k2",
"kimi-k2-0905",
"minimax-m2",
"qwen3-235b",
"qwen3-235b-a22b-instruct",
"qwen3-235b-a22b-thinking-2507",
"qwen3-32b",
"qwen3-coder",
"qwen3-coder-plus",
"qwen3-max",
"qwen3-max-preview",
"qwen3-vl-plus",
"tstars2.0"
],
docUrl: "https://platform.iflow.cn/en/docs",
gateway: "models.dev"
},
synthetic: {
url: "https://api.synthetic.new/v1",
apiKeyEnvVar: "SYNTHETIC_API_KEY",
apiKeyHeader: "Authorization",
name: "Synthetic",
models: [
"hf:MiniMaxAI/MiniMax-M2",
"hf:Qwen/Qwen2.5-Coder-32B-Instruct",
"hf:Qwen/Qwen3-235B-A22B-Instruct-2507",
"hf:Qwen/Qwen3-235B-A22B-Thinking-2507",
"hf:Qwen/Qwen3-Coder-480B-A35B-Instruct",
"hf:deepseek-ai/DeepSeek-R1",
"hf:deepseek-ai/DeepSeek-R1-0528",
"hf:deepseek-ai/DeepSeek-V3",
"hf:deepseek-ai/DeepSeek-V3-0324",
"hf:deepseek-ai/DeepSeek-V3.1",
"hf:deepseek-ai/DeepSeek-V3.1-Terminus",
"hf:meta-llama/Llama-3.1-405B-Instruct",
"hf:meta-llama/Llama-3.1-70B-Instruct",
"hf:meta-llama/Llama-3.1-8B-Instruct",
"hf:meta-llama/Llama-3.3-70B-Instruct",
"hf:meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
"hf:meta-llama/Llama-4-Scout-17B-16E-Instruct",
"hf:moonshotai/Kimi-K2-Instruct",
"hf:moonshotai/Kimi-K2-Instruct-0905",
"hf:moonshotai/Kimi-K2-Thinking",
"hf:openai/gpt-oss-120b",
"hf:zai-org/GLM-4.5",
"hf:zai-org/GLM-4.6"
],
docUrl: "https://synthetic.new/pricing",
gateway: "models.dev"
},
deepinfra: {
url: "https://api.deepinfra.com/v1/openai",
apiKeyEnvVar: "DEEPINFRA_API_KEY",
apiKeyHeader: "Authorization",
name: "Deep Infra",
models: [
"Qwen/Qwen3-Coder-480B-A35B-Instruct",
"Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo",
"moonshotai/Kimi-K2-Instruct",
"openai/gpt-oss-120b",
"openai/gpt-oss-20b",
"zai-org/GLM-4.5"
],
docUrl: "https://deepinfra.com/models",
gateway: "models.dev"
},
zhipuai: {
url: "https://open.bigmodel.cn/api/paas/v4",
apiKeyEnvVar: "ZHIPU_API_KEY",
apiKeyHeader: "Authorization",
name: "Zhipu AI",
models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
docUrl: "https://docs.z.ai/guides/overview/pricing",
gateway: "models.dev"
},
submodel: {
url: "https://llm.submodel.ai/v1",
apiKeyEnvVar: "SUBMODEL_INSTAGEN_ACCESS_KEY",
apiKeyHeader: "Authorization",
name: "submodel",
models: [
"Qwen/Qwen3-235B-A22B-Instruct-2507",
"Qwen/Qwen3-235B-A22B-Thinking-2507",
"Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8",
"deepseek-ai/DeepSeek-R1-0528",
"deepseek-ai/DeepSeek-V3-0324",
"deepseek-ai/DeepSeek-V3.1",
"openai/gpt-oss-120b",
"zai-org/GLM-4.5-Air",
"zai-org/GLM-4.5-FP8"
],
docUrl: "https://submodel.gitbook.io",
gateway: "models.dev"
},
zai: {
url: "https://api.z.ai/api/paas/v4",
apiKeyEnvVar: "ZHIPU_API_KEY",
apiKeyHeader: "Authorization",
name: "Z.AI",
models: ["glm-4.5", "glm-4.5-air", "glm-4.5-flash", "glm-4.5v", "glm-4.6"],
docUrl: "https://docs.z.ai/guides/overview/pricing",
gateway: "models.dev"
},
inference: {
url: "https://inference.net/v1",
apiKeyEnvVar: "INFERENCE_API_KEY",
apiKeyHeader: "Authorization",
name: "Inference",
models: [
"google/gemma-3",
"meta/llama-3.1-8b-instruct",
"meta/llama-3.2-11b-vision-instruct",
"meta/llama-3.2-1b-instruct",
"meta/llama-3.2-3b-instruct",
"mistral/mistral-nemo-12b-instruct",
"osmosis/osmosis-structure-0.6b",
"qwen/qwen-2.5-7b-vision-instruct",
"qwen/qwen3-embedding-4b"
],
docUrl: "https://inference.net/models",
gateway: "models.dev"
},
requesty: {
url: "https://router.requesty.ai/v1",
apiKeyEnvVar: "REQUESTY_API_KEY",
apiKeyHeader: "Authorization",
name: "Requesty",
models: [
"anthropic/claude-3-7-sonnet",
"anthropic/claude-haiku-4-5",
"anthropic/claude-opus-4",
"anthropic/claude-opus-4-1",
"anthropic/claude-sonnet-4",
"anthropic/claude-sonnet-4-5",
"google/gemini-2.5-flash",
"google/gemini-2.5-pro",
"openai/gpt-4.1",
"openai/gpt-4.1-mini",
"openai/gpt-4o-mini",
"openai/gpt-5",
"openai/gpt-5-mini",
"openai/gpt-5-nano",
"openai/o4-mini",
"xai/grok-4",
"xai/grok-4-fast"
],
docUrl: "https://requesty.ai/solution/llm-routing/models",
gateway: "models.dev"
},
morph: {
url: "https://api.morphllm.com/v1",
apiKeyEnvVar: "MORPH_API_KEY",
apiKeyHeader: "Authorization",
name: "Morph",
models: ["auto", "morph-v3-fast", "morph-v3-large"],
docUrl: "https://docs.morphllm.com/api-reference/introduction",
gateway: "models.dev"
},
lmstudio: {
url: "http://127.0.0.1:1234/v1",
apiKeyEnvVar: "LMSTUDIO_API_KEY",
apiKeyHeader: "Authorization",
name: "LMStudio",
models: ["openai/gpt-oss-20b", "qwen/qwen3-30b-a3b-2507", "qwen/qwen3-coder-30b"],
docUrl: "https://lmstudio.ai/models",
gateway: "models.dev"
},
anthropic: {
apiKeyEnvVar: "ANTHROPIC_API_KEY",
name: "Anthropic",
models: [
"claude-3-5-haiku-20241022",
"claude-3-5-haiku-latest",
"claude-3-5-sonnet-20240620",
"claude-3-5-sonnet-20241022",
"claude-3-7-sonnet-20250219",
"claude-3-7-sonnet-latest",
"claude-3-haiku-20240307",
"claude-3-opus-20240229",
"claude-3-sonnet-20240229",
"claude-haiku-4-5",
"claude-haiku-4-5-20251001",
"claude-opus-4-0",
"claude-opus-4-1",
"claude-opus-4-1-20250805",
"claude-opus-4-20250514",
"claude-opus-4-5",
"claude-sonnet-4-0",
"claude-sonnet-4-20250514",
"claude-sonnet-4-5",
"claude-sonnet-4-5-20250929"
],
docUrl: "https://docs.anthropic.com/en/docs/about-claude/models",
gateway: "models.dev"
},
"fireworks-ai": {
url: "https://api.fireworks.ai/inference/v1/",
apiKeyEnvVar: "FIREWORKS_API_KEY",
apiKeyHeader: "Authorization",
name: "Fireworks AI",
models: [
"accounts/fireworks/models/deepseek-r1-0528",
"accounts/fireworks/models/deepseek-v3-0324",
"accounts/fireworks/models/deepseek-v3p1",
"accounts/fireworks/models/glm-4p5",
"accounts/fireworks/models/glm-4p5-air",
"accounts/fireworks/models/gpt-oss-120b",
"accounts/fireworks/models/gpt-oss-20b",
"accounts/fireworks/models/kimi-k2-instruct",
"accounts/fireworks/models/kimi-k2-thinking",
"accounts/fireworks/models/minimax-m2",
"accounts/fireworks/models/qwen3-235b-a22b",
"accounts/fireworks/models/qwen3-coder-480b-a35b-instruct"
],
docUrl: "https://fireworks.ai/docs/",
gateway: "models.dev"
},
modelscope: {
url: "https://api-inference.modelscope.cn/v1",
apiKeyEnvVar: "MODELSCOPE_API_KEY",
apiKeyHeader: "Authorization",
name: "ModelScope",
models: [
"Qwen/Qwen3-235B-A22B-Instruct-2507",
"Qwen/Qwen3-235B-A22B-Thinking-2507",
"Qwen/Qwen3-30B-A3B-Instruct-2507",
"Qwen/Qwen3-30B-A3B-Thinking-2507",
"Qwen/Qwen3-Coder-30B-A3B-Instruct",
"ZhipuAI/GLM-4.5",
"ZhipuAI/GLM-4.6"
],
docUrl: "https://modelscope.cn/docs/model-service/API-Inference/intro",
gateway: "models.dev"
},
llama: {
url: "https://api.llama.com/compat/v1/",
apiKeyEnvVar: "LLAMA_API_KEY",
apiKeyHeader: "Authorization",
name: "Llama",
models: [
"cerebras-llama-4-maverick-17b-128e-instruct",
"cerebras-llama-4-scout-17b-16e-instruct",
"groq-llama-4-maverick-17b-128e-instruct",
"llama-3.3-70b-instruct",
"llama-3.3-8b-instruct",
"llama-4-maverick-17b-128e-instruct-fp8",
"llama-4-scout-17b-16e-instruct-fp8"
],
docUrl: "https://llama.developer.meta.com/docs/models",
gateway: "models.dev"
},
scaleway: {
url: "https://api.scaleway.ai/v1",
apiKeyEnvVar: "SCALEWAY_API_KEY",
apiKeyHeader: "Authorization",
name: "Scaleway",
models: [
"bge-multilingual-gemma2",
"deepseek-r1-distill-llama-70b",
"gemma-3-27b-it",
"gpt-oss-120b",
"llama-3.1-8b-instruct",
"llama-3.3-70b-instruct",
"mistral-nemo-instruct-2407",
"mistral-small-3.2-24b-instruct-2506",
"pixtral-12b-2409",
"qwen3-235b-a22b-instruct-2507",
"qwen3-coder-30b-a3b-instruct",
"voxtral-small-24b-2507",
"whisper-large-v3"
],
docUrl: "https://www.scaleway.com/en/docs/generative-apis/",
gateway: "models.dev"
},
poe: {
url: "https://api.poe.com/v1",
apiKeyEnvVar: "POE_API_KEY",
apiKeyHeader: "Authorization",
name: "Poe",
models: [
"anthropic/claude-haiku-3",
"anthropic/claude-haiku-3.5",
"anthropic/claude-haiku-3.5-search",
"anthropic/claude-haiku-4.5",
"anthropic/claude-opus-3",
"anthropic/claude-opus-4",
"anthropic/claude-opus-4-reasoning",
"anthropic/claude-opus-4-search",
"anthropic/claude-opus-4.1",
"anthropic/claude-sonnet-3.5",
"anthropic/claude-sonnet-3.5-june",
"anthropic/claude-sonnet-3.7",
"anthropic/claude-sonnet-3.7-reasoning",
"anthropic/claude-sonnet-3.7-search",
"anthropic/claude-sonnet-4",
"anthropic/claude-sonnet-4-reasoning",
"anthropic/claude-sonnet-4-search",
"anthropic/claude-sonnet-4.5",
"elevenlabs/elevenlabs-music",
"elevenlabs/elevenlabs-v2.5-turbo",
"elevenlabs/elevenlabs-v3",
"facebook/llama-3.1-405b",
"facebook/llama-3.1-70b",
"facebook/llama-3.1-8b",
"google/gemini-2.0-flash",
"google/gemini-2.0-flash-lite",
"google/gemini-2.5-flash",
"google/gemini-2.5-flash-lite",
"google/gemini-2.5-pro",
"google/gemini-3.0-pro",
"google/imagen-3",
"google/imagen-3-fast",
"google/imagen-4",
"google/imagen-4-fast",
"google/imagen-4-ultra",
"google/lyria",
"google/nano-banana",
"google/veo-2",
"google/veo-3",
"google/veo-3-fast",
"google/veo-3.1",
"google/veo-3.1-fast",
"ideogramai/ideogram",
"ideogramai/ideogram-v2",
"ideogramai/ideogram-v2a",
"ideogramai/ideogram-v2a-turbo",
"lumalabs/dream-machine",
"lumalabs/ray2",
"novita/glm-4.6",
"openAi/chatgpt-4o-latest",
"openAi/dall-e-3",
"openAi/gpt-3.5-turbo",
"openAi/gpt-3.5-turbo-instruct",
"openAi/gpt-3.5-turbo-raw",
"openAi/gpt-4-classic",
"openAi/gpt-4-classic-0314",
"openAi/gpt-4-turbo",
"openAi/gpt-4.1",
"openAi/gpt-4.1-mini",
"openAi/gpt-4.1-nano",
"openAi/gpt-4o",
"openAi/gpt-4o-aug",
"openAi/gpt-4o-mini",
"openAi/gpt-4o-mini-search",
"openAi/gpt-4o-search",
"openAi/gpt-5",
"openAi/gpt-5-chat",
"openAi/gpt-5-codex",
"openAi/gpt-5-mini",
"openAi/gpt-5-nano",
"openAi/gpt-5-pro",
"openAi/gpt-image-1",
"openAi/gpt-image-1-mini",
"openAi/o1",
"openAi/o1-pro",
"openAi/o3",
"openAi/o3-deep-research",
"openAi/o3-mini",
"openAi/o3-mini-high",
"openAi/o3-pro",
"openAi/o4-mini",
"openAi/o4-mini-deep-research",
"openAi/sora-2",
"openAi/sora-2-pro",
"openai/gpt-5.1",
"openai/gpt-5.1-codex",
"openai/gpt-5.1-