@juspay/neurolink
Version:
Universal AI Development Platform with working MCP integration, multi-provider support, voice (TTS/STT/realtime), and professional CLI. 58+ external MCP servers discoverable, multimodal file processing, RAG pipelines. Build, test, and deploy AI applications.
955 lines (954 loc) • 40.8 kB
TypeScript
/**
 * Names of the AI providers known to this package.
 *
 * Every member's value is the lowercase, hyphen-separated spelling of the
 * provider name (for example `OPENAI_COMPATIBLE` is "openai-compatible").
 *
 * NOTE(review): `AUTO` presumably requests automatic provider selection —
 * confirm against the runtime implementation.
 */
export declare enum AIProviderName {
  BEDROCK = "bedrock",
  OPENAI = "openai",
  OPENAI_COMPATIBLE = "openai-compatible",
  OPENROUTER = "openrouter",
  VERTEX = "vertex",
  ANTHROPIC = "anthropic",
  AZURE = "azure",
  GOOGLE_AI = "google-ai",
  HUGGINGFACE = "huggingface",
  OLLAMA = "ollama",
  MISTRAL = "mistral",
  LITELLM = "litellm",
  SAGEMAKER = "sagemaker",
  DEEPSEEK = "deepseek",
  NVIDIA_NIM = "nvidia-nim",
  LM_STUDIO = "lm-studio",
  LLAMACPP = "llamacpp",
  XAI = "xai",
  GROQ = "groq",
  COHERE = "cohere",
  TOGETHER_AI = "together-ai",
  FIREWORKS = "fireworks",
  PERPLEXITY = "perplexity",
  CLOUDFLARE = "cloudflare",
  REPLICATE = "replicate",
  VOYAGE = "voyage",
  JINA = "jina",
  STABILITY = "stability",
  IDEOGRAM = "ideogram",
  RECRAFT = "recraft",
  AUTO = "auto",
}
/**
 * A selection of popular OpenRouter model ids (300+ are listed at
 * openrouter.ai/models).
 *
 * OpenRouter ids follow the 'provider/model' format.
 *
 * NOTE(review): `CLAUDE_3_5_HAIKU` spells the version "3-5" while
 * `CLAUDE_3_7_SONNET` uses "3.7", and `GROK_4_1_FAST` uses the vendor
 * prefix "xai/" — confirm both against the OpenRouter catalog.
 */
export declare enum OpenRouterModels {
  // anthropic/*
  CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4.6",
  CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4.6",
  CLAUDE_SONNET_4_5 = "anthropic/claude-sonnet-4.5",
  CLAUDE_HAIKU_4_5 = "anthropic/claude-haiku-4.5",
  CLAUDE_3_7_SONNET = "anthropic/claude-3.7-sonnet",
  CLAUDE_3_5_HAIKU = "anthropic/claude-3-5-haiku",
  CLAUDE_3_OPUS = "anthropic/claude-3-opus",

  // openai/*
  GPT_5_2 = "openai/gpt-5.2",
  GPT_5 = "openai/gpt-5",
  GPT_4O = "openai/gpt-4o",
  GPT_4O_MINI = "openai/gpt-4o-mini",
  GPT_4_TURBO = "openai/gpt-4-turbo",

  // google/*
  GEMINI_3_1_PRO_PREVIEW = "google/gemini-3.1-pro-preview",
  GEMINI_3_FLASH_PREVIEW = "google/gemini-3-flash-preview",
  GEMINI_2_5_FLASH = "google/gemini-2.5-flash",
  GEMINI_2_5_FLASH_LITE = "google/gemini-2.5-flash-lite",
  GEMINI_2_0_FLASH = "google/gemini-2.0-flash",

  // meta-llama/*
  LLAMA_3_1_70B = "meta-llama/llama-3.1-70b-instruct",
  LLAMA_3_1_8B = "meta-llama/llama-3.1-8b-instruct",

  // mistralai/*
  MISTRAL_LARGE = "mistralai/mistral-large",
  MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct",

  // other vendors
  DEEPSEEK_R1 = "deepseek/deepseek-r1",
  GROK_4_1_FAST = "xai/grok-4.1-fast",
}
/**
 * Model ids for Amazon Bedrock.
 *
 * Values are prefixed with the model vendor ("anthropic.", "amazon.",
 * "meta.", …); many, but not all, carry a ":<n>" version suffix.
 *
 * NOTE(review): a few entries look inconsistent and should be confirmed
 * against the Bedrock model catalog:
 *  - `CLAUDE_4_5_OPUS` is stamped "20251124", whereas
 *    `AnthropicModels.CLAUDE_OPUS_4_5` is stamped "20251101".
 *  - `MIXTRAL_8x7B` has a lowercase "x" in its member name, unlike the
 *    `MIXTRAL_8X7B` spelling used by other enums in this file.
 *  - `KIMI_K2_THINKING` uses the prefix "moonshot." while `KIMI_K2_5`
 *    uses "moonshotai.".
 */
export declare enum BedrockModels {
  // --- Anthropic Claude ---
  CLAUDE_4_6_OPUS = "anthropic.claude-opus-4-6-v1:0",
  CLAUDE_4_6_SONNET = "anthropic.claude-sonnet-4-6",
  CLAUDE_4_5_OPUS = "anthropic.claude-opus-4-5-20251124-v1:0",
  CLAUDE_4_5_SONNET = "anthropic.claude-sonnet-4-5-20250929-v1:0",
  CLAUDE_4_5_HAIKU = "anthropic.claude-haiku-4-5-20251001-v1:0",
  CLAUDE_4_1_OPUS = "anthropic.claude-opus-4-1-20250805-v1:0",
  CLAUDE_4_SONNET = "anthropic.claude-sonnet-4-20250514-v1:0",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_7_SONNET = "anthropic.claude-3-7-sonnet-20250219-v1:0",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_5_SONNET = "anthropic.claude-3-5-sonnet-20241022-v1:0",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_5_HAIKU = "anthropic.claude-3-5-haiku-20241022-v1:0",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_SONNET = "anthropic.claude-3-sonnet-20240229-v1:0",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_HAIKU = "anthropic.claude-3-haiku-20240307-v1:0",

  // --- Amazon Nova ---
  NOVA_PREMIER = "amazon.nova-premier-v1:0",
  NOVA_PRO = "amazon.nova-pro-v1:0",
  NOVA_LITE = "amazon.nova-lite-v1:0",
  NOVA_MICRO = "amazon.nova-micro-v1:0",
  NOVA_2_LITE = "amazon.nova-2-lite-v1:0",
  NOVA_2_SONIC = "amazon.nova-2-sonic-v1:0",
  NOVA_SONIC = "amazon.nova-sonic-v1:0",
  NOVA_CANVAS = "amazon.nova-canvas-v1:0",
  NOVA_REEL = "amazon.nova-reel-v1:0",
  NOVA_REEL_V1_1 = "amazon.nova-reel-v1:1",
  NOVA_MULTIMODAL_EMBEDDINGS = "amazon.nova-2-multimodal-embeddings-v1:0",

  // --- Amazon Titan ---
  TITAN_TEXT_LARGE = "amazon.titan-tg1-large",
  TITAN_EMBED_TEXT_V2 = "amazon.titan-embed-text-v2:0",
  TITAN_EMBED_TEXT_V1 = "amazon.titan-embed-text-v1",
  TITAN_EMBED_G1_TEXT_02 = "amazon.titan-embed-g1-text-02",
  TITAN_EMBED_IMAGE_V1 = "amazon.titan-embed-image-v1",
  TITAN_IMAGE_GENERATOR_V2 = "amazon.titan-image-generator-v2:0",

  // --- Meta Llama ---
  LLAMA_4_MAVERICK_17B = "meta.llama4-maverick-17b-instruct-v1:0",
  LLAMA_4_SCOUT_17B = "meta.llama4-scout-17b-instruct-v1:0",
  LLAMA_3_3_70B = "meta.llama3-3-70b-instruct-v1:0",
  LLAMA_3_2_90B = "meta.llama3-2-90b-instruct-v1:0",
  LLAMA_3_2_11B = "meta.llama3-2-11b-instruct-v1:0",
  LLAMA_3_2_3B = "meta.llama3-2-3b-instruct-v1:0",
  LLAMA_3_2_1B = "meta.llama3-2-1b-instruct-v1:0",
  LLAMA_3_1_405B = "meta.llama3-1-405b-instruct-v1:0",
  LLAMA_3_1_70B = "meta.llama3-1-70b-instruct-v1:0",
  LLAMA_3_1_8B = "meta.llama3-1-8b-instruct-v1:0",
  LLAMA_3_70B = "meta.llama3-70b-instruct-v1:0",
  LLAMA_3_8B = "meta.llama3-8b-instruct-v1:0",

  // --- Mistral ---
  MISTRAL_LARGE_3 = "mistral.mistral-large-3-675b-instruct",
  MISTRAL_LARGE_2407 = "mistral.mistral-large-2407-v1:0",
  MISTRAL_LARGE_2402 = "mistral.mistral-large-2402-v1:0",
  MAGISTRAL_SMALL_2509 = "mistral.magistral-small-2509",
  MINISTRAL_3_14B = "mistral.ministral-3-14b-instruct",
  MINISTRAL_3_8B = "mistral.ministral-3-8b-instruct",
  MINISTRAL_3_3B = "mistral.ministral-3-3b-instruct",
  MISTRAL_7B = "mistral.mistral-7b-instruct-v0:2",
  MIXTRAL_8x7B = "mistral.mixtral-8x7b-instruct-v0:1",
  PIXTRAL_LARGE_2502 = "mistral.pixtral-large-2502-v1:0",
  VOXTRAL_SMALL_24B = "mistral.voxtral-small-24b-2507",
  VOXTRAL_MINI_3B = "mistral.voxtral-mini-3b-2507",

  // --- Cohere Command ---
  COHERE_COMMAND_R_PLUS = "cohere.command-r-plus-v1:0",
  COHERE_COMMAND_R = "cohere.command-r-v1:0",

  // --- DeepSeek ---
  DEEPSEEK_R1 = "deepseek.r1-v1:0",
  DEEPSEEK_V3 = "deepseek.v3-v1:0",

  // --- Qwen ---
  QWEN_3_235B_A22B = "qwen.qwen3-235b-a22b-2507-v1:0",
  QWEN_3_CODER_480B_A35B = "qwen.qwen3-coder-480b-a35b-v1:0",
  QWEN_3_CODER_30B_A3B = "qwen.qwen3-coder-30b-a3b-v1:0",
  QWEN_3_32B = "qwen.qwen3-32b-v1:0",
  QWEN_3_NEXT_80B_A3B = "qwen.qwen3-next-80b-a3b",
  QWEN_3_VL_235B_A22B = "qwen.qwen3-vl-235b-a22b",

  // --- Google Gemma ---
  GEMMA_3_27B_IT = "google.gemma-3-27b-it",
  GEMMA_3_12B_IT = "google.gemma-3-12b-it",
  GEMMA_3_4B_IT = "google.gemma-3-4b-it",

  // --- AI21 Jamba ---
  JAMBA_1_5_LARGE = "ai21.jamba-1-5-large-v1:0",
  JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0",

  // --- Writer Palmyra ---
  WRITER_PALMYRA_X5 = "writer.palmyra-x5-v1:0",
  WRITER_PALMYRA_X4 = "writer.palmyra-x4-v1:0",

  // --- MiniMax ---
  MINIMAX_M2_1 = "minimax.minimax-m2.1",
  MINIMAX_M2 = "minimax.minimax-m2",

  // --- Moonshot Kimi ---
  KIMI_K2_THINKING = "moonshot.kimi-k2-thinking",
  KIMI_K2_5 = "moonshotai.kimi-k2.5",

  // --- NVIDIA Nemotron ---
  NVIDIA_NEMOTRON_NANO_3_30B = "nvidia.nemotron-nano-3-30b",
  NVIDIA_NEMOTRON_NANO_12B_V2 = "nvidia.nemotron-nano-12b-v2",
  NVIDIA_NEMOTRON_NANO_9B_V2 = "nvidia.nemotron-nano-9b-v2",

  // --- OpenAI GPT-OSS ---
  OPENAI_GPT_OSS_120B = "openai.gpt-oss-120b-1:0",
  OPENAI_GPT_OSS_20B = "openai.gpt-oss-20b-1:0",

  // --- Z.ai GLM ---
  GLM_4_7 = "zai.glm-4.7",
  GLM_4_7_FLASH = "zai.glm-4.7-flash",

  // --- Embedding / rerank ids ---
  COHERE_EMBED_ENGLISH_V3 = "cohere.embed-english-v3",
  COHERE_EMBED_MULTILINGUAL_V3 = "cohere.embed-multilingual-v3",
  COHERE_EMBED_V4 = "cohere.embed-v4:0",
  COHERE_RERANK_V3_5 = "cohere.rerank-v3-5:0",
  AMAZON_RERANK_V1 = "amazon.rerank-v1:0",

  // --- Mistral Devstral ---
  DEVSTRAL_2_123B = "mistral.devstral-2-123b",
}
/**
 * Model ids for OpenAI.
 *
 * Values are the bare model names (no vendor prefix). Members tagged
 * `@deprecated` carry their own migration hint.
 */
export declare enum OpenAIModels {
  // --- GPT-5.x ---
  GPT_5_3_CODEX = "gpt-5.3-codex",
  GPT_5_4 = "gpt-5.4",
  GPT_5_4_MINI = "gpt-5.4-mini",
  GPT_5_4_NANO = "gpt-5.4-nano",
  GPT_5_4_PRO = "gpt-5.4-pro",
  GPT_5_2 = "gpt-5.2",
  GPT_5_2_CHAT_LATEST = "gpt-5.2-chat-latest",
  GPT_5_2_PRO = "gpt-5.2-pro",
  GPT_5_2_CODEX = "gpt-5.2-codex",
  GPT_5_1 = "gpt-5.1",
  GPT_5_1_CHAT_LATEST = "gpt-5.1-chat-latest",
  GPT_5_1_CODEX = "gpt-5.1-codex",
  GPT_5_1_CODEX_MAX = "gpt-5.1-codex-max",
  GPT_5_1_CODEX_MINI = "gpt-5.1-codex-mini",

  // --- GPT-5 ---
  GPT_5 = "gpt-5",
  GPT_5_MINI = "gpt-5-mini",
  GPT_5_NANO = "gpt-5-nano",
  GPT_5_PRO = "gpt-5-pro",
  GPT_5_CHAT_LATEST = "gpt-5-chat-latest",
  GPT_5_CODEX = "gpt-5-codex",

  // --- GPT-OSS ---
  GPT_OSS_120B = "gpt-oss-120b",
  GPT_OSS_20B = "gpt-oss-20b",

  // --- GPT-4.1 / GPT-4o ---
  GPT_4_1 = "gpt-4.1",
  GPT_4_1_MINI = "gpt-4.1-mini",
  GPT_4_1_NANO = "gpt-4.1-nano",
  GPT_4O = "gpt-4o",
  GPT_4O_MINI = "gpt-4o-mini",

  // --- o-series ---
  O3 = "o3",
  O3_MINI = "o3-mini",
  O3_PRO = "o3-pro",
  O4_MINI = "o4-mini",
  O1 = "o1",
  /** @deprecated Turned off Jul 14, 2025. Use GPT_4_1 or O3. */
  O1_PREVIEW = "o1-preview",
  /** @deprecated Replaced by o3-mini. */
  O1_MINI = "o1-mini",

  // --- GPT-4 / GPT-3.5 ---
  GPT_4 = "gpt-4",
  GPT_4_TURBO = "gpt-4-turbo",
  GPT_3_5_TURBO = "gpt-3.5-turbo",

  // --- Image models ---
  GPT_IMAGE_1 = "gpt-image-1",
  DALL_E_3 = "dall-e-3",
  DALL_E_2 = "dall-e-2",
}
/**
 * Model identifiers for Azure OpenAI.
 *
 * Azure addresses models through deployment names; the values here are
 * model identifiers, not deployment names. The GPT-3.5 entries are
 * spelled "gpt-35-…" (no dot).
 *
 * NOTE(review): `O1_MINI` and `O1_PREVIEW` carry no `@deprecated` tag here
 * although `OpenAIModels` marks the same ids deprecated — confirm whether
 * that difference is intentional.
 */
export declare enum AzureOpenAIModels {
  // --- GPT-5.4 ---
  GPT_5_4 = "gpt-5.4",
  GPT_5_4_MINI = "gpt-5.4-mini",
  GPT_5_4_NANO = "gpt-5.4-nano",

  // --- GPT-5.2 ---
  GPT_5_2 = "gpt-5.2",
  GPT_5_2_CHAT = "gpt-5.2-chat",
  GPT_5_2_PRO = "gpt-5.2-pro",
  GPT_5_2_CODEX = "gpt-5.2-codex",

  // --- GPT-5.1 ---
  GPT_5_1 = "gpt-5.1",
  GPT_5_1_CHAT = "gpt-5.1-chat",
  GPT_5_1_CODEX = "gpt-5.1-codex",
  GPT_5_1_CODEX_MINI = "gpt-5.1-codex-mini",
  GPT_5_1_CODEX_MAX = "gpt-5.1-codex-max",

  // --- GPT-5 ---
  GPT_5 = "gpt-5",
  GPT_5_MINI = "gpt-5-mini",
  GPT_5_NANO = "gpt-5-nano",
  GPT_5_CHAT = "gpt-5-chat",
  GPT_5_CODEX = "gpt-5-codex",
  GPT_5_PRO = "gpt-5-pro",
  GPT_5_TURBO = "gpt-5-turbo",

  // --- o-series ---
  O4_MINI = "o4-mini",
  O3 = "o3",
  O3_MINI = "o3-mini",
  O3_PRO = "o3-pro",
  O1 = "o1",
  O1_MINI = "o1-mini",
  O1_PREVIEW = "o1-preview",

  // --- Codex ---
  CODEX_MINI = "codex-mini",

  // --- GPT-4.1 / GPT-4o ---
  GPT_4_1 = "gpt-4.1",
  GPT_4_1_NANO = "gpt-4.1-nano",
  GPT_4_1_MINI = "gpt-4.1-mini",
  GPT_4O = "gpt-4o",
  GPT_4O_MINI = "gpt-4o-mini",

  // --- GPT-4 ---
  GPT_4_TURBO = "gpt-4-turbo",
  GPT_4 = "gpt-4",
  GPT_4_32K = "gpt-4-32k",

  // --- GPT-3.5 ---
  GPT_3_5_TURBO = "gpt-35-turbo",
  GPT_3_5_TURBO_INSTRUCT = "gpt-35-turbo-instruct",
}
/**
 * Model ids for Google Vertex AI.
 *
 * Holds both Claude ids and Gemini ids. Several Claude values attach
 * their date stamp with "@", while the deprecated Claude 3 / 3.5 values
 * use a "-" separator.
 *
 * NOTE(review): `CLAUDE_4_5_OPUS` is stamped "20251124" whereas
 * `AnthropicModels.CLAUDE_OPUS_4_5` is stamped "20251101" — confirm which
 * date is correct for Vertex.
 */
export declare enum VertexModels {
  // --- Claude ---
  CLAUDE_4_6_OPUS = "claude-opus-4-6",
  CLAUDE_4_6_SONNET = "claude-sonnet-4-6",
  CLAUDE_4_5_OPUS = "claude-opus-4-5@20251124",
  CLAUDE_4_5_SONNET = "claude-sonnet-4-5@20250929",
  CLAUDE_4_5_HAIKU = "claude-haiku-4-5@20251001",
  CLAUDE_4_0_SONNET = "claude-sonnet-4@20250514",
  CLAUDE_4_0_OPUS = "claude-opus-4@20250514",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_7_SONNET = "claude-3-7-sonnet@20250219",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_5_SONNET = "claude-3-5-sonnet-20241022",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_5_HAIKU = "claude-3-5-haiku-20241022",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_SONNET = "claude-3-sonnet-20240229",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_OPUS = "claude-3-opus-20240229",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
  CLAUDE_3_HAIKU = "claude-3-haiku-20240307",

  // --- Gemini 3.x ---
  GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
  GEMINI_3_1_FLASH_LITE_PREVIEW = "gemini-3.1-flash-lite-preview",
  GEMINI_3_1_FLASH_IMAGE_PREVIEW = "gemini-3.1-flash-image-preview",
  GEMINI_3_1_PRO_PREVIEW_CUSTOMTOOLS = "gemini-3.1-pro-preview-customtools",
  GEMINI_3_FLASH_PREVIEW = "gemini-3-flash-preview",
  GEMINI_3_PRO_IMAGE_PREVIEW = "gemini-3-pro-image-preview",
  /** @deprecated SHUT DOWN March 9, 2026. Migrate to GEMINI_3_1_PRO_PREVIEW. */
  GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",

  // --- Gemini 2.x ---
  GEMINI_2_5_PRO = "gemini-2.5-pro",
  GEMINI_2_5_FLASH = "gemini-2.5-flash",
  GEMINI_2_5_FLASH_LITE = "gemini-2.5-flash-lite",
  GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
  GEMINI_2_0_FLASH = "gemini-2.0-flash",
  GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
  GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",

  // --- Gemini 1.5 ---
  /** @deprecated SHUT DOWN. Returns 404. Use GEMINI_2_5_FLASH or newer. */
  GEMINI_1_5_PRO = "gemini-1.5-pro-002",
  /** @deprecated SHUT DOWN. Returns 404. Use GEMINI_2_5_FLASH or newer. */
  GEMINI_1_5_FLASH = "gemini-1.5-flash-002",
}
/**
 * Model ids for Google AI Studio.
 *
 * Includes Gemini generation, TTS and embedding ids. Members tagged
 * `@deprecated` state their shutdown status and replacement.
 *
 * NOTE(review): only the bare `GEMINI_2_0_FLASH` carries a retirement
 * notice; the other "gemini-2.0-*" entries are untagged — confirm whether
 * they retire at the same time.
 */
export declare enum GoogleAIModels {
  // --- Gemini 3.x ---
  GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
  GEMINI_3_1_FLASH_LITE_PREVIEW = "gemini-3.1-flash-lite-preview",
  GEMINI_3_1_FLASH_IMAGE_PREVIEW = "gemini-3.1-flash-image-preview",
  GEMINI_3_1_PRO_PREVIEW_CUSTOMTOOLS = "gemini-3.1-pro-preview-customtools",
  GEMINI_3_FLASH_PREVIEW = "gemini-3-flash-preview",
  GEMINI_3_PRO_IMAGE_PREVIEW = "gemini-3-pro-image-preview",
  /** @deprecated SHUT DOWN March 9, 2026. Migrate to GEMINI_3_1_PRO_PREVIEW. */
  GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",

  // --- Gemini 2.5 ---
  GEMINI_2_5_PRO = "gemini-2.5-pro",
  GEMINI_2_5_FLASH = "gemini-2.5-flash",
  GEMINI_2_5_FLASH_LITE = "gemini-2.5-flash-lite",
  GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
  GEMINI_2_5_FLASH_PREVIEW_TTS = "gemini-2.5-flash-preview-tts",
  GEMINI_2_5_PRO_PREVIEW_TTS = "gemini-2.5-pro-preview-tts",

  // --- Gemini 2.0 ---
  /** @deprecated Retiring June 1, 2026. Use GEMINI_2_5_FLASH instead. */
  GEMINI_2_0_FLASH = "gemini-2.0-flash",
  GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
  GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
  GEMINI_2_0_FLASH_IMAGE = "gemini-2.0-flash-preview-image-generation",

  // --- Gemini 1.5 ---
  /** @deprecated SHUT DOWN. Returns 404. Use GEMINI_2_5_FLASH or newer. */
  GEMINI_1_5_PRO = "gemini-1.5-pro",
  /** @deprecated SHUT DOWN. Returns 404. Use GEMINI_2_5_FLASH or newer. */
  GEMINI_1_5_FLASH = "gemini-1.5-flash",

  // --- Embeddings ---
  GEMINI_EMBEDDING = "gemini-embedding-001",
  GEMINI_EMBEDDING_2_PREVIEW = "gemini-embedding-2-preview",
  /** @deprecated SHUT DOWN Jan 14, 2026. Use GEMINI_EMBEDDING instead. */
  TEXT_EMBEDDING_004 = "text-embedding-004",
}
/**
 * Model ids for the Anthropic direct API.
 *
 * NOTE(review): member naming is mixed — most entries put the family
 * first (`CLAUDE_OPUS_4_6`), while `CLAUDE_4_5_HAIKU` and the Claude 3.x
 * entries put the version first. The names are public API, so they are
 * left untouched here.
 */
export declare enum AnthropicModels {
  // --- Claude 4.x ---
  CLAUDE_OPUS_4_6 = "claude-opus-4-6",
  CLAUDE_SONNET_4_6 = "claude-sonnet-4-6",
  CLAUDE_OPUS_4_5 = "claude-opus-4-5-20251101",
  CLAUDE_SONNET_4_5 = "claude-sonnet-4-5-20250929",
  CLAUDE_4_5_HAIKU = "claude-haiku-4-5-20251001",
  CLAUDE_OPUS_4_1 = "claude-opus-4-1-20250805",
  CLAUDE_OPUS_4_0 = "claude-opus-4-20250514",
  CLAUDE_SONNET_4_0 = "claude-sonnet-4-20250514",

  // --- Claude 3.x (all deprecated) ---
  /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
  CLAUDE_SONNET_3_7 = "claude-3-7-sonnet-20250219",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
  CLAUDE_3_5_SONNET = "claude-3-5-sonnet-20241022",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
  CLAUDE_3_5_HAIKU = "claude-3-5-haiku-20241022",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
  CLAUDE_3_SONNET = "claude-3-sonnet-20240229",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
  CLAUDE_3_OPUS = "claude-3-opus-20240229",
  /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
  CLAUDE_3_HAIKU = "claude-3-haiku-20240307",
}
/**
 * Model ids for Mistral AI.
 *
 * Values are either a "-latest" alias, a name with a four-digit stamp
 * (e.g. "mistral-large-2512"), or an unversioned name such as
 * "mistral-embed".
 */
export declare enum MistralModels {
  // --- Mistral Large / Medium / Small ---
  MISTRAL_LARGE_LATEST = "mistral-large-latest",
  MISTRAL_LARGE_2512 = "mistral-large-2512",
  MISTRAL_MEDIUM_LATEST = "mistral-medium-latest",
  MISTRAL_MEDIUM_2508 = "mistral-medium-2508",
  MISTRAL_SMALL_LATEST = "mistral-small-latest",
  MISTRAL_SMALL_2506 = "mistral-small-2506",

  // --- Magistral / Ministral ---
  MAGISTRAL_MEDIUM_LATEST = "magistral-medium-latest",
  MAGISTRAL_SMALL_LATEST = "magistral-small-latest",
  MINISTRAL_14B_2512 = "ministral-14b-2512",
  MINISTRAL_8B_2512 = "ministral-8b-2512",
  MINISTRAL_3B_2512 = "ministral-3b-2512",

  // --- Codestral / Devstral ---
  CODESTRAL_LATEST = "codestral-latest",
  CODESTRAL_2508 = "codestral-2508",
  CODESTRAL_EMBED = "codestral-embed",
  DEVSTRAL_MEDIUM_LATEST = "devstral-medium-latest",
  DEVSTRAL_SMALL_LATEST = "devstral-small-latest",

  // --- Pixtral / Voxtral ---
  PIXTRAL_LARGE = "pixtral-large",
  PIXTRAL_12B = "pixtral-12b",
  VOXTRAL_SMALL_LATEST = "voxtral-small-latest",
  VOXTRAL_MINI_LATEST = "voxtral-mini-latest",

  // --- Further stamped releases ---
  DEVSTRAL_2 = "devstral-2512",
  DEVSTRAL_SMALL_2 = "devstral-small-2512",
  MAGISTRAL_MEDIUM_2509 = "magistral-medium-2509",
  MAGISTRAL_SMALL_2509 = "magistral-small-2509",
  VOXTRAL_MINI_TRANSCRIBE_2 = "voxtral-mini-2602",

  // --- OCR, embeddings, moderation and others ---
  MISTRAL_OCR_3 = "mistral-ocr-2512",
  MISTRAL_OCR_LATEST = "mistral-ocr-latest",
  MISTRAL_NEMO = "mistral-nemo",
  MISTRAL_EMBED = "mistral-embed",
  MISTRAL_MODERATION_LATEST = "mistral-moderation-latest",
  MISTRAL_SMALL_4 = "mistral-small-2603",
  MISTRAL_SMALL_CREATIVE = "mistral-small-creative",
}
/**
 * Model ids for Ollama (local).
 *
 * Every model listed here can be run locally, with no API key or cloud
 * service required. Values use the "name:tag" form, where the tag is
 * either a size (e.g. "8b"), a variant (e.g. "scout", "mini") or "latest".
 */
export declare enum OllamaModels {
  // --- Llama ---
  LLAMA4_SCOUT = "llama4:scout",
  LLAMA4_MAVERICK = "llama4:maverick",
  LLAMA4_LATEST = "llama4:latest",
  LLAMA3_3_LATEST = "llama3.3:latest",
  LLAMA3_3_70B = "llama3.3:70b",
  LLAMA3_2_LATEST = "llama3.2:latest",
  LLAMA3_2_3B = "llama3.2:3b",
  LLAMA3_2_1B = "llama3.2:1b",
  LLAMA3_1_8B = "llama3.1:8b",
  LLAMA3_1_70B = "llama3.1:70b",
  LLAMA3_1_405B = "llama3.1:405b",

  // --- Qwen / QwQ ---
  QWEN3_4B = "qwen3:4b",
  QWEN3_8B = "qwen3:8b",
  QWEN3_14B = "qwen3:14b",
  QWEN3_32B = "qwen3:32b",
  QWEN3_72B = "qwen3:72b",
  QWEN2_5_3B = "qwen2.5:3b",
  QWEN2_5_7B = "qwen2.5:7b",
  QWEN2_5_14B = "qwen2.5:14b",
  QWEN2_5_32B = "qwen2.5:32b",
  QWEN2_5_72B = "qwen2.5:72b",
  QWQ_32B = "qwq:32b",
  QWQ_LATEST = "qwq:latest",

  // --- DeepSeek ---
  DEEPSEEK_R1_1_5B = "deepseek-r1:1.5b",
  DEEPSEEK_R1_7B = "deepseek-r1:7b",
  DEEPSEEK_R1_8B = "deepseek-r1:8b",
  DEEPSEEK_R1_14B = "deepseek-r1:14b",
  DEEPSEEK_R1_32B = "deepseek-r1:32b",
  DEEPSEEK_R1_70B = "deepseek-r1:70b",
  DEEPSEEK_V3_671B = "deepseek-v3:671b",
  DEEPSEEK_V3_LATEST = "deepseek-v3:latest",

  // --- Mistral ---
  MISTRAL_LATEST = "mistral:latest",
  MISTRAL_7B = "mistral:7b",
  MISTRAL_SMALL_LATEST = "mistral-small:latest",
  MISTRAL_NEMO_LATEST = "mistral-nemo:latest",
  MISTRAL_LARGE_LATEST = "mistral-large:latest",

  // --- Gemma ---
  GEMMA3_LATEST = "gemma3:latest",
  GEMMA2_2B = "gemma2:2b",
  GEMMA2_9B = "gemma2:9b",
  GEMMA2_27B = "gemma2:27b",

  // --- Phi ---
  PHI4_LATEST = "phi4:latest",
  PHI4_14B = "phi4:14b",
  PHI3_MINI = "phi3:mini",
  PHI3_3_8B = "phi3:3.8b",
  PHI3_MEDIUM = "phi3:medium",
  PHI3_14B = "phi3:14b",

  // --- LLaVA ---
  LLAVA_7B = "llava:7b",
  LLAVA_13B = "llava:13b",
  LLAVA_34B = "llava:34b",
  LLAVA_LLAMA3_8B = "llava-llama3:8b",

  // --- Code models ---
  CODELLAMA_7B = "codellama:7b",
  CODELLAMA_13B = "codellama:13b",
  CODELLAMA_34B = "codellama:34b",
  CODELLAMA_70B = "codellama:70b",
  QWEN2_5_CODER_7B = "qwen2.5-coder:7b",
  QWEN2_5_CODER_32B = "qwen2.5-coder:32b",
  STARCODER2_3B = "starcoder2:3b",
  STARCODER2_7B = "starcoder2:7b",
  STARCODER2_15B = "starcoder2:15b",

  // --- Mixtral / Command R ---
  MIXTRAL_8X7B = "mixtral:8x7b",
  MIXTRAL_8X22B = "mixtral:8x22b",
  COMMAND_R_PLUS = "command-r-plus:104b",

  // --- Further entries ---
  GLM_5_LATEST = "glm-5:latest",
  KIMI_K2_5_LATEST = "kimi-k2.5:latest",
  QWEN3_5_LATEST = "qwen3.5:latest",
  QWEN3_CODER_LATEST = "qwen3-coder:latest",
  QWEN3_CODER_30B = "qwen3-coder:30b",
  DEEPSEEK_V3_2_LATEST = "deepseek-v3.2:latest",
  NEMOTRON_3_NANO_LATEST = "nemotron-3-nano:latest",
  NEMOTRON_3_NANO_30B = "nemotron-3-nano:30b",
  SMOLLM3_3B = "smollm3:3b",
  GPT_OSS_LATEST = "gpt-oss:latest",
}
/**
 * Commonly used model ids for a LiteLLM proxy.
 *
 * LiteLLM exposes 100+ models behind one unified proxy interface; ids
 * carry a provider-specific prefix such as "openai/" or "anthropic/".
 * Members are grouped below by that prefix.
 *
 * NOTE(review): the "gemini-1.5-*" ids listed here are marked as shut
 * down in `GoogleAIModels` — confirm whether they still resolve through
 * a LiteLLM proxy.
 */
export declare enum LiteLLMModels {
  // --- openai/ ---
  OPENAI_GPT_5_2 = "openai/gpt-5.2",
  OPENAI_GPT_5_2_CODEX = "openai/gpt-5.2-codex",
  OPENAI_GPT_5 = "openai/gpt-5",
  OPENAI_GPT_4O = "openai/gpt-4o",
  OPENAI_GPT_4O_MINI = "openai/gpt-4o-mini",
  OPENAI_GPT_4_TURBO = "openai/gpt-4-turbo",
  OPENAI_GPT_4 = "openai/gpt-4",
  OPENAI_GPT_3_5_TURBO = "openai/gpt-3.5-turbo",

  // --- anthropic/ ---
  ANTHROPIC_CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4-6",
  ANTHROPIC_CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4-6",
  ANTHROPIC_CLAUDE_SONNET_4_5 = "anthropic/claude-sonnet-4-5-20250929",
  ANTHROPIC_CLAUDE_OPUS_4_1 = "anthropic/claude-opus-4-1-20250805",
  ANTHROPIC_CLAUDE_3_5_SONNET = "anthropic/claude-3-5-sonnet-20240620",
  ANTHROPIC_CLAUDE_3_HAIKU = "anthropic/claude-3-haiku-20240307",

  // --- vertex_ai/ ---
  VERTEX_GEMINI_2_5_PRO = "vertex_ai/gemini-2.5-pro",
  VERTEX_GEMINI_1_5_PRO = "vertex_ai/gemini-1.5-pro",
  VERTEX_GEMINI_1_5_FLASH = "vertex_ai/gemini-1.5-flash",

  // --- gemini/ ---
  GEMINI_3_1_PRO = "gemini/gemini-3.1-pro-preview",
  GEMINI_2_5_PRO = "gemini/gemini-2.5-pro",
  GEMINI_2_0_FLASH = "gemini/gemini-2.0-flash",
  GEMINI_1_5_PRO = "gemini/gemini-1.5-pro",
  GEMINI_1_5_FLASH = "gemini/gemini-1.5-flash",

  // --- groq/ ---
  GROQ_LLAMA_3_1_70B_VERSATILE = "groq/llama-3.1-70b-versatile",
  GROQ_LLAMA_3_1_8B_INSTANT = "groq/llama-3.1-8b-instant",
  GROQ_LLAMA_3_2_11B_VISION = "groq/llama-3.2-11b-vision-preview",
  GROQ_MIXTRAL_8X7B = "groq/mixtral-8x7b-32768",

  // --- together_ai/ ---
  TOGETHER_LLAMA_2_70B_CHAT = "together_ai/togethercomputer/llama-2-70b-chat",
  TOGETHER_MIXTRAL_8X7B = "together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1",
  TOGETHER_CODELLAMA_34B = "together_ai/codellama/CodeLlama-34b-Instruct-hf",

  // --- deepinfra/ ---
  DEEPINFRA_LLAMA_3_70B = "deepinfra/meta-llama/Meta-Llama-3-70B-Instruct",
  DEEPINFRA_LLAMA_2_70B = "deepinfra/meta-llama/Llama-2-70b-chat-hf",
  DEEPINFRA_MISTRAL_7B = "deepinfra/mistralai/Mistral-7B-Instruct-v0.1",

  // --- mistral/ ---
  MISTRAL_LARGE = "mistral/mistral-large-latest",
  MISTRAL_SMALL = "mistral/mistral-small-latest",
  MISTRAL_MAGISTRAL_MEDIUM = "mistral/magistral-medium-2506",

  // --- bedrock/ ---
  BEDROCK_CLAUDE_3_5_SONNET = "bedrock/anthropic.claude-3-5-sonnet-20240620-v1:0",
  BEDROCK_CLAUDE_3_HAIKU = "bedrock/anthropic.claude-3-haiku-20240307-v1:0",

  // --- xai/ ---
  XAI_GROK_4_1_FAST = "xai/grok-4.1-fast",

  // --- perplexity/ ---
  PERPLEXITY_SONAR_PRO = "perplexity/sonar-pro",
  PERPLEXITY_SONAR_REASONING_PRO = "perplexity/sonar-reasoning-pro",
}
/**
 * Model ids for the Hugging Face Inference API.
 *
 * Values are "organisation/model-name" ids and are case-sensitive as
 * written (e.g. "Qwen/QwQ-32B", "tiiuae/falcon-180B-chat").
 */
export declare enum HuggingFaceModels {
  // --- meta-llama ---
  LLAMA_3_3_70B_INSTRUCT = "meta-llama/Llama-3.3-70B-Instruct",
  LLAMA_3_2_1B = "meta-llama/Llama-3.2-1B",
  LLAMA_3_2_3B_INSTRUCT = "meta-llama/Llama-3.2-3B-Instruct",
  LLAMA_3_1_8B = "meta-llama/Llama-3.1-8B",
  LLAMA_3_1_70B_INSTRUCT = "meta-llama/Llama-3.1-70B-Instruct",
  LLAMA_3_1_405B_INSTRUCT = "meta-llama/Llama-3.1-405B-Instruct",
  LLAMA_3_8B_INSTRUCT = "meta-llama/Meta-Llama-3-8B-Instruct",
  LLAMA_3_70B_INSTRUCT = "meta-llama/Meta-Llama-3-70B-Instruct",

  // --- mistralai ---
  MISTRAL_LARGE_3_675B = "mistralai/Mistral-Large-3-675B-Instruct-2512",
  MISTRAL_SMALL_3_1_24B = "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
  MISTRAL_SMALL_24B = "mistralai/Mistral-Small-24B-Instruct-2501",
  MISTRAL_7B_INSTRUCT = "mistralai/Mistral-7B-Instruct-v0.2",
  MIXTRAL_8X7B_INSTRUCT = "mistralai/Mixtral-8x7B-Instruct-v0.1",
  DEVSTRAL_2 = "mistralai/Devstral-2",

  // --- Qwen ---
  QWEN_2_5_7B = "Qwen/Qwen2.5-7B",
  QWEN_2_5_32B = "Qwen/Qwen2.5-32B",
  QWEN_2_5_72B_INSTRUCT = "Qwen/Qwen2.5-72B-Instruct",
  QWEN_2_5_CODER_7B = "Qwen/Qwen2.5-Coder-7B",
  QWEN_2_5_CODER_32B_INSTRUCT = "Qwen/Qwen2.5-Coder-32B-Instruct",
  QWQ_32B = "Qwen/QwQ-32B",
  QWEN_2_5_VL_32B = "Qwen/Qwen2.5-VL-32B-Instruct",

  // --- deepseek-ai ---
  DEEPSEEK_R1 = "deepseek-ai/DeepSeek-R1",
  DEEPSEEK_V3 = "deepseek-ai/DeepSeek-V3",
  DEEPSEEK_V3_1 = "deepseek-ai/DeepSeek-V3.1",
  DEEPSEEK_V3_2_EXP = "deepseek-ai/DeepSeek-V3.2-Exp",

  // --- microsoft ---
  PHI_4 = "microsoft/phi-4",
  PHI_4_REASONING = "microsoft/Phi-4-reasoning",
  PHI_4_MINI_INSTRUCT = "microsoft/Phi-4-mini-instruct",
  PHI_4_MINI_REASONING = "microsoft/Phi-4-mini-reasoning",
  PHI_3_MINI_128K_INSTRUCT = "microsoft/Phi-3-mini-128k-instruct",
  PHI_3_VISION_128K_INSTRUCT = "microsoft/Phi-3-vision-128k-instruct",

  // --- google ---
  GEMMA_3_270M = "google/gemma-3-270m",
  GEMMA_3_1B_IT = "google/gemma-3-1b-it",
  GEMMA_3_4B_IT = "google/gemma-3-4b-it",
  GEMMA_3_12B_IT = "google/gemma-3-12b-it",
  GEMMA_3_27B_IT = "google/gemma-3-27b-it",
  GEMMA_2_9B = "google/gemma-2-9b",
  GEMMA_2_27B = "google/gemma-2-27b",
  GEMMA_2B = "google/gemma-2b",
  GEMMA_7B = "google/gemma-7b",

  // --- tiiuae / bigcode / codellama / bigscience ---
  FALCON_40B_INSTRUCT = "tiiuae/falcon-40b-instruct",
  FALCON_180B_CHAT = "tiiuae/falcon-180B-chat",
  STARCODER2_15B = "bigcode/starcoder2-15b",
  CODELLAMA_34B_INSTRUCT = "codellama/CodeLlama-34b-Instruct-hf",
  BLOOM_7B1 = "bigscience/bloom-7b1",
  BLOOM_1B3 = "bigscience/bloom-1b3",

  // --- Further entries ---
  GLM_5 = "zai-org/GLM-5",
  QWEN_3_5_397B_A17B = "Qwen/Qwen3.5-397B-A17B",
  NEMOTRON_3_NANO_30B = "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16",
  SMOLLM3_3B = "HuggingFaceTB/SmolLM3-3B",
  FALCON_3_7B_INSTRUCT = "tiiuae/Falcon3-7B-Instruct",
  FALCON_3_10B_INSTRUCT = "tiiuae/Falcon3-10B-Instruct",
}
/**
 * Model ids for AWS SageMaker JumpStart.
 *
 * @see https://docs.aws.amazon.com/sagemaker/latest/dg/jumpstart-foundation-models-latest.html
 */
export declare enum SageMakerModels {
  // --- Meta Llama / Code Llama ---
  LLAMA_4_SCOUT_17B_16E = "meta-llama-4-scout-17b-16e-instruct",
  LLAMA_4_MAVERICK_17B_128E = "meta-llama-4-maverick-17b-128e-instruct",
  LLAMA_4_MAVERICK_17B_128E_FP8 = "meta-llama-4-maverick-17b-128e-instruct-fp8",
  LLAMA_3_8B = "meta-llama-3-8b-instruct",
  LLAMA_3_70B = "meta-llama-3-70b-instruct",
  CODE_LLAMA_7B = "meta-code-llama-7b",
  CODE_LLAMA_13B = "meta-code-llama-13b",
  CODE_LLAMA_34B = "meta-code-llama-34b",

  // --- Mistral / Mixtral ---
  MISTRAL_SMALL_24B = "mistral-small-24b-instruct-2501",
  MISTRAL_7B_INSTRUCT = "mistral-7b-instruct-v0.3",
  MIXTRAL_8X7B = "mistral-mixtral-8x7b-instruct-v0.1",
  MIXTRAL_8X22B = "mistral-mixtral-8x22b-instruct-v0.1",

  // --- TII Falcon ---
  FALCON_3_7B = "tii-falcon-3-7b-instruct",
  FALCON_3_10B = "tii-falcon-3-10b-instruct",
  FALCON_40B = "tii-falcon-40b-instruct",
  FALCON_180B = "tii-falcon-180b",

  // --- Others ---
  NEMOTRON_3_NANO_30B = "nvidia-nemotron-3-nano-30b",
  QWEN3_VL_8B = "qwen3-vl-8b-instruct",
}
/**
 * API version strings for several providers.
 *
 * Member names are prefixed with the provider they belong to. The Azure
 * and Anthropic values are date-shaped; the OpenAI and Google AI values
 * are "v1"-style labels.
 */
export declare enum APIVersions {
  // Azure
  AZURE_LATEST = "2025-04-01-preview",
  AZURE_STABLE = "2024-10-21",
  AZURE_LEGACY = "2023-12-01-preview",

  // OpenAI
  OPENAI_CURRENT = "v1",
  OPENAI_BETA = "v1-beta",

  // Google AI
  GOOGLE_AI_CURRENT = "v1",
  GOOGLE_AI_BETA = "v1beta",

  // Anthropic
  ANTHROPIC_CURRENT = "2023-06-01",
}
/**
 * Categories used to classify an error.
 *
 * Consumers can branch on the category instead of matching on message
 * strings; each value is the lowercase form of its member name.
 */
export declare enum ErrorCategory {
  VALIDATION = "validation",
  TIMEOUT = "timeout",
  NETWORK = "network",
  RESOURCE = "resource",
  PERMISSION = "permission",
  CONFIGURATION = "configuration",
  EXECUTION = "execution",
  SYSTEM = "system",
  /**
   * Cancellation requested by the caller through an AbortSignal.
   *
   * Kept separate from system errors because it reflects a user or
   * control-plane decision rather than an SDK or provider failure. This
   * lets consumers tell "user cancelled" apart from "server error"
   * without inspecting message text.
   */
  ABORT = "abort",
}
/**
 * Severity levels that can be attached to an error.
 *
 * NOTE(review): members are presumably listed from least to most severe
 * — confirm against the code that assigns them.
 */
export declare enum ErrorSeverity {
  LOW = "low",
  MEDIUM = "medium",
  HIGH = "high",
  CRITICAL = "critical",
}
/**
 * Beta feature flags for the Anthropic API.
 *
 * @description Flags that can be enabled for enhanced functionality:
 * - CLAUDE_CODE: Claude Code beta features aimed at development workflows
 * - INTERLEAVED_THINKING: turns on interleaved thinking in responses
 * - FINE_GRAINED_STREAMING: fine-grained tool streaming, for a better UX
 */
export declare enum AnthropicBetaFeature {
  CLAUDE_CODE = "claude-code-20250219",
  INTERLEAVED_THINKING = "interleaved-thinking-2025-05-14",
  FINE_GRAINED_STREAMING = "fine-grained-tool-streaming-2025-05-14",
}
/**
 * Model ids for DeepSeek.
 *
 * @see https://api-docs.deepseek.com/quick_start/pricing
 */
export declare enum DeepSeekModels {
  /** DeepSeek-V3 — the general-purpose chat model */
  DEEPSEEK_CHAT = "deepseek-chat",
  /** DeepSeek-R1 — the reasoning model; exposes reasoning_content */
  DEEPSEEK_REASONER = "deepseek-reasoner",
}
/**
 * A selection of NVIDIA NIM model ids.
 *
 * NIM hosts hundreds of models, so this list is not exhaustive; any other
 * id can be passed via --model.
 *
 * @see https://build.nvidia.com/models for the full catalog
 */
export declare enum NvidiaNimModels {
  // --- meta/ ---
  LLAMA_3_3_70B_INSTRUCT = "meta/llama-3.3-70b-instruct",
  LLAMA_3_1_405B_INSTRUCT = "meta/llama-3.1-405b-instruct",
  LLAMA_3_1_70B_INSTRUCT = "meta/llama-3.1-70b-instruct",
  LLAMA_3_2_90B_VISION = "meta/llama-3.2-90b-vision-instruct",
  LLAMA_3_2_11B_VISION = "meta/llama-3.2-11b-vision-instruct",

  // --- nvidia/ ---
  NEMOTRON_SUPER_49B = "nvidia/llama-3.3-nemotron-super-49b-v1",
  NEMOTRON_NANO_8B = "nvidia/llama-3.1-nemotron-nano-8b-v1",
  NEMOTRON_70B_INSTRUCT = "nvidia/llama-3.1-nemotron-70b-instruct",

  // --- deepseek-ai/ ---
  DEEPSEEK_R1 = "deepseek-ai/deepseek-r1",
  DEEPSEEK_R1_DISTILL_LLAMA_70B = "deepseek-ai/deepseek-r1-distill-llama-70b",

  // --- mistralai/ ---
  MIXTRAL_8X22B_INSTRUCT = "mistralai/mixtral-8x22b-instruct-v0.1",
  MIXTRAL_8X7B_INSTRUCT = "mistralai/mixtral-8x7b-instruct-v0.1",

  // --- other vendors ---
  PHI_4 = "microsoft/phi-4",
  GEMMA_3_27B_IT = "google/gemma-3-27b-it",
  GLM_4_5 = "z-ai/glm4.5",
}
/**
 * LM Studio can load any GGUF model the user has downloaded, so no fixed
 * model ids are listed.
 *
 * The default is the empty string, which triggers auto-discovery through
 * /v1/models.
 */
export declare enum LMStudioModels {
  /** Sentinel: empty string, meaning "auto-discover from /v1/models" */
  AUTO_DISCOVER = "",
}
/**
 * llama.cpp serves the single model that was loaded when the server
 * started, so no fixed model ids are listed.
 *
 * The default is the empty string, which means "use whatever is loaded".
 */
export declare enum LlamaCppModels {
  /** Sentinel: empty string, meaning "use the model the llama-server process loaded" */
  AUTO_DISCOVER = "",
}
/**
 * Model ids for xAI Grok, served from api.x.ai/v1 (OpenAI-compatible).
 *
 * @see https://docs.x.ai/docs/models
 */
export declare enum XaiModels {
  /** Grok 3 (latest) — the flagship; best suited to complex reasoning */
  GROK_3 = "grok-3",
  /** Grok 3 Mini — a faster, cheaper variant of Grok 3 */
  GROK_3_MINI = "grok-3-mini",
  /** Grok 2 (latest) — the previous flagship, still supported */
  GROK_2_LATEST = "grok-2-latest",
  /** Grok 2 Vision — multimodal: text plus images */
  GROK_2_VISION_LATEST = "grok-2-vision-latest",
  /** Grok beta — pre-release / experimental access */
  GROK_BETA = "grok-beta",
}
/**
 * Model ids hosted by Groq — Llama, Mistral and Gemma models served at
 * sub-100ms inference.
 *
 * @see https://console.groq.com/docs/models
 */
export declare enum GroqModels {
  /** Llama 3.3 70B Versatile — the production default */
  LLAMA_3_3_70B_VERSATILE = "llama-3.3-70b-versatile",
  /** Llama 3.1 8B Instant — the low-latency tier */
  LLAMA_3_1_8B_INSTANT = "llama-3.1-8b-instant",
  /** Gemma 2 9B IT — Google's lightweight instruct model */
  GEMMA_2_9B_IT = "gemma2-9b-it",
  /** Mixtral 8x7B 32K — Mistral's MoE model */
  MIXTRAL_8X7B_32768 = "mixtral-8x7b-32768",
  /** Llama Guard 3 8B — a safety classifier */
  LLAMA_GUARD_3_8B = "llama-guard-3-8b",
  /** Llama 3.2 90B Vision Preview — multimodal */
  LLAMA_3_2_90B_VISION_PREVIEW = "llama-3.2-90b-vision-preview",
  /** Llama 3.2 11B Vision Preview — the smaller multimodal model */
  LLAMA_3_2_11B_VISION_PREVIEW = "llama-3.2-11b-vision-preview",
}
/**
 * Model ids for Cohere: Command chat models plus Embed and Rerank models.
 *
 * The bare aliases `command-r` and `command-r-plus` were retired on
 * September 15, 2025, so only the dated variants are listed.
 *
 * @see https://docs.cohere.com/docs/models
 */
export declare enum CohereModels {
  /** Command A (March 2025) — the current flagship chat model */
  COMMAND_A = "command-a-03-2025",
  /** Command A Reasoning (Aug 2025) — produces explicit reasoning traces */
  COMMAND_A_REASONING = "command-a-reasoning-08-2025",
  /** Command R+, dated Aug 2024 — the last supported R+ variant */
  COMMAND_R_PLUS = "command-r-plus-08-2024",
  /** Command R, dated Aug 2024 — the last supported R variant */
  COMMAND_R = "command-r-08-2024",
  /** Command R7B (Dec 2024) — the most compact */
  COMMAND_R7B = "command-r7b-12-2024",
  /** Embed v3, multilingual */
  EMBED_MULTILINGUAL_V3 = "embed-multilingual-v3.0",
  /** Embed v3, English */
  EMBED_ENGLISH_V3 = "embed-english-v3.0",
  /** Rerank v3, multilingual */
  RERANK_MULTILINGUAL_V3 = "rerank-multilingual-v3.0",
  /** Rerank v3, English */
  RERANK_ENGLISH_V3 = "rerank-english-v3.0",
}
/**
 * Model ids hosted by Together AI, an open-model gateway.
 *
 * @see https://docs.together.ai/docs/serverless-models
 */
export declare enum TogetherAIModels {
  /** Llama 3.3 70B Instruct Turbo — the production default */
  LLAMA_3_3_70B_INSTRUCT_TURBO = "meta-llama/Llama-3.3-70B-Instruct-Turbo",
  /** Llama 3.1 405B Instruct Turbo — the flagship size */
  LLAMA_3_1_405B_INSTRUCT_TURBO = "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
  /** Llama 3.1 70B Instruct Turbo */
  LLAMA_3_1_70B_INSTRUCT_TURBO = "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
  /** Llama 3.1 8B Instruct Turbo — the fastest */
  LLAMA_3_1_8B_INSTRUCT_TURBO = "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
  /** Mixtral 8x22B Instruct */
  MIXTRAL_8X22B_INSTRUCT = "mistralai/Mixtral-8x22B-Instruct-v0.1",
  /** Mixtral 8x7B Instruct */
  MIXTRAL_8X7B_INSTRUCT = "mistralai/Mixtral-8x7B-Instruct-v0.1",
  /** Qwen 2.5 72B Instruct Turbo */
  QWEN_2_5_72B_INSTRUCT_TURBO = "Qwen/Qwen2.5-72B-Instruct-Turbo",
  /** Qwen 2.5 Coder 32B Instruct */
  QWEN_2_5_CODER_32B = "Qwen/Qwen2.5-Coder-32B-Instruct",
  /** DeepSeek R1 — a reasoning model */
  DEEPSEEK_R1 = "deepseek-ai/DeepSeek-R1",
  /** DeepSeek V3 */
  DEEPSEEK_V3 = "deepseek-ai/DeepSeek-V3",
  /** Google Gemma 2 27B IT */
  GEMMA_2_27B_IT = "google/gemma-2-27b-it",
  /** WizardLM 2 8x22B */
  WIZARDLM_2_8X22B = "microsoft/WizardLM-2-8x22B",
}
/**
 * Model ids hosted by Fireworks AI, a fast open-model serving platform.
 *
 * The older Llama / Mixtral / Qwen 2.5 generation was rotated out of
 * Fireworks' serverless tier; the entries below are the current shipping
 * defaults. Every value has the form "accounts/fireworks/models/<name>".
 *
 * @see https://fireworks.ai/models
 */
export declare enum FireworksModels {
  /** DeepSeek V4 Pro — the current general-purpose default */
  DEEPSEEK_V4_PRO = "accounts/fireworks/models/deepseek-v4-pro",
  /** GLM 5.1 — the Zhipu flagship */
  GLM_5P1 = "accounts/fireworks/models/glm-5p1",
  /** GLM 5 — broader coverage */
  GLM_5 = "accounts/fireworks/models/glm-5",
  /** Kimi K2.6 — the Moonshot flagship */
  KIMI_K2P6 = "accounts/fireworks/models/kimi-k2p6",
  /** Kimi K2.5 — the preceding Kimi release */
  KIMI_K2P5 = "accounts/fireworks/models/kimi-k2p5",
  /** GPT-OSS 120B — OpenAI weights under Apache-2.0 */
  GPT_OSS_120B = "accounts/fireworks/models/gpt-oss-120b",
}
/**
* Perplexity Sonar models — built-in web grounding.
*
* Ids are bare lowercase, hyphen-separated names with no vendor prefix.
*
* @see https://docs.perplexity.ai/guides/model-cards
*/
export declare enum PerplexityModels {
/** Sonar — production default with web search */
SONAR = "sonar",
/** Sonar Pro — better reasoning + larger context */
SONAR_PRO = "sonar-pro",
/** Sonar Reasoning — explicit reasoning traces */
SONAR_REASONING = "sonar-reasoning",
/** Sonar Reasoning Pro — flagship reasoning + web */
SONAR_REASONING_PRO = "sonar-reasoning-pro",
/** Sonar Deep Research — long-form research with citations */
SONAR_DEEP_RESEARCH = "sonar-deep-research"
}
/**
* Cloudflare Workers AI models — edge-served open models.
*
* Ids follow the `@cf/<vendor>/<model>` form. In member names a `P` stands
* in for the decimal point of a version number (`QWEN_1P5` for Qwen 1.5).
*
* @see https://developers.cloudflare.com/workers-ai/models/
*/
export declare enum CloudflareModels {
/** Llama 3.3 70B Instruct (FP8 fast) */
LLAMA_3_3_70B_FAST = "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
/** Llama 3.1 70B Instruct */
LLAMA_3_1_70B_INSTRUCT = "@cf/meta/llama-3.1-70b-instruct",
/** Llama 3.1 8B Instruct fast */
LLAMA_3_1_8B_FAST = "@cf/meta/llama-3.1-8b-instruct-fast",
/** Llama 3.2 11B Vision Instruct */
LLAMA_3_2_11B_VISION = "@cf/meta/llama-3.2-11b-vision-instruct",
/** Mistral 7B Instruct v0.2 */
MISTRAL_7B_INSTRUCT_V0_2 = "@cf/mistral/mistral-7b-instruct-v0.2",
/** Qwen 1.5 14B Chat AWQ */
QWEN_1P5_14B_CHAT_AWQ = "@cf/qwen/qwen1.5-14b-chat-awq",
/** Gemma 2B IT — LoRA variant (note the `-lora` suffix in the id) */
GEMMA_2B_IT_LORA = "@cf/google/gemma-2b-it-lora"
}
/**
* Voyage AI embedding models — top-tier RAG embedders.
*
* Ids are lowercase `voyage-<name>` strings; the trailing number is the
* model generation (e.g. `voyage-code-3`, `voyage-law-2`).
*
* @see https://docs.voyageai.com/docs/embeddings
*/
export declare enum VoyageModels {
/** Voyage 3.5 — latest general-purpose (default) */
VOYAGE_3_5 = "voyage-3.5",
/** Voyage 3.5 Lite — smaller / cheaper */
VOYAGE_3_5_LITE = "voyage-3.5-lite",
/** Voyage 3 Large — flagship size */
VOYAGE_3_LARGE = "voyage-3-large",
/** Voyage Code 3 — code-tuned */
VOYAGE_CODE_3 = "voyage-code-3",
/** Voyage Finance 2 — domain-tuned (finance) */
VOYAGE_FINANCE_2 = "voyage-finance-2",
/** Voyage Law 2 — domain-tuned (legal) */
VOYAGE_LAW_2 = "voyage-law-2",
/** Voyage Multilingual 2 */
VOYAGE_MULTILINGUAL_2 = "voyage-multilingual-2"
}
/**
* Jina AI embedding + reranking models.
*
* The enum mixes three model families, distinguishable by id prefix:
* `jina-embeddings-*` (embedders), `jina-colbert-*` (late-interaction
* retrieval) and `jina-reranker-*` (rerankers).
*
* @see https://jina.ai/embeddings/
*/
export declare enum JinaModels {
/** Jina Embeddings v3 — flagship multilingual (default) */
JINA_EMBEDDINGS_V3 = "jina-embeddings-v3",
/** Jina Embeddings v2 base English */
JINA_EMBEDDINGS_V2_BASE_EN = "jina-embeddings-v2-base-en",
/** Jina Embeddings v2 small English */
JINA_EMBEDDINGS_V2_SMALL_EN = "jina-embeddings-v2-small-en",
/** Jina Embeddings v2 base code */
JINA_EMBEDDINGS_V2_BASE_CODE = "jina-embeddings-v2-base-code",
/**
* Jina Embeddings v2 base — named "multilingual", but the id resolves to
* the `-zh` variant.
*
* NOTE(review): the member name and the id disagree; `-zh` presumably
* denotes the Chinese-oriented v2 model rather than a general multilingual
* one — confirm against the Jina model list before relying on this for
* other languages.
*/
JINA_EMBEDDINGS_V2_BASE_MULTILINGUAL = "jina-embeddings-v2-base-zh",
/** Jina ColBERT v2 — late-interaction retrieval */
JINA_COLBERT_V2 = "jina-colbert-v2",
/** Jina Reranker v2 base multilingual */
JINA_RERANKER_V2_BASE_MULTILINGUAL = "jina-reranker-v2-base-multilingual",
/** Jina Reranker v1 turbo English */
JINA_RERANKER_V1_TURBO_EN = "jina-reranker-v1-turbo-en"
}
/**
* Stability AI image generation models (api.stability.ai).
*
* Two naming schemes appear in the ids: `stable-image-*` for the Stable
* Image tiers and `sd3.5-*` for the Stable Diffusion 3.5 family.
*
* @see https://platform.stability.ai/docs/api-reference
*/
export declare enum StabilityModels {
/** Stable Image Ultra — flagship quality (default) */
STABLE_IMAGE_ULTRA = "stable-image-ultra",
/** Stable Image Core — fast tier */
STABLE_IMAGE_CORE = "stable-image-core",
/** Stable Diffusion 3.5 Large */
SD_3_5_LARGE = "sd3.5-large",
/** Stable Diffusion 3.5 Large Turbo */
SD_3_5_LARGE_TURBO = "sd3.5-large-turbo",
/** Stable Diffusion 3.5 Medium */
SD_3_5_MEDIUM = "sd3.5-medium"
}
/**
* Ideogram image generation models.
*
* Unlike most other provider enums in this file, the ids here are
* uppercase, underscore-separated version tokens (`V_3`, `V_2_TURBO`).
*
* @see https://docs.ideogram.ai/api-reference/api-reference/post-v-1-ideogram-v-3-generate
*/
export declare enum IdeogramModels {
/** Ideogram V3 — latest with strong typography (default) */
IDEOGRAM_V3 = "V_3",
/** Ideogram V2 */
IDEOGRAM_V2 = "V_2",
/** Ideogram V2 Turbo — fast tier */
IDEOGRAM_V2_TURBO = "V_2_TURBO",
/** Ideogram V1 */
IDEOGRAM_V1 = "V_1"
}
/**
* Recraft image generation models — vector / illustration focus.
*
* Ids are lowercase with no separator before the version (`recraftv3`);
* the `-svg` suffix marks the vector-output variant.
*
* @see https://www.recraft.ai/docs
*/
export declare enum RecraftModels {
/** Recraft V3 — flagship raster (default) */
RECRAFT_V3 = "recraftv3",
/** Recraft V3 SVG — vector output */
RECRAFT_V3_SVG = "recraftv3-svg",
/** Recraft V2 */
RECRAFT_V2 = "recraftv2"
}
/**
* Replicate hosted models (LLMs only — image / video / avatar / music
* models are accessed via dedicated handlers).
*
* Replicate accepts arbitrary `owner/name` or `owner/name:version` ids; this
* enum only lists popular LLM defaults, all in the unversioned `owner/name`
* form. Any other model id can be passed via `--model`.
*
* @see https://replicate.com/explore
*/
export declare enum ReplicateModels {
/** Meta Llama 3.1 405B Instruct */
LLAMA_3_1_405B_INSTRUCT = "meta/meta-llama-3.1-405b-instruct",
/** Meta Llama 3 70B Instruct (stable; the meta-llama-3.1-70b variant was retired upstream) */
LLAMA_3_70B_INSTRUCT = "meta/meta-llama-3-70b-instruct",
/** Meta Llama 3 8B Instruct */
LLAMA_3_8B_INSTRUCT = "meta/meta-llama-3-8b-instruct",
/** Mistral 7B Instruct v0.2 */
MISTRAL_7B_INSTRUCT_V02 = "mistralai/mistral-7b-instruct-v0.2",
/** Mixtral 8x7B Instruct v0.1 */
MIXTRAL_8X7B_INSTRUCT_V01 = "mistralai/mixtral-8x7b-instruct-v0.1"
}
/**
* Buffer time in milliseconds before token expiry at which a refresh is
* triggered.
*
* @description Tokens are refreshed 5 minutes before expiry to prevent
* authentication failures during ongoing operations.
*
* NOTE(review): this declaration only exposes the type (`number`); the
* concrete value lives in the implementation. 5 minutes would be
* 300000 ms — confirm against the compiled module.
*/
export declare const TOKEN_EXPIRY_BUFFER_MS: number;