UNPKG

@juspay/neurolink

Version:

Universal AI Development Platform with working MCP integration, multi-provider support, voice (TTS/STT/realtime), and professional CLI. 58+ external MCP servers discoverable, multimodal file processing, RAG pipelines. Build, test, and deploy AI applications…

955 lines (954 loc) 40.8 kB
/**
 * Identifiers of the AI providers that can be selected.
 * Each member maps to the lowercase string used to name that provider.
 */
export declare enum AIProviderName {
    BEDROCK = "bedrock",
    OPENAI = "openai",
    OPENAI_COMPATIBLE = "openai-compatible",
    OPENROUTER = "openrouter",
    VERTEX = "vertex",
    ANTHROPIC = "anthropic",
    AZURE = "azure",
    GOOGLE_AI = "google-ai",
    HUGGINGFACE = "huggingface",
    OLLAMA = "ollama",
    MISTRAL = "mistral",
    LITELLM = "litellm",
    SAGEMAKER = "sagemaker",
    DEEPSEEK = "deepseek",
    NVIDIA_NIM = "nvidia-nim",
    LM_STUDIO = "lm-studio",
    LLAMACPP = "llamacpp",
    XAI = "xai",
    GROQ = "groq",
    COHERE = "cohere",
    TOGETHER_AI = "together-ai",
    FIREWORKS = "fireworks",
    PERPLEXITY = "perplexity",
    CLOUDFLARE = "cloudflare",
    REPLICATE = "replicate",
    VOYAGE = "voyage",
    JINA = "jina",
    STABILITY = "stability",
    IDEOGRAM = "ideogram",
    RECRAFT = "recraft",
    AUTO = "auto"
}

/**
 * A selection of popular OpenRouter model IDs
 * (300+ are available at openrouter.ai/models).
 * OpenRouter IDs are written in 'provider/model' form.
 */
export declare enum OpenRouterModels {
    // Anthropic
    CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4.6",
    CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4.6",
    CLAUDE_SONNET_4_5 = "anthropic/claude-sonnet-4.5",
    CLAUDE_HAIKU_4_5 = "anthropic/claude-haiku-4.5",
    CLAUDE_3_7_SONNET = "anthropic/claude-3.7-sonnet",
    CLAUDE_3_5_HAIKU = "anthropic/claude-3-5-haiku",
    CLAUDE_3_OPUS = "anthropic/claude-3-opus",

    // OpenAI
    GPT_5_2 = "openai/gpt-5.2",
    GPT_5 = "openai/gpt-5",
    GPT_4O = "openai/gpt-4o",
    GPT_4O_MINI = "openai/gpt-4o-mini",
    GPT_4_TURBO = "openai/gpt-4-turbo",

    // Google
    GEMINI_3_1_PRO_PREVIEW = "google/gemini-3.1-pro-preview",
    GEMINI_3_FLASH_PREVIEW = "google/gemini-3-flash-preview",
    GEMINI_2_5_FLASH = "google/gemini-2.5-flash",
    GEMINI_2_5_FLASH_LITE = "google/gemini-2.5-flash-lite",
    GEMINI_2_0_FLASH = "google/gemini-2.0-flash",

    // Meta
    LLAMA_3_1_70B = "meta-llama/llama-3.1-70b-instruct",
    LLAMA_3_1_8B = "meta-llama/llama-3.1-8b-instruct",

    // Mistral
    MISTRAL_LARGE = "mistralai/mistral-large",
    MIXTRAL_8X7B = "mistralai/mixtral-8x7b-instruct",

    // DeepSeek
    DEEPSEEK_R1 = "deepseek/deepseek-r1",

    // xAI
    // NOTE(review): OpenRouter appears to publish xAI models under the
    // "x-ai/" vendor prefix - confirm that "xai/..." resolves.
    GROK_4_1_FAST = "xai/grok-4.1-fast"
}

/** * Supported Models for
Amazon Bedrock */
export declare enum BedrockModels {
    // Anthropic Claude
    CLAUDE_4_6_OPUS = "anthropic.claude-opus-4-6-v1:0",
    CLAUDE_4_6_SONNET = "anthropic.claude-sonnet-4-6",
    // NOTE(review): date suffix differs from AnthropicModels.CLAUDE_OPUS_4_5
    // ("...-20251101") - confirm which date is correct.
    CLAUDE_4_5_OPUS = "anthropic.claude-opus-4-5-20251124-v1:0",
    CLAUDE_4_5_SONNET = "anthropic.claude-sonnet-4-5-20250929-v1:0",
    CLAUDE_4_5_HAIKU = "anthropic.claude-haiku-4-5-20251001-v1:0",
    CLAUDE_4_1_OPUS = "anthropic.claude-opus-4-1-20250805-v1:0",
    CLAUDE_4_SONNET = "anthropic.claude-sonnet-4-20250514-v1:0",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_7_SONNET = "anthropic.claude-3-7-sonnet-20250219-v1:0",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_5_SONNET = "anthropic.claude-3-5-sonnet-20241022-v1:0",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_5_HAIKU = "anthropic.claude-3-5-haiku-20241022-v1:0",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_SONNET = "anthropic.claude-3-sonnet-20240229-v1:0",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_HAIKU = "anthropic.claude-3-haiku-20240307-v1:0",

    // Amazon Nova
    NOVA_PREMIER = "amazon.nova-premier-v1:0",
    NOVA_PRO = "amazon.nova-pro-v1:0",
    NOVA_LITE = "amazon.nova-lite-v1:0",
    NOVA_MICRO = "amazon.nova-micro-v1:0",
    NOVA_2_LITE = "amazon.nova-2-lite-v1:0",
    NOVA_2_SONIC = "amazon.nova-2-sonic-v1:0",
    NOVA_SONIC = "amazon.nova-sonic-v1:0",
    NOVA_CANVAS = "amazon.nova-canvas-v1:0",
    NOVA_REEL = "amazon.nova-reel-v1:0",
    NOVA_REEL_V1_1 = "amazon.nova-reel-v1:1",
    NOVA_MULTIMODAL_EMBEDDINGS = "amazon.nova-2-multimodal-embeddings-v1:0",

    // Amazon Titan
    TITAN_TEXT_LARGE = "amazon.titan-tg1-large",
    TITAN_EMBED_TEXT_V2 = "amazon.titan-embed-text-v2:0",
    TITAN_EMBED_TEXT_V1 = "amazon.titan-embed-text-v1",
    TITAN_EMBED_G1_TEXT_02 = "amazon.titan-embed-g1-text-02",
    TITAN_EMBED_IMAGE_V1 = "amazon.titan-embed-image-v1",
    TITAN_IMAGE_GENERATOR_V2 = "amazon.titan-image-generator-v2:0",

    // Meta Llama
    LLAMA_4_MAVERICK_17B = "meta.llama4-maverick-17b-instruct-v1:0",
    LLAMA_4_SCOUT_17B = "meta.llama4-scout-17b-instruct-v1:0",
    LLAMA_3_3_70B = "meta.llama3-3-70b-instruct-v1:0",
    LLAMA_3_2_90B = "meta.llama3-2-90b-instruct-v1:0",
    LLAMA_3_2_11B = "meta.llama3-2-11b-instruct-v1:0",
    LLAMA_3_2_3B = "meta.llama3-2-3b-instruct-v1:0",
    LLAMA_3_2_1B = "meta.llama3-2-1b-instruct-v1:0",
    LLAMA_3_1_405B = "meta.llama3-1-405b-instruct-v1:0",
    LLAMA_3_1_70B = "meta.llama3-1-70b-instruct-v1:0",
    LLAMA_3_1_8B = "meta.llama3-1-8b-instruct-v1:0",
    LLAMA_3_70B = "meta.llama3-70b-instruct-v1:0",
    LLAMA_3_8B = "meta.llama3-8b-instruct-v1:0",

    // Mistral
    MISTRAL_LARGE_3 = "mistral.mistral-large-3-675b-instruct",
    MISTRAL_LARGE_2407 = "mistral.mistral-large-2407-v1:0",
    MISTRAL_LARGE_2402 = "mistral.mistral-large-2402-v1:0",
    MAGISTRAL_SMALL_2509 = "mistral.magistral-small-2509",
    MINISTRAL_3_14B = "mistral.ministral-3-14b-instruct",
    MINISTRAL_3_8B = "mistral.ministral-3-8b-instruct",
    MINISTRAL_3_3B = "mistral.ministral-3-3b-instruct",
    MISTRAL_7B = "mistral.mistral-7b-instruct-v0:2",
    MIXTRAL_8x7B = "mistral.mixtral-8x7b-instruct-v0:1",
    PIXTRAL_LARGE_2502 = "mistral.pixtral-large-2502-v1:0",
    VOXTRAL_SMALL_24B = "mistral.voxtral-small-24b-2507",
    VOXTRAL_MINI_3B = "mistral.voxtral-mini-3b-2507",

    // Cohere Command
    COHERE_COMMAND_R_PLUS = "cohere.command-r-plus-v1:0",
    COHERE_COMMAND_R = "cohere.command-r-v1:0",

    // DeepSeek
    DEEPSEEK_R1 = "deepseek.r1-v1:0",
    DEEPSEEK_V3 = "deepseek.v3-v1:0",

    // Qwen
    QWEN_3_235B_A22B = "qwen.qwen3-235b-a22b-2507-v1:0",
    QWEN_3_CODER_480B_A35B = "qwen.qwen3-coder-480b-a35b-v1:0",
    QWEN_3_CODER_30B_A3B = "qwen.qwen3-coder-30b-a3b-v1:0",
    QWEN_3_32B = "qwen.qwen3-32b-v1:0",
    QWEN_3_NEXT_80B_A3B = "qwen.qwen3-next-80b-a3b",
    QWEN_3_VL_235B_A22B = "qwen.qwen3-vl-235b-a22b",

    // Google Gemma
    GEMMA_3_27B_IT = "google.gemma-3-27b-it",
    GEMMA_3_12B_IT = "google.gemma-3-12b-it",
    GEMMA_3_4B_IT = "google.gemma-3-4b-it",

    // AI21 Jamba
    JAMBA_1_5_LARGE = "ai21.jamba-1-5-large-v1:0",
    JAMBA_1_5_MINI = "ai21.jamba-1-5-mini-v1:0",

    // Writer Palmyra
    WRITER_PALMYRA_X5 = "writer.palmyra-x5-v1:0",
    WRITER_PALMYRA_X4 = "writer.palmyra-x4-v1:0",

    // MiniMax
    MINIMAX_M2_1 = "minimax.minimax-m2.1",
    MINIMAX_M2 = "minimax.minimax-m2",

    // Kimi
    // NOTE(review): the two Kimi IDs use different vendor prefixes
    // ("moonshot." vs "moonshotai.") - confirm both are intended.
    KIMI_K2_THINKING = "moonshot.kimi-k2-thinking",
    KIMI_K2_5 = "moonshotai.kimi-k2.5",

    // NVIDIA Nemotron
    NVIDIA_NEMOTRON_NANO_3_30B = "nvidia.nemotron-nano-3-30b",
    NVIDIA_NEMOTRON_NANO_12B_V2 = "nvidia.nemotron-nano-12b-v2",
    NVIDIA_NEMOTRON_NANO_9B_V2 = "nvidia.nemotron-nano-9b-v2",

    // OpenAI open-weight models
    OPENAI_GPT_OSS_120B = "openai.gpt-oss-120b-1:0",
    OPENAI_GPT_OSS_20B = "openai.gpt-oss-20b-1:0",

    // GLM
    GLM_4_7 = "zai.glm-4.7",
    GLM_4_7_FLASH = "zai.glm-4.7-flash",

    // Embedding and rerank models
    COHERE_EMBED_ENGLISH_V3 = "cohere.embed-english-v3",
    COHERE_EMBED_MULTILINGUAL_V3 = "cohere.embed-multilingual-v3",
    COHERE_EMBED_V4 = "cohere.embed-v4:0",
    COHERE_RERANK_V3_5 = "cohere.rerank-v3-5:0",
    AMAZON_RERANK_V1 = "amazon.rerank-v1:0",

    DEVSTRAL_2_123B = "mistral.devstral-2-123b"
}

/**
 * Model identifiers for the OpenAI API.
 */
export declare enum OpenAIModels {
    // GPT-5.x family
    GPT_5_3_CODEX = "gpt-5.3-codex",
    GPT_5_4 = "gpt-5.4",
    GPT_5_4_MINI = "gpt-5.4-mini",
    GPT_5_4_NANO = "gpt-5.4-nano",
    GPT_5_4_PRO = "gpt-5.4-pro",
    GPT_5_2 = "gpt-5.2",
    GPT_5_2_CHAT_LATEST = "gpt-5.2-chat-latest",
    GPT_5_2_PRO = "gpt-5.2-pro",
    GPT_5_2_CODEX = "gpt-5.2-codex",
    GPT_5_1 = "gpt-5.1",
    GPT_5_1_CHAT_LATEST = "gpt-5.1-chat-latest",
    GPT_5_1_CODEX = "gpt-5.1-codex",
    GPT_5_1_CODEX_MAX = "gpt-5.1-codex-max",
    GPT_5_1_CODEX_MINI = "gpt-5.1-codex-mini",
    GPT_5 = "gpt-5",
    GPT_5_MINI = "gpt-5-mini",
    GPT_5_NANO = "gpt-5-nano",
    GPT_5_PRO = "gpt-5-pro",
    GPT_5_CHAT_LATEST = "gpt-5-chat-latest",
    GPT_5_CODEX = "gpt-5-codex",

    // Open-weight models
    GPT_OSS_120B = "gpt-oss-120b",
    GPT_OSS_20B = "gpt-oss-20b",

    // GPT-4.1 / GPT-4o
    GPT_4_1 = "gpt-4.1",
    GPT_4_1_MINI = "gpt-4.1-mini",
    GPT_4_1_NANO = "gpt-4.1-nano",
    GPT_4O = "gpt-4o",
    GPT_4O_MINI = "gpt-4o-mini",

    // o-series
    O3 = "o3",
    O3_MINI = "o3-mini",
    O3_PRO = "o3-pro",
    O4_MINI = "o4-mini",
    O1 = "o1",
    /** @deprecated Turned off Jul 14, 2025. Use GPT_4_1 or O3. */
    O1_PREVIEW = "o1-preview",
    /** @deprecated Replaced by o3-mini. */
    O1_MINI = "o1-mini",

    // Older chat models
    GPT_4 = "gpt-4",
    GPT_4_TURBO = "gpt-4-turbo",
    GPT_3_5_TURBO = "gpt-3.5-turbo",

    // Image models
    GPT_IMAGE_1 = "gpt-image-1",
    DALL_E_3 = "dall-e-3",
    DALL_E_2 = "dall-e-2"
}

/**
 * Model identifiers for Azure OpenAI.
 * Azure addresses models by deployment name; the values here are the
 * underlying model identifiers.
 */
export declare enum AzureOpenAIModels {
    // GPT-5.x family
    GPT_5_2 = "gpt-5.2",
    GPT_5_2_CHAT = "gpt-5.2-chat",
    GPT_5_2_PRO = "gpt-5.2-pro",
    GPT_5_2_CODEX = "gpt-5.2-codex",
    GPT_5_4 = "gpt-5.4",
    GPT_5_4_MINI = "gpt-5.4-mini",
    GPT_5_4_NANO = "gpt-5.4-nano",
    GPT_5_1 = "gpt-5.1",
    GPT_5_1_CHAT = "gpt-5.1-chat",
    GPT_5_1_CODEX = "gpt-5.1-codex",
    GPT_5_1_CODEX_MINI = "gpt-5.1-codex-mini",
    GPT_5_1_CODEX_MAX = "gpt-5.1-codex-max",
    GPT_5 = "gpt-5",
    GPT_5_MINI = "gpt-5-mini",
    GPT_5_NANO = "gpt-5-nano",
    GPT_5_CHAT = "gpt-5-chat",
    GPT_5_CODEX = "gpt-5-codex",
    GPT_5_PRO = "gpt-5-pro",
    GPT_5_TURBO = "gpt-5-turbo",

    // o-series
    O4_MINI = "o4-mini",
    O3 = "o3",
    O3_MINI = "o3-mini",
    O3_PRO = "o3-pro",
    O1 = "o1",
    O1_MINI = "o1-mini",
    O1_PREVIEW = "o1-preview",

    CODEX_MINI = "codex-mini",

    // GPT-4.1 / GPT-4o / GPT-4
    GPT_4_1 = "gpt-4.1",
    GPT_4_1_NANO = "gpt-4.1-nano",
    GPT_4_1_MINI = "gpt-4.1-mini",
    GPT_4O = "gpt-4o",
    GPT_4O_MINI = "gpt-4o-mini",
    GPT_4_TURBO = "gpt-4-turbo",
    GPT_4 = "gpt-4",
    GPT_4_32K = "gpt-4-32k",

    // GPT-3.5 (the values are spelled "gpt-35", without the dot)
    GPT_3_5_TURBO = "gpt-35-turbo",
    GPT_3_5_TURBO_INSTRUCT = "gpt-35-turbo-instruct"
}

/**
 * Model identifiers for Google Vertex AI.
 */
export declare enum VertexModels {
    // Anthropic Claude
    CLAUDE_4_6_OPUS = "claude-opus-4-6",
    CLAUDE_4_6_SONNET = "claude-sonnet-4-6",
    // NOTE(review): date suffix differs from AnthropicModels.CLAUDE_OPUS_4_5
    // ("...-20251101") - confirm which date is correct.
    CLAUDE_4_5_OPUS = "claude-opus-4-5@20251124",
    CLAUDE_4_5_SONNET = "claude-sonnet-4-5@20250929",
    CLAUDE_4_5_HAIKU = "claude-haiku-4-5@20251001",
    CLAUDE_4_0_SONNET = "claude-sonnet-4@20250514",
    CLAUDE_4_0_OPUS = "claude-opus-4@20250514",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_7_SONNET = "claude-3-7-sonnet@20250219",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_5_SONNET = "claude-3-5-sonnet-20241022",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_5_HAIKU = "claude-3-5-haiku-20241022",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_SONNET = "claude-3-sonnet-20240229",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_OPUS = "claude-3-opus-20240229",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_4_6_SONNET instead. */
    CLAUDE_3_HAIKU = "claude-3-haiku-20240307",

    // Google Gemini
    GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
    GEMINI_3_1_FLASH_LITE_PREVIEW = "gemini-3.1-flash-lite-preview",
    GEMINI_3_1_FLASH_IMAGE_PREVIEW = "gemini-3.1-flash-image-preview",
    GEMINI_3_1_PRO_PREVIEW_CUSTOMTOOLS = "gemini-3.1-pro-preview-customtools",
    GEMINI_3_FLASH_PREVIEW = "gemini-3-flash-preview",
    GEMINI_3_PRO_IMAGE_PREVIEW = "gemini-3-pro-image-preview",
    /** @deprecated SHUT DOWN March 9, 2026. Migrate to GEMINI_3_1_PRO_PREVIEW. */
    GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",
    GEMINI_2_5_PRO = "gemini-2.5-pro",
    GEMINI_2_5_FLASH = "gemini-2.5-flash",
    GEMINI_2_5_FLASH_LITE = "gemini-2.5-flash-lite",
    GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
    GEMINI_2_0_FLASH = "gemini-2.0-flash",
    GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
    GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
    /** @deprecated SHUT DOWN. Returns 404. Use GEMINI_2_5_FLASH or newer. */
    GEMINI_1_5_PRO = "gemini-1.5-pro-002",
    /** @deprecated SHUT DOWN. Returns 404. Use GEMINI_2_5_FLASH or newer. */
    GEMINI_1_5_FLASH = "gemini-1.5-flash-002"
}

/**
 * Model identifiers for Google AI Studio.
 */
export declare enum GoogleAIModels {
    // Gemini 3.x
    GEMINI_3_1_PRO_PREVIEW = "gemini-3.1-pro-preview",
    GEMINI_3_1_FLASH_LITE_PREVIEW = "gemini-3.1-flash-lite-preview",
    GEMINI_3_1_FLASH_IMAGE_PREVIEW = "gemini-3.1-flash-image-preview",
    GEMINI_3_1_PRO_PREVIEW_CUSTOMTOOLS = "gemini-3.1-pro-preview-customtools",
    GEMINI_3_FLASH_PREVIEW = "gemini-3-flash-preview",
    GEMINI_3_PRO_IMAGE_PREVIEW = "gemini-3-pro-image-preview",
    /** @deprecated SHUT DOWN March 9, 2026. Migrate to GEMINI_3_1_PRO_PREVIEW. */
    GEMINI_3_PRO_PREVIEW = "gemini-3-pro-preview",

    // Gemini 2.5
    GEMINI_2_5_PRO = "gemini-2.5-pro",
    GEMINI_2_5_FLASH = "gemini-2.5-flash",
    GEMINI_2_5_FLASH_LITE = "gemini-2.5-flash-lite",
    GEMINI_2_5_FLASH_IMAGE = "gemini-2.5-flash-image",
    GEMINI_2_5_FLASH_PREVIEW_TTS = "gemini-2.5-flash-preview-tts",
    GEMINI_2_5_PRO_PREVIEW_TTS = "gemini-2.5-pro-preview-tts",

    // Gemini 2.0
    /** @deprecated Retiring June 1, 2026. Use GEMINI_2_5_FLASH instead. */
    GEMINI_2_0_FLASH = "gemini-2.0-flash",
    GEMINI_2_0_FLASH_001 = "gemini-2.0-flash-001",
    GEMINI_2_0_FLASH_LITE = "gemini-2.0-flash-lite",
    GEMINI_2_0_FLASH_IMAGE = "gemini-2.0-flash-preview-image-generation",

    // Gemini 1.5
    /** @deprecated SHUT DOWN. Returns 404. Use GEMINI_2_5_FLASH or newer. */
    GEMINI_1_5_PRO = "gemini-1.5-pro",
    /** @deprecated SHUT DOWN. Returns 404. Use GEMINI_2_5_FLASH or newer. */
    GEMINI_1_5_FLASH = "gemini-1.5-flash",

    // Embeddings
    GEMINI_EMBEDDING = "gemini-embedding-001",
    GEMINI_EMBEDDING_2_PREVIEW = "gemini-embedding-2-preview",
    /** @deprecated SHUT DOWN Jan 14, 2026. Use GEMINI_EMBEDDING instead. */
    TEXT_EMBEDDING_004 = "text-embedding-004"
}

/**
 * Model identifiers for the Anthropic API (direct access).
 */
export declare enum AnthropicModels {
    CLAUDE_OPUS_4_6 = "claude-opus-4-6",
    CLAUDE_SONNET_4_6 = "claude-sonnet-4-6",
    CLAUDE_OPUS_4_5 = "claude-opus-4-5-20251101",
    CLAUDE_SONNET_4_5 = "claude-sonnet-4-5-20250929",
    CLAUDE_4_5_HAIKU = "claude-haiku-4-5-20251001",
    CLAUDE_OPUS_4_1 = "claude-opus-4-1-20250805",
    CLAUDE_OPUS_4_0 = "claude-opus-4-20250514",
    CLAUDE_SONNET_4_0 = "claude-sonnet-4-20250514",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
    CLAUDE_SONNET_3_7 = "claude-3-7-sonnet-20250219",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
    CLAUDE_3_5_SONNET = "claude-3-5-sonnet-20241022",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
    CLAUDE_3_5_HAIKU = "claude-3-5-haiku-20241022",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
    CLAUDE_3_SONNET = "claude-3-sonnet-20240229",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
    CLAUDE_3_OPUS = "claude-3-opus-20240229",
    /** @deprecated Retired from Anthropic API. Use CLAUDE_SONNET_4_6 instead. */
    CLAUDE_3_HAIKU = "claude-3-haiku-20240307"
}

/**
 * Model identifiers for Mistral AI.
 */
export declare enum MistralModels {
    MISTRAL_LARGE_LATEST = "mistral-large-latest",
    MISTRAL_LARGE_2512 = "mistral-large-2512",
    MISTRAL_MEDIUM_LATEST = "mistral-medium-latest",
    MISTRAL_MEDIUM_2508 = "mistral-medium-2508",
    MISTRAL_SMALL_LATEST = "mistral-small-latest",
    MISTRAL_SMALL_2506 = "mistral-small-2506",
    MAGISTRAL_MEDIUM_LATEST = "magistral-medium-latest",
    MAGISTRAL_SMALL_LATEST = "magistral-small-latest",
    MINISTRAL_14B_2512 = "ministral-14b-2512",
    MINISTRAL_8B_2512 = "ministral-8b-2512",
    MINISTRAL_3B_2512 = "ministral-3b-2512",
    CODESTRAL_LATEST = "codestral-latest",
    CODESTRAL_2508 = "codestral-2508",
    CODESTRAL_EMBED = "codestral-embed",
    DEVSTRAL_MEDIUM_LATEST = "devstral-medium-latest",
    DEVSTRAL_SMALL_LATEST = "devstral-small-latest",
    PIXTRAL_LARGE = "pixtral-large",
    PIXTRAL_12B = "pixtral-12b",
    VOXTRAL_SMALL_LATEST = "voxtral-small-latest",
    VOXTRAL_MINI_LATEST = "voxtral-mini-latest",
    DEVSTRAL_2 = "devstral-2512",
    DEVSTRAL_SMALL_2 = "devstral-small-2512",
    MAGISTRAL_MEDIUM_2509 = "magistral-medium-2509",
    MAGISTRAL_SMALL_2509 = "magistral-small-2509",
    VOXTRAL_MINI_TRANSCRIBE_2 = "voxtral-mini-2602",
    MISTRAL_OCR_3 = "mistral-ocr-2512",
    MISTRAL_OCR_LATEST = "mistral-ocr-latest",
    MISTRAL_NEMO = "mistral-nemo",
    MISTRAL_EMBED = "mistral-embed",
    MISTRAL_MODERATION_LATEST = "mistral-moderation-latest",
    MISTRAL_SMALL_4 = "mistral-small-2603",
    MISTRAL_SMALL_CREATIVE = "mistral-small-creative"
}

/**
 * Model tags for Ollama (local execution).
 * Every model listed can run locally, with no API key or cloud service.
 */
export declare enum OllamaModels {
    // Llama
    LLAMA4_SCOUT = "llama4:scout",
    LLAMA4_MAVERICK = "llama4:maverick",
    LLAMA4_LATEST = "llama4:latest",
    LLAMA3_3_LATEST = "llama3.3:latest",
    LLAMA3_3_70B = "llama3.3:70b",
    LLAMA3_2_LATEST = "llama3.2:latest",
    LLAMA3_2_3B = "llama3.2:3b",
    LLAMA3_2_1B = "llama3.2:1b",
    LLAMA3_1_8B = "llama3.1:8b",
    LLAMA3_1_70B = "llama3.1:70b",
    LLAMA3_1_405B = "llama3.1:405b",

    // Qwen / QwQ
    QWEN3_4B = "qwen3:4b",
    QWEN3_8B = "qwen3:8b",
    QWEN3_14B = "qwen3:14b",
    QWEN3_32B = "qwen3:32b",
    QWEN3_72B = "qwen3:72b",
    QWEN2_5_3B = "qwen2.5:3b",
    QWEN2_5_7B = "qwen2.5:7b",
    QWEN2_5_14B = "qwen2.5:14b",
    QWEN2_5_32B = "qwen2.5:32b",
    QWEN2_5_72B = "qwen2.5:72b",
    QWQ_32B = "qwq:32b",
    QWQ_LATEST = "qwq:latest",

    // DeepSeek
    DEEPSEEK_R1_1_5B = "deepseek-r1:1.5b",
    DEEPSEEK_R1_7B = "deepseek-r1:7b",
    DEEPSEEK_R1_8B = "deepseek-r1:8b",
    DEEPSEEK_R1_14B = "deepseek-r1:14b",
    DEEPSEEK_R1_32B = "deepseek-r1:32b",
    DEEPSEEK_R1_70B = "deepseek-r1:70b",
    DEEPSEEK_V3_671B = "deepseek-v3:671b",
    DEEPSEEK_V3_LATEST = "deepseek-v3:latest",

    // Mistral
    MISTRAL_LATEST = "mistral:latest",
    MISTRAL_7B = "mistral:7b",
    MISTRAL_SMALL_LATEST = "mistral-small:latest",
    MISTRAL_NEMO_LATEST = "mistral-nemo:latest",
    MISTRAL_LARGE_LATEST = "mistral-large:latest",

    // Gemma
    GEMMA3_LATEST = "gemma3:latest",
    GEMMA2_2B = "gemma2:2b",
    GEMMA2_9B = "gemma2:9b",
    GEMMA2_27B = "gemma2:27b",

    // Phi
    PHI4_LATEST = "phi4:latest",
    PHI4_14B = "phi4:14b",
    PHI3_MINI = "phi3:mini",
    PHI3_3_8B = "phi3:3.8b",
    PHI3_MEDIUM = "phi3:medium",
    PHI3_14B = "phi3:14b",

    // LLaVA
    LLAVA_7B = "llava:7b",
    LLAVA_13B = "llava:13b",
    LLAVA_34B = "llava:34b",
    LLAVA_LLAMA3_8B = "llava-llama3:8b",

    // Code models
    CODELLAMA_7B = "codellama:7b",
    CODELLAMA_13B = "codellama:13b",
    CODELLAMA_34B = "codellama:34b",
    CODELLAMA_70B = "codellama:70b",
    QWEN2_5_CODER_7B = "qwen2.5-coder:7b",
    QWEN2_5_CODER_32B = "qwen2.5-coder:32b",
    STARCODER2_3B = "starcoder2:3b",
    STARCODER2_7B = "starcoder2:7b",
    STARCODER2_15B = "starcoder2:15b",

    // Mixtral / Command R+
    MIXTRAL_8X7B = "mixtral:8x7b",
    MIXTRAL_8X22B = "mixtral:8x22b",
    COMMAND_R_PLUS = "command-r-plus:104b",

    // Further entries, kept in their original order
    GLM_5_LATEST = "glm-5:latest",
    KIMI_K2_5_LATEST = "kimi-k2.5:latest",
    QWEN3_5_LATEST = "qwen3.5:latest",
    QWEN3_CODER_LATEST = "qwen3-coder:latest",
    QWEN3_CODER_30B = "qwen3-coder:30b",
    DEEPSEEK_V3_2_LATEST = "deepseek-v3.2:latest",
    NEMOTRON_3_NANO_LATEST = "nemotron-3-nano:latest",
    NEMOTRON_3_NANO_30B = "nemotron-3-nano:30b",
    SMOLLM3_3B = "smollm3:3b",
    GPT_OSS_LATEST = "gpt-oss:latest"
}

/**
 * Commonly used model IDs for a LiteLLM proxy.
 * LiteLLM exposes 100+ models through a single proxy interface; IDs carry
 * a provider-specific prefix (e.g., "openai/", "anthropic/").
 */
export declare enum LiteLLMModels {
    // openai/
    OPENAI_GPT_5 = "openai/gpt-5",
    OPENAI_GPT_4O = "openai/gpt-4o",
    OPENAI_GPT_4O_MINI = "openai/gpt-4o-mini",
    OPENAI_GPT_4_TURBO = "openai/gpt-4-turbo",
    OPENAI_GPT_4 = "openai/gpt-4",
    OPENAI_GPT_3_5_TURBO = "openai/gpt-3.5-turbo",

    // anthropic/
    ANTHROPIC_CLAUDE_SONNET_4_5 = "anthropic/claude-sonnet-4-5-20250929",
    ANTHROPIC_CLAUDE_OPUS_4_1 = "anthropic/claude-opus-4-1-20250805",
    ANTHROPIC_CLAUDE_3_5_SONNET = "anthropic/claude-3-5-sonnet-20240620",
    ANTHROPIC_CLAUDE_3_HAIKU = "anthropic/claude-3-haiku-20240307",

    // vertex_ai/
    VERTEX_GEMINI_2_5_PRO = "vertex_ai/gemini-2.5-pro",
    VERTEX_GEMINI_1_5_PRO = "vertex_ai/gemini-1.5-pro",
    VERTEX_GEMINI_1_5_FLASH = "vertex_ai/gemini-1.5-flash",

    // gemini/
    GEMINI_2_5_PRO = "gemini/gemini-2.5-pro",
    GEMINI_2_0_FLASH = "gemini/gemini-2.0-flash",
    GEMINI_1_5_PRO = "gemini/gemini-1.5-pro",
    GEMINI_1_5_FLASH = "gemini/gemini-1.5-flash",

    // groq/
    GROQ_LLAMA_3_1_70B_VERSATILE = "groq/llama-3.1-70b-versatile",
    GROQ_LLAMA_3_1_8B_INSTANT = "groq/llama-3.1-8b-instant",
    GROQ_LLAMA_3_2_11B_VISION = "groq/llama-3.2-11b-vision-preview",
    GROQ_MIXTRAL_8X7B = "groq/mixtral-8x7b-32768",

    // together_ai/
    TOGETHER_LLAMA_2_70B_CHAT = "together_ai/togethercomputer/llama-2-70b-chat",
    TOGETHER_MIXTRAL_8X7B = "together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1",
    TOGETHER_CODELLAMA_34B = "together_ai/codellama/CodeLlama-34b-Instruct-hf",

    // deepinfra/
    DEEPINFRA_LLAMA_3_70B = "deepinfra/meta-llama/Meta-Llama-3-70B-Instruct",
    DEEPINFRA_LLAMA_2_70B = "deepinfra/meta-llama/Llama-2-70b-chat-hf",
    DEEPINFRA_MISTRAL_7B = "deepinfra/mistralai/Mistral-7B-Instruct-v0.1",

    // mistral/
    MISTRAL_LARGE = "mistral/mistral-large-latest",
    MISTRAL_SMALL = "mistral/mistral-small-latest",
    MISTRAL_MAGISTRAL_MEDIUM = "mistral/magistral-medium-2506",

    // bedrock/
    BEDROCK_CLAUDE_3_5_SONNET = "bedrock/anthropic.claude-3-5-sonnet-20240620-v1:0",
    BEDROCK_CLAUDE_3_HAIKU = "bedrock/anthropic.claude-3-haiku-20240307-v1:0",

    // Further entries, kept in their original order
    OPENAI_GPT_5_2 = "openai/gpt-5.2",
    OPENAI_GPT_5_2_CODEX = "openai/gpt-5.2-codex",
    ANTHROPIC_CLAUDE_OPUS_4_6 = "anthropic/claude-opus-4-6",
    ANTHROPIC_CLAUDE_SONNET_4_6 = "anthropic/claude-sonnet-4-6",
    GEMINI_3_1_PRO = "gemini/gemini-3.1-pro-preview",
    XAI_GROK_4_1_FAST = "xai/grok-4.1-fast",
    PERPLEXITY_SONAR_PRO = "perplexity/sonar-pro",
    PERPLEXITY_SONAR_REASONING_PRO = "perplexity/sonar-reasoning-pro"
}

/**
 * Model repository IDs for the Hugging Face Inference API.
 */
export declare enum HuggingFaceModels {
    // Meta Llama
    LLAMA_3_3_70B_INSTRUCT = "meta-llama/Llama-3.3-70B-Instruct",
    LLAMA_3_2_1B = "meta-llama/Llama-3.2-1B",
    LLAMA_3_2_3B_INSTRUCT = "meta-llama/Llama-3.2-3B-Instruct",
    LLAMA_3_1_8B = "meta-llama/Llama-3.1-8B",
    LLAMA_3_1_70B_INSTRUCT = "meta-llama/Llama-3.1-70B-Instruct",
    LLAMA_3_1_405B_INSTRUCT = "meta-llama/Llama-3.1-405B-Instruct",
    LLAMA_3_8B_INSTRUCT = "meta-llama/Meta-Llama-3-8B-Instruct",
    LLAMA_3_70B_INSTRUCT = "meta-llama/Meta-Llama-3-70B-Instruct",

    // Mistral
    MISTRAL_LARGE_3_675B = "mistralai/Mistral-Large-3-675B-Instruct-2512",
    MISTRAL_SMALL_3_1_24B = "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
    MISTRAL_SMALL_24B = "mistralai/Mistral-Small-24B-Instruct-2501",
    MISTRAL_7B_INSTRUCT = "mistralai/Mistral-7B-Instruct-v0.2",
    MIXTRAL_8X7B_INSTRUCT = "mistralai/Mixtral-8x7B-Instruct-v0.1",
    DEVSTRAL_2 = "mistralai/Devstral-2",

    // Qwen
    QWEN_2_5_7B = "Qwen/Qwen2.5-7B",
    QWEN_2_5_32B = "Qwen/Qwen2.5-32B",
    QWEN_2_5_72B_INSTRUCT = "Qwen/Qwen2.5-72B-Instruct",
    QWEN_2_5_CODER_7B = "Qwen/Qwen2.5-Coder-7B",
    QWEN_2_5_CODER_32B_INSTRUCT = "Qwen/Qwen2.5-Coder-32B-Instruct",
    QWQ_32B = "Qwen/QwQ-32B",
    QWEN_2_5_VL_32B = "Qwen/Qwen2.5-VL-32B-Instruct",

    // DeepSeek
    DEEPSEEK_R1 = "deepseek-ai/DeepSeek-R1",
    DEEPSEEK_V3 = "deepseek-ai/DeepSeek-V3",
    DEEPSEEK_V3_1 = "deepseek-ai/DeepSeek-V3.1",
    DEEPSEEK_V3_2_EXP = "deepseek-ai/DeepSeek-V3.2-Exp",

    // Microsoft Phi
    PHI_4 = "microsoft/phi-4",
    PHI_4_REASONING = "microsoft/Phi-4-reasoning",
    PHI_4_MINI_INSTRUCT = "microsoft/Phi-4-mini-instruct",
    PHI_4_MINI_REASONING = "microsoft/Phi-4-mini-reasoning",
    PHI_3_MINI_128K_INSTRUCT = "microsoft/Phi-3-mini-128k-instruct",
    PHI_3_VISION_128K_INSTRUCT = "microsoft/Phi-3-vision-128k-instruct",

    // Google Gemma
    GEMMA_3_270M = "google/gemma-3-270m",
    GEMMA_3_1B_IT = "google/gemma-3-1b-it",
    GEMMA_3_4B_IT = "google/gemma-3-4b-it",
    GEMMA_3_12B_IT = "google/gemma-3-12b-it",
    GEMMA_3_27B_IT = "google/gemma-3-27b-it",
    GEMMA_2_9B = "google/gemma-2-9b",
    GEMMA_2_27B = "google/gemma-2-27b",
    GEMMA_2B = "google/gemma-2b",
    GEMMA_7B = "google/gemma-7b",

    // Falcon, StarCoder, Code Llama, BLOOM
    FALCON_40B_INSTRUCT = "tiiuae/falcon-40b-instruct",
    FALCON_180B_CHAT = "tiiuae/falcon-180B-chat",
    STARCODER2_15B = "bigcode/starcoder2-15b",
    CODELLAMA_34B_INSTRUCT = "codellama/CodeLlama-34b-Instruct-hf",
    BLOOM_7B1 = "bigscience/bloom-7b1",
    BLOOM_1B3 = "bigscience/bloom-1b3",

    // Further entries, kept in their original order
    GLM_5 = "zai-org/GLM-5",
    QWEN_3_5_397B_A17B = "Qwen/Qwen3.5-397B-A17B",
    NEMOTRON_3_NANO_30B = "nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16",
    SMOLLM3_3B = "HuggingFaceTB/SmolLM3-3B",
    FALCON_3_7B_INSTRUCT = "tiiuae/Falcon3-7B-Instruct",
    FALCON_3_10B_INSTRUCT = "tiiuae/Falcon3-10B-Instruct"
}

/**
 * Model identifiers for AWS SageMaker JumpStart.
 * https://docs.aws.amazon.com/sagemaker/latest/dg/jumpstart-foundation-models-latest.html
 */
export declare enum SageMakerModels {
    LLAMA_4_SCOUT_17B_16E = "meta-llama-4-scout-17b-16e-instruct",
    LLAMA_4_MAVERICK_17B_128E = "meta-llama-4-maverick-17b-128e-instruct",
    LLAMA_4_MAVERICK_17B_128E_FP8 = "meta-llama-4-maverick-17b-128e-instruct-fp8",
    LLAMA_3_8B = "meta-llama-3-8b-instruct",
    LLAMA_3_70B = "meta-llama-3-70b-instruct",
    CODE_LLAMA_7B = "meta-code-llama-7b",
    CODE_LLAMA_13B = "meta-code-llama-13b",
    CODE_LLAMA_34B = "meta-code-llama-34b",
    MISTRAL_SMALL_24B = "mistral-small-24b-instruct-2501",
    MISTRAL_7B_INSTRUCT = "mistral-7b-instruct-v0.3",
    MIXTRAL_8X7B = "mistral-mixtral-8x7b-instruct-v0.1",
    MIXTRAL_8X22B = "mistral-mixtral-8x22b-instruct-v0.1",
    FALCON_3_7B = "tii-falcon-3-7b-instruct",
    FALCON_3_10B = "tii-falcon-3-10b-instruct",
    FALCON_40B = "tii-falcon-40b-instruct",
    FALCON_180B = "tii-falcon-180b",
    NEMOTRON_3_NANO_30B = "nvidia-nemotron-3-nano-30b",
    QWEN3_VL_8B = "qwen3-vl-8b-instruct"
}

/**
 * API version strings for several providers.
 */
export declare enum APIVersions {
    AZURE_LATEST = "2025-04-01-preview",
    AZURE_STABLE = "2024-10-21",
    AZURE_LEGACY = "2023-12-01-preview",
    OPENAI_CURRENT = "v1",
    OPENAI_BETA = "v1-beta",
    GOOGLE_AI_CURRENT = "v1",
    GOOGLE_AI_BETA = "v1beta",
    ANTHROPIC_CURRENT = "2023-06-01"
}

/**
 * Category labels for errors.
 */
export declare enum ErrorCategory {
    VALIDATION = "validation",
    TIMEOUT = "timeout",
    NETWORK = "network",
    RESOURCE = "resource",
    PERMISSION = "permission",
    CONFIGURATION = "configuration",
    EXECUTION = "execution",
    SYSTEM = "system",
    /**
     * Cancellation requested by the caller through an AbortSignal.
     * Kept separate from system errors because it reflects a
     * user/control-plane decision rather than an SDK or provider failure.
     * Consumers can branch on this category to tell "user cancelled" apart
     * from "server error" without matching on message strings.
     */
    ABORT = "abort"
}

/**
 * Severity labels for errors.
 */
export declare enum ErrorSeverity {
    LOW = "low",
    MEDIUM = "medium",
    HIGH = "high",
    CRITICAL = "critical"
}

/**
 * Beta feature flags for the Anthropic API.
 *
 * @description Flags that can be enabled for additional functionality:
 * - CLAUDE_CODE: Claude Code beta features for development workflows
 * - INTERLEAVED_THINKING: interleaved thinking in responses
 * - FINE_GRAINED_STREAMING: fine-grained tool streaming for better UX
 */
export declare enum AnthropicBetaFeature {
    CLAUDE_CODE = "claude-code-20250219",
    INTERLEAVED_THINKING = "interleaved-thinking-2025-05-14",
    FINE_GRAINED_STREAMING = "fine-grained-tool-streaming-2025-05-14"
}

/**
 * Model identifiers for DeepSeek.
 * Docs: https://api-docs.deepseek.com/quick_start/pricing
 */
export declare enum DeepSeekModels {
    /** General-purpose chat model (DeepSeek-V3) */
    DEEPSEEK_CHAT = "deepseek-chat",
    /** Reasoning model (DeepSeek-R1); exposes reasoning_content */
    DEEPSEEK_REASONER = "deepseek-reasoner"
}

/** *
Selected NVIDIA NIM Models
 * Full catalog: https://build.nvidia.com/models
 * Note: NIM hosts hundreds of models; pass arbitrary IDs via --model.
 */
export declare enum NvidiaNimModels {
    // Meta Llama
    LLAMA_3_3_70B_INSTRUCT = "meta/llama-3.3-70b-instruct",
    LLAMA_3_1_405B_INSTRUCT = "meta/llama-3.1-405b-instruct",
    LLAMA_3_1_70B_INSTRUCT = "meta/llama-3.1-70b-instruct",
    LLAMA_3_2_90B_VISION = "meta/llama-3.2-90b-vision-instruct",
    LLAMA_3_2_11B_VISION = "meta/llama-3.2-11b-vision-instruct",

    // NVIDIA Nemotron
    NEMOTRON_SUPER_49B = "nvidia/llama-3.3-nemotron-super-49b-v1",
    NEMOTRON_NANO_8B = "nvidia/llama-3.1-nemotron-nano-8b-v1",
    NEMOTRON_70B_INSTRUCT = "nvidia/llama-3.1-nemotron-70b-instruct",

    // DeepSeek
    DEEPSEEK_R1 = "deepseek-ai/deepseek-r1",
    DEEPSEEK_R1_DISTILL_LLAMA_70B = "deepseek-ai/deepseek-r1-distill-llama-70b",

    // Mistral
    MIXTRAL_8X22B_INSTRUCT = "mistralai/mixtral-8x22b-instruct-v0.1",
    MIXTRAL_8X7B_INSTRUCT = "mistralai/mixtral-8x7b-instruct-v0.1",

    // Other vendors
    PHI_4 = "microsoft/phi-4",
    GEMMA_3_27B_IT = "google/gemma-3-27b-it",
    GLM_4_5 = "z-ai/glm4.5"
}

/**
 * LM Studio serves whichever GGUF models the user has downloaded, so no
 * fixed model list is declared.
 * Default: empty string → triggers /v1/models auto-discovery.
 */
export declare enum LMStudioModels {
    /** Sentinel (empty string): triggers auto-discovery from /v1/models */
    AUTO_DISCOVER = ""
}

/**
 * llama.cpp serves the single model that was loaded at server startup.
 * Default: empty string → uses whatever is loaded.
 */
export declare enum LlamaCppModels {
    /** Sentinel (empty string): uses the model loaded by the llama-server process */
    AUTO_DISCOVER = ""
}

/**
 * xAI Grok models — accessible at api.x.ai/v1 (OpenAI-compatible).
* @see https://docs.x.ai/docs/models
 */
export declare enum XaiModels {
    /** Grok 3 (latest): flagship, best suited to complex reasoning */
    GROK_3 = "grok-3",
    /** Grok 3 Mini: faster and cheaper variant of Grok 3 */
    GROK_3_MINI = "grok-3-mini",
    /** Grok 2 (latest): previous flagship, still supported */
    GROK_2_LATEST = "grok-2-latest",
    /** Grok 2 Vision: multimodal (text + images) */
    GROK_2_VISION_LATEST = "grok-2-vision-latest",
    /** Grok beta: pre-release / experimental access */
    GROK_BETA = "grok-beta"
}

/**
 * Models hosted by Groq (Llama / Mistral / Gemma) at sub-100ms inference.
 * @see https://console.groq.com/docs/models
 */
export declare enum GroqModels {
    /** Llama 3.3 70B Versatile: production default */
    LLAMA_3_3_70B_VERSATILE = "llama-3.3-70b-versatile",
    /** Llama 3.1 8B Instant: low-latency tier */
    LLAMA_3_1_8B_INSTANT = "llama-3.1-8b-instant",
    /** Gemma 2 9B IT: Google's lightweight instruct model */
    GEMMA_2_9B_IT = "gemma2-9b-it",
    /** Mixtral 8x7B 32K: Mistral's MoE model */
    MIXTRAL_8X7B_32768 = "mixtral-8x7b-32768",
    /** Llama Guard 3 8B: safety classifier */
    LLAMA_GUARD_3_8B = "llama-guard-3-8b",
    /** Llama 3.2 90B Vision Preview: multimodal */
    LLAMA_3_2_90B_VISION_PREVIEW = "llama-3.2-90b-vision-preview",
    /** Llama 3.2 11B Vision Preview: smaller multimodal model */
    LLAMA_3_2_11B_VISION_PREVIEW = "llama-3.2-11b-vision-preview"
}

/**
 * Cohere Command + Embed models.
 * @see https://docs.cohere.com/docs/models
 *
 * Note: bare aliases `command-r` and `command-r-plus` were retired on
 * September 15, 2025. Use the dated variants instead.
*/
export declare enum CohereModels {
    /** Command A (March 2025): current flagship chat model */
    COMMAND_A = "command-a-03-2025",
    /** Command A Reasoning (Aug 2025): explicit reasoning traces */
    COMMAND_A_REASONING = "command-a-reasoning-08-2025",
    /** Command R+, dated (Aug 2024): last supported R+ variant */
    COMMAND_R_PLUS = "command-r-plus-08-2024",
    /** Command R, dated (Aug 2024): last supported R variant */
    COMMAND_R = "command-r-08-2024",
    /** Command R7B (Dec 2024): most compact */
    COMMAND_R7B = "command-r7b-12-2024",
    /** Embed v3, multilingual */
    EMBED_MULTILINGUAL_V3 = "embed-multilingual-v3.0",
    /** Embed v3, English */
    EMBED_ENGLISH_V3 = "embed-english-v3.0",
    /** Rerank v3, multilingual */
    RERANK_MULTILINGUAL_V3 = "rerank-multilingual-v3.0",
    /** Rerank v3, English */
    RERANK_ENGLISH_V3 = "rerank-english-v3.0"
}

/**
 * Models hosted by Together AI, an open-model gateway.
 * @see https://docs.together.ai/docs/serverless-models
 */
export declare enum TogetherAIModels {
    /** Llama 3.3 70B Instruct Turbo: production default */
    LLAMA_3_3_70B_INSTRUCT_TURBO = "meta-llama/Llama-3.3-70B-Instruct-Turbo",
    /** Llama 3.1 405B Instruct Turbo: flagship size */
    LLAMA_3_1_405B_INSTRUCT_TURBO = "meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo",
    /** Llama 3.1 70B Instruct Turbo */
    LLAMA_3_1_70B_INSTRUCT_TURBO = "meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo",
    /** Llama 3.1 8B Instruct Turbo: fastest */
    LLAMA_3_1_8B_INSTRUCT_TURBO = "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
    /** Mixtral 8x22B Instruct */
    MIXTRAL_8X22B_INSTRUCT = "mistralai/Mixtral-8x22B-Instruct-v0.1",
    /** Mixtral 8x7B Instruct */
    MIXTRAL_8X7B_INSTRUCT = "mistralai/Mixtral-8x7B-Instruct-v0.1",
    /** Qwen 2.5 72B Instruct Turbo */
    QWEN_2_5_72B_INSTRUCT_TURBO = "Qwen/Qwen2.5-72B-Instruct-Turbo",
    /** Qwen 2.5 Coder 32B Instruct */
    QWEN_2_5_CODER_32B = "Qwen/Qwen2.5-Coder-32B-Instruct",
    /** DeepSeek R1: reasoning */
    DEEPSEEK_R1 = "deepseek-ai/DeepSeek-R1",
    /** DeepSeek V3 */
    DEEPSEEK_V3 = "deepseek-ai/DeepSeek-V3",
    /** Google Gemma 2 27B IT */
    GEMMA_2_27B_IT = "google/gemma-2-27b-it",
    /** WizardLM 2 8x22B */
    WIZARDLM_2_8X22B = "microsoft/WizardLM-2-8x22B"
}

/**
 * Models hosted by Fireworks AI (fast open-model serving).
 * @see https://fireworks.ai/models
 *
 * Note: the older Llama / Mixtral / Qwen 2.5 generation was rotated
 * out of Fireworks' serverless tier. The current shipping defaults follow.
 */
export declare enum FireworksModels {
    /** DeepSeek V4 Pro: current general-purpose default */
    DEEPSEEK_V4_PRO = "accounts/fireworks/models/deepseek-v4-pro",
    /** GLM 5.1: Zhipu flagship */
    GLM_5P1 = "accounts/fireworks/models/glm-5p1",
    /** GLM 5: broader coverage */
    GLM_5 = "accounts/fireworks/models/glm-5",
    /** Kimi K2.6: Moonshot flagship */
    KIMI_K2P6 = "accounts/fireworks/models/kimi-k2p6",
    /** Kimi K2.5: the preceding Kimi release */
    KIMI_K2P5 = "accounts/fireworks/models/kimi-k2p5",
    /** GPT-OSS 120B: Apache-2.0 OpenAI weights */
    GPT_OSS_120B = "accounts/fireworks/models/gpt-oss-120b"
}

/**
 * Perplexity Sonar models, which come with built-in web grounding.
 * @see https://docs.perplexity.ai/guides/model-cards
 */
export declare enum PerplexityModels {
    /** Sonar: production default with web search */
    SONAR = "sonar",
    /** Sonar Pro: better reasoning + larger context */
    SONAR_PRO = "sonar-pro",
    /** Sonar Reasoning: explicit reasoning traces */
    SONAR_REASONING = "sonar-reasoning",
    /** Sonar Reasoning Pro: flagship reasoning + web */
    SONAR_REASONING_PRO = "sonar-reasoning-pro",
    /** Sonar Deep Research: long-form research with citations */
    SONAR_DEEP_RESEARCH = "sonar-deep-research"
}

/**
 * Cloudflare Workers AI models — edge-served open models.
* @see https://developers.cloudflare.com/workers-ai/models/
 */
export declare enum CloudflareModels {
    // Every id below is namespaced as `@cf/<vendor>/<model>`.
    /** Llama 3.3 70B Instruct (FP8 fast) */
    LLAMA_3_3_70B_FAST = "@cf/meta/llama-3.3-70b-instruct-fp8-fast",
    /** Llama 3.1 70B Instruct */
    LLAMA_3_1_70B_INSTRUCT = "@cf/meta/llama-3.1-70b-instruct",
    /** Llama 3.1 8B Instruct fast */
    LLAMA_3_1_8B_FAST = "@cf/meta/llama-3.1-8b-instruct-fast",
    /** Llama 3.2 11B Vision Instruct */
    LLAMA_3_2_11B_VISION = "@cf/meta/llama-3.2-11b-vision-instruct",
    /** Mistral 7B Instruct v0.2 */
    MISTRAL_7B_INSTRUCT_V0_2 = "@cf/mistral/mistral-7b-instruct-v0.2",
    /** Qwen 1.5 14B Chat AWQ (the `1P5` in the member name stands for 1.5) */
    QWEN_1P5_14B_CHAT_AWQ = "@cf/qwen/qwen1.5-14b-chat-awq",
    /** Gemma 2B IT — the id selects the `-lora` variant */
    GEMMA_2B_IT_LORA = "@cf/google/gemma-2b-it-lora"
}
/**
 * Voyage AI embedding models — top-tier RAG embedders.
 *
 * Ids are bare `voyage-*` names with no owner prefix.
 * @see https://docs.voyageai.com/docs/embeddings
 */
export declare enum VoyageModels {
    /** Voyage 3.5 — latest general-purpose (default) */
    VOYAGE_3_5 = "voyage-3.5",
    /** Voyage 3.5 Lite — smaller / cheaper */
    VOYAGE_3_5_LITE = "voyage-3.5-lite",
    /** Voyage 3 Large — flagship size */
    VOYAGE_3_LARGE = "voyage-3-large",
    /** Voyage Code 3 — code-tuned */
    VOYAGE_CODE_3 = "voyage-code-3",
    /** Voyage Finance 2 — domain-tuned */
    VOYAGE_FINANCE_2 = "voyage-finance-2",
    /** Voyage Law 2 — domain-tuned */
    VOYAGE_LAW_2 = "voyage-law-2",
    /** Voyage Multilingual 2 */
    VOYAGE_MULTILINGUAL_2 = "voyage-multilingual-2"
}
/**
 * Jina AI embedding + reranking models.
 * @see https://jina.ai/embeddings/
 */
export declare enum JinaModels {
    // --- Embedding models ---
    /** Jina Embeddings v3 — flagship multilingual (default) */
    JINA_EMBEDDINGS_V3 = "jina-embeddings-v3",
    /** Jina Embeddings v2 base English */
    JINA_EMBEDDINGS_V2_BASE_EN = "jina-embeddings-v2-base-en",
    /** Jina Embeddings v2 small English */
    JINA_EMBEDDINGS_V2_SMALL_EN = "jina-embeddings-v2-small-en",
    /** Jina Embeddings v2 base code */
    JINA_EMBEDDINGS_V2_BASE_CODE = "jina-embeddings-v2-base-code",
    /**
     * Jina Embeddings v2 base multilingual.
     *
     * NOTE(review): the id ends in `-zh` even though the member is named
     * MULTILINGUAL — confirm this is the intended model before relying on it
     * for other languages.
     */
    JINA_EMBEDDINGS_V2_BASE_MULTILINGUAL = "jina-embeddings-v2-base-zh",
    /** Jina ColBERT v2 — late-interaction retrieval */
    JINA_COLBERT_V2 = "jina-colbert-v2",
    // --- Reranker models ---
    /** Jina Reranker v2 base multilingual */
    JINA_RERANKER_V2_BASE_MULTILINGUAL = "jina-reranker-v2-base-multilingual",
    /** Jina Reranker v1 turbo English */
    JINA_RERANKER_V1_TURBO_EN = "jina-reranker-v1-turbo-en"
}
/**
 * Stability AI image generation models (api.stability.ai).
 *
 * The Stable Diffusion 3.5 ids use the compact `sd3.5-` prefix.
 * @see https://platform.stability.ai/docs/api-reference
 */
export declare enum StabilityModels {
    /** Stable Image Ultra — flagship quality (default) */
    STABLE_IMAGE_ULTRA = "stable-image-ultra",
    /** Stable Image Core — fast tier */
    STABLE_IMAGE_CORE = "stable-image-core",
    /** Stable Diffusion 3.5 Large */
    SD_3_5_LARGE = "sd3.5-large",
    /** Stable Diffusion 3.5 Large Turbo */
    SD_3_5_LARGE_TURBO = "sd3.5-large-turbo",
    /** Stable Diffusion 3.5 Medium */
    SD_3_5_MEDIUM = "sd3.5-medium"
}
/**
 * Ideogram image generation models.
 *
 * Unlike the other enums here, the ids are upper-case `V_<n>` tokens rather
 * than lower-case slugs.
 * @see https://docs.ideogram.ai/api-reference/api-reference/post-v-1-ideogram-v-3-generate
 */
export declare enum IdeogramModels {
    /** Ideogram V3 — latest with strong typography (default) */
    IDEOGRAM_V3 = "V_3",
    /** Ideogram V2 */
    IDEOGRAM_V2 = "V_2",
    /** Ideogram V2 Turbo — fast tier */
    IDEOGRAM_V2_TURBO = "V_2_TURBO",
    /** Ideogram V1 */
    IDEOGRAM_V1 = "V_1"
}
/**
 * Recraft image generation models — vector / illustration focus.
* @see https://www.recraft.ai/docs
 */
export declare enum RecraftModels {
    /** Recraft V3 — flagship raster (default) */
    RECRAFT_V3 = "recraftv3",
    /** Recraft V3 SVG — vector output */
    RECRAFT_V3_SVG = "recraftv3-svg",
    /** Recraft V2 */
    RECRAFT_V2 = "recraftv2"
}
/**
 * Replicate hosted models (LLMs only — image / video / avatar / music
 * accessed via dedicated handlers).
 *
 * Replicate accepts arbitrary `owner/name` or `owner/name:version`; this
 * enum lists popular LLM defaults. Pass any model id via `--model`.
 * All ids listed here use the unversioned `owner/name` form.
 *
 * @see https://replicate.com/explore
 */
export declare enum ReplicateModels {
    /** Meta Llama 3.1 405B Instruct */
    LLAMA_3_1_405B_INSTRUCT = "meta/meta-llama-3.1-405b-instruct",
    /** Meta Llama 3 70B Instruct (stable; the meta-llama-3.1-70b variant was retired upstream) */
    LLAMA_3_70B_INSTRUCT = "meta/meta-llama-3-70b-instruct",
    /** Meta Llama 3 8B Instruct */
    LLAMA_3_8B_INSTRUCT = "meta/meta-llama-3-8b-instruct",
    /** Mistral 7B Instruct v0.2 */
    MISTRAL_7B_INSTRUCT_V02 = "mistralai/mistral-7b-instruct-v0.2",
    /** Mixtral 8x7B Instruct v0.1 */
    MIXTRAL_8X7B_INSTRUCT_V01 = "mistralai/mixtral-8x7b-instruct-v0.1"
}
/**
 * Buffer time in milliseconds before token expiry to trigger refresh
 *
 * @description Tokens are refreshed 5 minutes before expiry to prevent
 * authentication failures during ongoing operations
 *
 * NOTE(review): this declaration exposes only the `number` type; the
 * concrete value lives in the implementation — confirm it matches the
 * 5 minutes stated above.
 */
export declare const TOKEN_EXPIRY_BUFFER_MS: number;