UNPKG

@juspay/neurolink

Version:

Universal AI Development Platform with working MCP integration, multi-provider support, voice (TTS/STT/realtime), and professional CLI. 58+ external MCP servers discoverable, multimodal file processing, RAG pipelines. Build, test, and deploy AI applicatio

1,725 lines (1,724 loc) 69.8 kB
/** * Model Registry for NeuroLink CLI Commands * Provides centralized model data for models command system * Part of Phase 4.1 - Models Command System */ import { DEFAULT_MODEL_ALIASES } from "../types/index.js"; import { AIProviderName, OpenAIModels, AzureOpenAIModels, GoogleAIModels, AnthropicModels, BedrockModels, MistralModels, OllamaModels, } from "../constants/enums.js"; /** * Comprehensive model registry */ export const MODEL_REGISTRY = { // OpenAI Models [OpenAIModels.GPT_4O]: { id: OpenAIModels.GPT_4O, name: "GPT-4 Omni", provider: AIProviderName.OPENAI, description: "Most capable OpenAI model with vision and advanced reasoning", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.005, outputCostPer1K: 0.015, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 128000, maxOutputTokens: 4096, maxRequestsPerMinute: 500, }, useCases: { coding: 9, creative: 8, analysis: 9, conversation: 9, reasoning: 9, translation: 8, summarization: 8, }, aliases: ["gpt4o", "gpt-4-omni", "openai-flagship"], deprecated: false, isLocal: false, // Cloud-based model releaseDate: "2024-05-13", category: "general", }, [OpenAIModels.GPT_4O_MINI]: { id: OpenAIModels.GPT_4O_MINI, name: "GPT-4 Omni Mini", provider: AIProviderName.OPENAI, description: "Fast and cost-effective model with strong performance", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.00015, outputCostPer1K: 0.0006, currency: "USD", }, performance: { speed: "fast", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 128000, maxOutputTokens: 16384, maxRequestsPerMinute: 1000, }, useCases: { coding: 8, creative: 7, analysis: 8, conversation: 8, reasoning: 8, translation: 8, summarization: 9, }, aliases: ["gpt4o-mini", "gpt-4-mini", "fastest", "cheap"], deprecated: false, isLocal: false, // Cloud-based model releaseDate: "2024-07-18", category: "general", }, // OpenAI GPT-5 Series [OpenAIModels.GPT_5]: { id: OpenAIModels.GPT_5, name: "GPT-5", provider: AIProviderName.OPENAI, description: "OpenAI's most advanced model with breakthrough reasoning and multimodal capabilities", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.01, outputCostPer1K: 0.03, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 256000, maxOutputTokens: 32768, maxRequestsPerMinute: 200, }, useCases: { coding: 10, creative: 10, analysis: 10, conversation: 10, reasoning: 10, translation: 9, summarization: 9, }, aliases: ["gpt5", "gpt-5-flagship", "openai-latest"], deprecated: false, isLocal: false, releaseDate: "2025-08-07", category: "reasoning", }, [OpenAIModels.GPT_5_MINI]: { id: OpenAIModels.GPT_5_MINI, name: "GPT-5 Mini", provider: AIProviderName.OPENAI, description: "Fast and efficient GPT-5 variant for everyday tasks", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.002, outputCostPer1K: 0.006, currency: "USD", }, performance: { speed: "fast", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 128000, maxOutputTokens: 16384, maxRequestsPerMinute: 500, }, useCases: { coding: 8, creative: 8, analysis: 8, conversation: 9, reasoning: 8, translation: 8, summarization: 9, }, aliases: ["gpt5-mini", "gpt-5-fast"], deprecated: false, isLocal: false, releaseDate: "2025-08-07", category: "general", }, // OpenAI O-Series Reasoning Models [OpenAIModels.O3]: { id: OpenAIModels.O3, name: "O3", provider: AIProviderName.OPENAI, description: "Advanced reasoning model with extended thinking capabilities for complex tasks", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.015, outputCostPer1K: 0.06, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 100000, maxRequestsPerMinute: 100, }, useCases: { coding: 10, creative: 8, analysis: 10, conversation: 7, reasoning: 10, translation: 7, summarization: 8, }, aliases: ["o3-reasoning", "o3-thinking"], deprecated: false, isLocal: false, releaseDate: "2025-01-31", category: "reasoning", }, [OpenAIModels.O3_MINI]: { id: OpenAIModels.O3_MINI, name: "O3 Mini", provider: AIProviderName.OPENAI, description: "Cost-effective reasoning model with strong logical capabilities", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.003, outputCostPer1K: 0.012, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 65536, maxRequestsPerMinute: 200, }, useCases: { coding: 9, creative: 6, analysis: 9, conversation: 7, reasoning: 9, translation: 6, summarization: 7, }, aliases: ["o3-mini-reasoning"], deprecated: false, isLocal: false, releaseDate: "2025-01-31", category: "reasoning", }, [OpenAIModels.GPT_5_NANO]: { id: OpenAIModels.GPT_5_NANO, name: "GPT-5 Nano", provider: AIProviderName.OPENAI, description: "Fastest and most cost-effective GPT-5 variant for simple tasks", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.00005, outputCostPer1K: 0.0004, currency: "USD", }, performance: { speed: "fast", quality: "medium", accuracy: "medium", }, limits: { maxContextTokens: 272000, maxOutputTokens: 128000, maxRequestsPerMinute: 2000, }, useCases: { coding: 6, creative: 6, analysis: 6, conversation: 8, reasoning: 6, translation: 7, summarization: 8, }, aliases: ["gpt5-nano", "gpt-5-cheapest"], deprecated: false, isLocal: false, releaseDate: "2025-08-07", category: "general", }, // OpenAI GPT-5.2 Series (Released December 11, 2025) - Latest flagship models [OpenAIModels.GPT_5_2]: { id: OpenAIModels.GPT_5_2, name: "GPT-5.2 Thinking", provider: AIProviderName.OPENAI, description: "OpenAI's latest flagship model with deep reasoning capabilities, 100% on AIME 2025, 80% SWE-bench Verified", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.00175, outputCostPer1K: 0.014, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 256000, maxOutputTokens: 64000, maxRequestsPerMinute: 150, }, useCases: { coding: 10, creative: 10, analysis: 10, conversation: 9, reasoning: 10, translation: 9, summarization: 9, }, aliases: ["gpt52", "gpt-5.2-thinking", "openai-latest-reasoning"], deprecated: false, isLocal: false, releaseDate: "2025-12-11", category: "reasoning", }, [OpenAIModels.GPT_5_2_CHAT_LATEST]: { id: OpenAIModels.GPT_5_2_CHAT_LATEST, name: "GPT-5.2 Instant", provider: AIProviderName.OPENAI, description: "Fast everyday model for quick tasks with excellent performance across all domains", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.00175, outputCostPer1K: 0.014, currency: "USD", }, performance: { speed: "fast", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 256000, maxOutputTokens: 32000, maxRequestsPerMinute: 300, }, useCases: { coding: 9, creative: 9, analysis: 9, conversation: 10, reasoning: 9, translation: 9, summarization: 9, }, aliases: ["gpt52-chat", "gpt-5.2-instant", "gpt52-fast"], deprecated: false, isLocal: false, releaseDate: "2025-12-11", category: "general", }, [OpenAIModels.GPT_5_2_PRO]: { id: OpenAIModels.GPT_5_2_PRO, name: "GPT-5.2 Pro", provider: AIProviderName.OPENAI, description: "Highest quality model for science, math, and complex problem-solving with 92.4% GPQA Diamond performance", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.021, outputCostPer1K: 0.168, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 256000, maxOutputTokens: 128000, maxRequestsPerMinute: 50, }, useCases: { coding: 10, creative: 9, analysis: 10, conversation: 8, reasoning: 10, translation: 9, summarization: 9, }, aliases: ["gpt52-pro", "gpt-5.2-professional", "openai-science"], deprecated: false, isLocal: false, releaseDate: "2025-12-11", category: "reasoning", }, // OpenAI GPT-4.1 Series (1M context window) [OpenAIModels.GPT_4_1]: { id: OpenAIModels.GPT_4_1, name: "GPT-4.1", provider: AIProviderName.OPENAI, description: "Advanced coding model with 1 million token context window", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.002, outputCostPer1K: 0.008, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 1000000, maxOutputTokens: 128000, maxRequestsPerMinute: 200, }, useCases: { coding: 10, creative: 8, analysis: 9, conversation: 8, reasoning: 9, translation: 8, summarization: 9, }, aliases: ["gpt-4.1", "gpt41", "million-context"], deprecated: false, isLocal: false, releaseDate: "2025-04-14", category: "coding", }, [OpenAIModels.GPT_4_1_MINI]: { id: OpenAIModels.GPT_4_1_MINI, name: "GPT-4.1 Mini", provider: AIProviderName.OPENAI, description: "Fast GPT-4.1 variant with 1M context for efficient coding", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.0004, outputCostPer1K: 0.0016, currency: "USD", }, performance: { speed: "fast", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 1000000, maxOutputTokens: 128000, maxRequestsPerMinute: 500, }, useCases: { coding: 9, creative: 7, analysis: 8, conversation: 8, reasoning: 8, translation: 8, summarization: 9, }, aliases: ["gpt-4.1-mini", "gpt41-mini"], deprecated: false, isLocal: false, releaseDate: "2025-04-14", category: "coding", }, [OpenAIModels.GPT_4_1_NANO]: { id: OpenAIModels.GPT_4_1_NANO, name: "GPT-4.1 Nano", provider: AIProviderName.OPENAI, description: "Most cost-effective GPT-4.1 variant with 1M context", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.0001, outputCostPer1K: 0.0004, currency: "USD", }, performance: { speed: "fast", quality: "medium", accuracy: "medium", }, limits: { maxContextTokens: 1000000, maxOutputTokens: 128000, maxRequestsPerMinute: 1000, }, useCases: { coding: 7, creative: 6, analysis: 7, conversation: 7, reasoning: 7, translation: 7, summarization: 8, }, aliases: ["gpt-4.1-nano", "gpt41-nano"], deprecated: false, isLocal: false, releaseDate: "2025-04-14", category: "coding", }, // OpenAI O-Series Additional Models [OpenAIModels.O3_PRO]: { id: OpenAIModels.O3_PRO, name: "O3 Pro", provider: AIProviderName.OPENAI, description: "Most powerful reasoning model for complex scientific and coding tasks", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.03, outputCostPer1K: 0.12, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 100000, maxRequestsPerMinute: 50, }, useCases: { coding: 10, creative: 7, analysis: 10, conversation: 6, reasoning: 10, translation: 6, summarization: 7, }, aliases: ["o3-pro", "o3-professional"], deprecated: false, isLocal: false, releaseDate: "2025-04-16", category: "reasoning", }, [OpenAIModels.O4_MINI]: { id: OpenAIModels.O4_MINI, name: "O4 Mini", provider: AIProviderName.OPENAI, description: "Fast reasoning model optimized for math, coding, and visual tasks", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.003, outputCostPer1K: 0.012, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 100000, maxRequestsPerMinute: 200, }, useCases: { coding: 9, creative: 6, analysis: 9, conversation: 7, reasoning: 10, translation: 6, summarization: 7, }, aliases: ["o4-mini", "o4-fast"], deprecated: false, isLocal: false, releaseDate: "2025-04-16", category: "reasoning", }, [OpenAIModels.O1]: { id: OpenAIModels.O1, name: "O1", provider: AIProviderName.OPENAI, description: "Premium reasoning model with highest capability for mission-critical tasks", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.15, outputCostPer1K: 0.6, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 128000, maxOutputTokens: 32768, maxRequestsPerMinute: 50, }, useCases: { coding: 10, creative: 7, analysis: 10, conversation: 6, reasoning: 10, translation: 6, summarization: 7, }, aliases: ["o1-full", "o1-premium"], deprecated: false, isLocal: false, releaseDate: "2024-09-12", category: "reasoning", }, [OpenAIModels.O1_PREVIEW]: { id: OpenAIModels.O1_PREVIEW, name: "O1 Preview", provider: AIProviderName.OPENAI, description: "Preview version of O1 reasoning model", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.015, outputCostPer1K: 0.06, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 128000, maxOutputTokens: 32768, maxRequestsPerMinute: 100, }, useCases: { coding: 9, creative: 6, analysis: 9, conversation: 6, reasoning: 9, translation: 5, summarization: 6, }, aliases: ["o1-preview"], deprecated: false, isLocal: false, releaseDate: "2024-09-12", category: "reasoning", }, [OpenAIModels.O1_MINI]: { id: OpenAIModels.O1_MINI, name: "O1 Mini", provider: AIProviderName.OPENAI, description: "Cost-effective O1 variant with strong reasoning capabilities", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.003, outputCostPer1K: 0.012, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 128000, maxOutputTokens: 65536, maxRequestsPerMinute: 200, }, useCases: { coding: 8, creative: 5, analysis: 8, conversation: 6, reasoning: 8, translation: 5, summarization: 6, }, aliases: ["o1-mini", "o1-budget"], deprecated: false, isLocal: false, releaseDate: "2024-09-12", category: "reasoning", }, // OpenAI Legacy Models [OpenAIModels.GPT_4]: { id: OpenAIModels.GPT_4, name: "GPT-4", provider: AIProviderName.OPENAI, description: "Previous generation flagship model (legacy)", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.03, outputCostPer1K: 0.06, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 8192, maxOutputTokens: 4096, maxRequestsPerMinute: 200, }, useCases: { coding: 8, creative: 8, analysis: 8, conversation: 8, reasoning: 8, translation: 8, summarization: 8, }, aliases: ["gpt4", "gpt-4-base"], deprecated: true, isLocal: false, releaseDate: "2023-03-14", category: "general", }, [OpenAIModels.GPT_4_TURBO]: { id: OpenAIModels.GPT_4_TURBO, name: "GPT-4 Turbo", provider: AIProviderName.OPENAI, description: "Faster GPT-4 variant with extended context (legacy)", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.01, outputCostPer1K: 0.03, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 128000, maxOutputTokens: 4096, maxRequestsPerMinute: 500, }, useCases: { coding: 8, creative: 8, analysis: 9, conversation: 8, reasoning: 8, translation: 8, summarization: 8, }, aliases: ["gpt4-turbo", "gpt-4-turbo-preview"], deprecated: true, isLocal: false, releaseDate: "2024-04-09", category: "general", }, [OpenAIModels.GPT_3_5_TURBO]: { id: OpenAIModels.GPT_3_5_TURBO, name: "GPT-3.5 Turbo", provider: AIProviderName.OPENAI, description: "Fast and cost-effective model for simpler tasks (legacy)", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: false, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.0005, outputCostPer1K: 0.0015, currency: "USD", }, performance: { speed: "fast", quality: "medium", accuracy: "medium", }, limits: { maxContextTokens: 16385, maxOutputTokens: 4096, maxRequestsPerMinute: 3500, }, useCases: { coding: 6, creative: 6, analysis: 6, conversation: 7, reasoning: 5, translation: 7, summarization: 7, }, aliases: ["gpt35", "gpt-3.5", "chatgpt"], deprecated: true, isLocal: false, releaseDate: "2023-03-01", category: "general", }, // Google AI Studio Models [GoogleAIModels.GEMINI_2_5_PRO]: { id: GoogleAIModels.GEMINI_2_5_PRO, name: "Gemini 2.5 Pro", provider: AIProviderName.GOOGLE_AI, description: "Google's most capable multimodal model with large context window", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.00125, outputCostPer1K: 0.005, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 2097152, // 2M tokens maxOutputTokens: 8192, maxRequestsPerMinute: 360, }, useCases: { coding: 9, creative: 8, analysis: 10, conversation: 8, reasoning: 9, translation: 9, summarization: 9, }, aliases: ["gemini-pro", "google-flagship", "best-analysis"], deprecated: false, isLocal: false, // Cloud-based model releaseDate: "2024-12-11", category: "reasoning", }, [GoogleAIModels.GEMINI_2_5_FLASH]: { id: GoogleAIModels.GEMINI_2_5_FLASH, name: "Gemini 2.5 Flash", provider: AIProviderName.GOOGLE_AI, description: "Fast and efficient multimodal model with large context", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.000075, outputCostPer1K: 0.0003, currency: "USD", }, performance: { speed: "fast", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 1048576, // 1M tokens maxOutputTokens: 8192, maxRequestsPerMinute: 1000, }, useCases: { coding: 8, creative: 7, analysis: 9, conversation: 8, reasoning: 8, translation: 8, summarization: 9, }, aliases: ["gemini-flash", "google-fast", "best-value"], deprecated: false, isLocal: false, // Cloud-based model releaseDate: "2024-12-11", category: "general", }, // Anthropic Models [AnthropicModels.CLAUDE_OPUS_4_5]: { id: AnthropicModels.CLAUDE_OPUS_4_5, name: "Claude Opus 4.5", provider: AIProviderName.ANTHROPIC, description: "Anthropic's most capable model with exceptional reasoning, coding, and multimodal capabilities", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: false, }, pricing: { inputCostPer1K: 0.015, outputCostPer1K: 0.075, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 64000, maxRequestsPerMinute: 50, }, useCases: { coding: 10, creative: 10, analysis: 10, conversation: 9, reasoning: 10, translation: 9, summarization: 9, }, aliases: [ "claude-4.5-opus", "claude-opus-latest", "opus-4.5", "anthropic-flagship", ], deprecated: false, isLocal: false, releaseDate: "2025-11-24", category: "reasoning", }, [AnthropicModels.CLAUDE_SONNET_4_5]: { id: AnthropicModels.CLAUDE_SONNET_4_5, name: "Claude Sonnet 4.5", provider: AIProviderName.ANTHROPIC, description: "Balanced Claude model with excellent performance across all tasks including vision and reasoning", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: false, }, pricing: { inputCostPer1K: 0.003, outputCostPer1K: 0.015, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 64000, maxRequestsPerMinute: 100, }, useCases: { coding: 10, creative: 9, analysis: 9, conversation: 9, reasoning: 10, translation: 8, summarization: 8, }, aliases: ["claude-4.5-sonnet", "claude-sonnet-latest", "sonnet-4.5"], deprecated: false, isLocal: false, releaseDate: "2025-09-29", category: "coding", }, [AnthropicModels.CLAUDE_4_5_HAIKU]: { id: AnthropicModels.CLAUDE_4_5_HAIKU, name: "Claude 4.5 Haiku", provider: AIProviderName.ANTHROPIC, description: "Latest fast and efficient Claude model with vision support", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: false, }, pricing: { inputCostPer1K: 0.001, outputCostPer1K: 0.005, currency: "USD", }, performance: { speed: "fast", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 64000, maxRequestsPerMinute: 100, }, useCases: { coding: 8, creative: 8, analysis: 8, conversation: 9, reasoning: 8, translation: 8, summarization: 9, }, aliases: ["claude-4.5-haiku", "claude-haiku-latest", "haiku-4.5"], deprecated: false, isLocal: false, releaseDate: "2025-10-15", category: "general", }, [AnthropicModels.CLAUDE_3_5_SONNET]: { id: AnthropicModels.CLAUDE_3_5_SONNET, name: "Claude 3.5 Sonnet", provider: AIProviderName.ANTHROPIC, description: "Anthropic's most capable model with excellent reasoning and coding", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: false, }, pricing: { inputCostPer1K: 0.003, outputCostPer1K: 0.015, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 8192, maxRequestsPerMinute: 50, }, useCases: { coding: 10, creative: 9, analysis: 9, conversation: 9, reasoning: 10, translation: 8, summarization: 8, }, aliases: [ "claude-3.5-sonnet", "claude-sonnet", "best-coding", "claude-latest", ], deprecated: false, isLocal: false, // Cloud-based model releaseDate: "2024-10-22", category: "coding", }, [AnthropicModels.CLAUDE_3_5_HAIKU]: { id: AnthropicModels.CLAUDE_3_5_HAIKU, name: "Claude 3.5 Haiku", provider: AIProviderName.ANTHROPIC, description: "Fast and efficient Claude model for quick tasks", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: false, }, pricing: { inputCostPer1K: 0.001, outputCostPer1K: 0.005, currency: "USD", }, performance: { speed: "fast", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 200000, maxOutputTokens: 8192, maxRequestsPerMinute: 100, }, useCases: { coding: 8, creative: 7, analysis: 8, conversation: 8, reasoning: 8, translation: 8, summarization: 9, }, aliases: ["claude-3.5-haiku", "claude-haiku", "claude-fast"], deprecated: false, isLocal: false, // Cloud-based model releaseDate: "2024-10-22", category: "general", }, // Mistral Models [MistralModels.MISTRAL_LARGE_LATEST]: { id: MistralModels.MISTRAL_LARGE_LATEST, name: "Mistral Large", provider: AIProviderName.MISTRAL, description: "Mistral's flagship model with excellent reasoning and multilingual capabilities", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.002, outputCostPer1K: 0.006, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 131072, maxOutputTokens: 8192, maxRequestsPerMinute: 100, }, useCases: { coding: 9, creative: 8, analysis: 9, conversation: 8, reasoning: 9, translation: 9, summarization: 8, }, aliases: ["mistral-large", "mistral-flagship"], deprecated: false, isLocal: false, releaseDate: "2025-12-01", category: "reasoning", }, [MistralModels.MISTRAL_SMALL_LATEST]: { id: MistralModels.MISTRAL_SMALL_LATEST, name: "Mistral Small", provider: AIProviderName.MISTRAL, description: "Efficient model for simple tasks and cost-sensitive applications", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.001, outputCostPer1K: 0.003, currency: "USD", }, performance: { speed: "fast", quality: "medium", accuracy: "medium", }, limits: { maxContextTokens: 32768, maxOutputTokens: 8192, maxRequestsPerMinute: 200, }, useCases: { coding: 6, creative: 6, analysis: 7, conversation: 7, reasoning: 6, translation: 7, summarization: 7, }, aliases: ["mistral-small", "mistral-cheap"], deprecated: false, isLocal: false, releaseDate: "2024-02-26", category: "general", }, [MistralModels.CODESTRAL_LATEST]: { id: MistralModels.CODESTRAL_LATEST, name: "Codestral", provider: AIProviderName.MISTRAL, description: "Specialized code generation model trained on 80+ programming languages", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.001, outputCostPer1K: 0.003, currency: "USD", }, performance: { speed: "fast", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 32768, maxOutputTokens: 8192, maxRequestsPerMinute: 200, }, useCases: { coding: 10, creative: 5, analysis: 7, conversation: 5, reasoning: 8, translation: 5, summarization: 6, }, aliases: ["codestral", "mistral-code"], deprecated: false, isLocal: false, releaseDate: "2024-05-29", category: "coding", }, [MistralModels.PIXTRAL_LARGE]: { id: MistralModels.PIXTRAL_LARGE, name: "Pixtral Large", provider: AIProviderName.MISTRAL, description: "Multimodal vision-language model for image understanding", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.002, outputCostPer1K: 0.006, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 131072, maxOutputTokens: 8192, maxRequestsPerMinute: 100, }, useCases: { coding: 8, creative: 8, analysis: 9, conversation: 7, reasoning: 8, translation: 7, summarization: 8, }, aliases: ["pixtral", "mistral-vision"], deprecated: false, isLocal: false, releaseDate: "2024-09-01", category: "vision", }, // Ollama Models (local) [OllamaModels.LLAMA4_LATEST]: { id: OllamaModels.LLAMA4_LATEST, name: "Llama 4", provider: AIProviderName.OLLAMA, description: "Latest Llama 4 with multimodal vision and tool capabilities, runs locally", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0, outputCostPer1K: 0, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 131072, maxOutputTokens: 8192, }, useCases: { coding: 9, creative: 8, analysis: 9, conversation: 8, reasoning: 9, translation: 8, summarization: 8, }, aliases: ["llama4", "llama4-local"], deprecated: false, isLocal: true, releaseDate: "2025-04-01", category: "reasoning", }, [OllamaModels.LLAMA3_3_LATEST]: { id: OllamaModels.LLAMA3_3_LATEST, name: "Llama 3.3", provider: AIProviderName.OLLAMA, description: "High-performance Llama 3.3 for local inference", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0, outputCostPer1K: 0, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 131072, maxOutputTokens: 8192, }, useCases: { coding: 8, creative: 8, analysis: 8, conversation: 8, reasoning: 8, translation: 8, summarization: 8, }, aliases: ["llama3.3", "llama3.3-local"], deprecated: false, isLocal: true, releaseDate: "2024-12-01", category: "general", }, [OllamaModels.LLAMA3_2_LATEST]: { id: OllamaModels.LLAMA3_2_LATEST, name: "Llama 3.2 Latest", provider: AIProviderName.OLLAMA, description: "Local Llama model for private, offline AI generation", capabilities: { vision: false, functionCalling: false, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: false, }, pricing: { inputCostPer1K: 0, outputCostPer1K: 0, currency: "USD", }, performance: { speed: "fast", quality: "medium", accuracy: "medium", }, limits: { maxContextTokens: 131072, maxOutputTokens: 8192, }, useCases: { coding: 6, creative: 7, analysis: 6, conversation: 7, reasoning: 6, translation: 6, summarization: 6, }, aliases: ["llama3.2", "llama", "local", "offline"], deprecated: false, isLocal: true, releaseDate: "2024-09-25", category: "general", }, [OllamaModels.DEEPSEEK_R1_70B]: { id: OllamaModels.DEEPSEEK_R1_70B, name: "DeepSeek-R1 70B", provider: AIProviderName.OLLAMA, description: "State-of-the-art reasoning model rivaling OpenAI O1, runs locally", capabilities: { vision: false, functionCalling: false, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: false, }, pricing: { inputCostPer1K: 0, outputCostPer1K: 0, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 65536, maxOutputTokens: 8192, }, useCases: { coding: 10, creative: 7, analysis: 10, conversation: 6, reasoning: 10, translation: 7, summarization: 7, }, aliases: ["deepseek-r1", "deepseek-reasoning", "local-reasoning"], deprecated: false, isLocal: true, releaseDate: "2025-01-20", category: "reasoning", }, [OllamaModels.QWEN3_72B]: { id: OllamaModels.QWEN3_72B, name: "Qwen 3 72B", provider: AIProviderName.OLLAMA, description: "Advanced reasoning and multilingual model from Alibaba", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0, outputCostPer1K: 0, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 131072, maxOutputTokens: 8192, }, useCases: { coding: 9, creative: 8, analysis: 9, conversation: 8, reasoning: 9, translation: 9, summarization: 8, }, aliases: ["qwen3", "qwen3-72b-local"], deprecated: false, isLocal: true, releaseDate: "2025-04-01", category: "reasoning", }, [OllamaModels.MISTRAL_LARGE_LATEST]: { id: OllamaModels.MISTRAL_LARGE_LATEST, name: "Mistral Large (Local)", provider: AIProviderName.OLLAMA, description: "Mistral Large model for local inference", capabilities: { vision: false, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: false, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0, outputCostPer1K: 0, currency: "USD", }, performance: { speed: "slow", quality: "high", accuracy: "high", }, limits: { maxContextTokens: 131072, maxOutputTokens: 8192, }, useCases: { coding: 8, creative: 8, analysis: 8, conversation: 8, reasoning: 8, translation: 9, summarization: 8, }, aliases: ["mistral-large-local"], deprecated: false, isLocal: true, releaseDate: "2024-02-26", category: "general", }, // Bedrock Models [BedrockModels.NOVA_PREMIER]: { id: BedrockModels.NOVA_PREMIER, name: "Amazon Nova Premier", provider: AIProviderName.BEDROCK, description: "Amazon's most capable foundation model with advanced multimodal capabilities", capabilities: { vision: true, functionCalling: true, codeGeneration: true, reasoning: true, multimodal: true, streaming: true, jsonMode: true, }, pricing: { inputCostPer1K: 0.0025, outputCostPer1K: 0.0125, currency: "USD", }, performance: { speed: "medium", quality: "high", accuracy: "high", }, limits: {