@juspay/neurolink
Version:
Universal AI Development Platform with working MCP integration, multi-provider support, voice (TTS/STT/realtime), and professional CLI. 58+ external MCP servers discoverable, multimodal file processing, RAG pipelines. Build, test, and deploy AI applications.
1,725 lines (1,724 loc) • 69.8 kB
JavaScript
/**
* Model Registry for NeuroLink CLI Commands
* Provides centralized model data for the models command system.
* Part of Phase 4.1 - Models Command System
*/
import { DEFAULT_MODEL_ALIASES } from "../types/index.js";
import { AIProviderName, OpenAIModels, AzureOpenAIModels, GoogleAIModels, AnthropicModels, BedrockModels, MistralModels, OllamaModels, } from "../constants/enums.js";
/**
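* Comprehensive model registry, keyed by model ID.
* Each entry carries the model's display name, provider, description,
* capability flags, pricing, performance ratings, limits, use-case scores,
* aliases, deprecation and local/cloud flags, release date, and category.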
*/
export const MODEL_REGISTRY = {
// OpenAI Models
[OpenAIModels.GPT_4O]: {
id: OpenAIModels.GPT_4O,
name: "GPT-4 Omni",
provider: AIProviderName.OPENAI,
description: "Most capable OpenAI model with vision and advanced reasoning",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.005,
outputCostPer1K: 0.015,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 128000,
maxOutputTokens: 4096,
maxRequestsPerMinute: 500,
},
useCases: {
coding: 9,
creative: 8,
analysis: 9,
conversation: 9,
reasoning: 9,
translation: 8,
summarization: 8,
},
aliases: ["gpt4o", "gpt-4-omni", "openai-flagship"],
deprecated: false,
isLocal: false, // Cloud-based model
releaseDate: "2024-05-13",
category: "general",
},
[OpenAIModels.GPT_4O_MINI]: {
id: OpenAIModels.GPT_4O_MINI,
name: "GPT-4 Omni Mini",
provider: AIProviderName.OPENAI,
description: "Fast and cost-effective model with strong performance",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.00015,
outputCostPer1K: 0.0006,
currency: "USD",
},
performance: {
speed: "fast",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 128000,
maxOutputTokens: 16384,
maxRequestsPerMinute: 1000,
},
useCases: {
coding: 8,
creative: 7,
analysis: 8,
conversation: 8,
reasoning: 8,
translation: 8,
summarization: 9,
},
aliases: ["gpt4o-mini", "gpt-4-mini", "fastest", "cheap"],
deprecated: false,
isLocal: false, // Cloud-based model
releaseDate: "2024-07-18",
category: "general",
},
// OpenAI GPT-5 Series
[OpenAIModels.GPT_5]: {
id: OpenAIModels.GPT_5,
name: "GPT-5",
provider: AIProviderName.OPENAI,
description: "OpenAI's most advanced model with breakthrough reasoning and multimodal capabilities",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.01,
outputCostPer1K: 0.03,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 256000,
maxOutputTokens: 32768,
maxRequestsPerMinute: 200,
},
useCases: {
coding: 10,
creative: 10,
analysis: 10,
conversation: 10,
reasoning: 10,
translation: 9,
summarization: 9,
},
aliases: ["gpt5", "gpt-5-flagship", "openai-latest"],
deprecated: false,
isLocal: false,
releaseDate: "2025-08-07",
category: "reasoning",
},
[OpenAIModels.GPT_5_MINI]: {
id: OpenAIModels.GPT_5_MINI,
name: "GPT-5 Mini",
provider: AIProviderName.OPENAI,
description: "Fast and efficient GPT-5 variant for everyday tasks",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.002,
outputCostPer1K: 0.006,
currency: "USD",
},
performance: {
speed: "fast",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 128000,
maxOutputTokens: 16384,
maxRequestsPerMinute: 500,
},
useCases: {
coding: 8,
creative: 8,
analysis: 8,
conversation: 9,
reasoning: 8,
translation: 8,
summarization: 9,
},
aliases: ["gpt5-mini", "gpt-5-fast"],
deprecated: false,
isLocal: false,
releaseDate: "2025-08-07",
category: "general",
},
// OpenAI O-Series Reasoning Models
[OpenAIModels.O3]: {
id: OpenAIModels.O3,
name: "O3",
provider: AIProviderName.OPENAI,
description: "Advanced reasoning model with extended thinking capabilities for complex tasks",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.015,
outputCostPer1K: 0.06,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 100000,
maxRequestsPerMinute: 100,
},
useCases: {
coding: 10,
creative: 8,
analysis: 10,
conversation: 7,
reasoning: 10,
translation: 7,
summarization: 8,
},
aliases: ["o3-reasoning", "o3-thinking"],
deprecated: false,
isLocal: false,
releaseDate: "2025-01-31",
category: "reasoning",
},
[OpenAIModels.O3_MINI]: {
id: OpenAIModels.O3_MINI,
name: "O3 Mini",
provider: AIProviderName.OPENAI,
description: "Cost-effective reasoning model with strong logical capabilities",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.003,
outputCostPer1K: 0.012,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 65536,
maxRequestsPerMinute: 200,
},
useCases: {
coding: 9,
creative: 6,
analysis: 9,
conversation: 7,
reasoning: 9,
translation: 6,
summarization: 7,
},
aliases: ["o3-mini-reasoning"],
deprecated: false,
isLocal: false,
releaseDate: "2025-01-31",
category: "reasoning",
},
[OpenAIModels.GPT_5_NANO]: {
id: OpenAIModels.GPT_5_NANO,
name: "GPT-5 Nano",
provider: AIProviderName.OPENAI,
description: "Fastest and most cost-effective GPT-5 variant for simple tasks",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.00005,
outputCostPer1K: 0.0004,
currency: "USD",
},
performance: {
speed: "fast",
quality: "medium",
accuracy: "medium",
},
limits: {
maxContextTokens: 272000,
maxOutputTokens: 128000,
maxRequestsPerMinute: 2000,
},
useCases: {
coding: 6,
creative: 6,
analysis: 6,
conversation: 8,
reasoning: 6,
translation: 7,
summarization: 8,
},
aliases: ["gpt5-nano", "gpt-5-cheapest"],
deprecated: false,
isLocal: false,
releaseDate: "2025-08-07",
category: "general",
},
// OpenAI GPT-5.2 Series (Released December 11, 2025) - Latest flagship models
[OpenAIModels.GPT_5_2]: {
id: OpenAIModels.GPT_5_2,
name: "GPT-5.2 Thinking",
provider: AIProviderName.OPENAI,
description: "OpenAI's latest flagship model with deep reasoning capabilities, 100% on AIME 2025, 80% SWE-bench Verified",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.00175,
outputCostPer1K: 0.014,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 256000,
maxOutputTokens: 64000,
maxRequestsPerMinute: 150,
},
useCases: {
coding: 10,
creative: 10,
analysis: 10,
conversation: 9,
reasoning: 10,
translation: 9,
summarization: 9,
},
aliases: ["gpt52", "gpt-5.2-thinking", "openai-latest-reasoning"],
deprecated: false,
isLocal: false,
releaseDate: "2025-12-11",
category: "reasoning",
},
[OpenAIModels.GPT_5_2_CHAT_LATEST]: {
id: OpenAIModels.GPT_5_2_CHAT_LATEST,
name: "GPT-5.2 Instant",
provider: AIProviderName.OPENAI,
description: "Fast everyday model for quick tasks with excellent performance across all domains",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.00175,
outputCostPer1K: 0.014,
currency: "USD",
},
performance: {
speed: "fast",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 256000,
maxOutputTokens: 32000,
maxRequestsPerMinute: 300,
},
useCases: {
coding: 9,
creative: 9,
analysis: 9,
conversation: 10,
reasoning: 9,
translation: 9,
summarization: 9,
},
aliases: ["gpt52-chat", "gpt-5.2-instant", "gpt52-fast"],
deprecated: false,
isLocal: false,
releaseDate: "2025-12-11",
category: "general",
},
[OpenAIModels.GPT_5_2_PRO]: {
id: OpenAIModels.GPT_5_2_PRO,
name: "GPT-5.2 Pro",
provider: AIProviderName.OPENAI,
description: "Highest quality model for science, math, and complex problem-solving with 92.4% GPQA Diamond performance",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.021,
outputCostPer1K: 0.168,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 256000,
maxOutputTokens: 128000,
maxRequestsPerMinute: 50,
},
useCases: {
coding: 10,
creative: 9,
analysis: 10,
conversation: 8,
reasoning: 10,
translation: 9,
summarization: 9,
},
aliases: ["gpt52-pro", "gpt-5.2-professional", "openai-science"],
deprecated: false,
isLocal: false,
releaseDate: "2025-12-11",
category: "reasoning",
},
// OpenAI GPT-4.1 Series (1M context window)
[OpenAIModels.GPT_4_1]: {
id: OpenAIModels.GPT_4_1,
name: "GPT-4.1",
provider: AIProviderName.OPENAI,
description: "Advanced coding model with 1 million token context window",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.002,
outputCostPer1K: 0.008,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 1000000,
maxOutputTokens: 128000,
maxRequestsPerMinute: 200,
},
useCases: {
coding: 10,
creative: 8,
analysis: 9,
conversation: 8,
reasoning: 9,
translation: 8,
summarization: 9,
},
aliases: ["gpt-4.1", "gpt41", "million-context"],
deprecated: false,
isLocal: false,
releaseDate: "2025-04-14",
category: "coding",
},
[OpenAIModels.GPT_4_1_MINI]: {
id: OpenAIModels.GPT_4_1_MINI,
name: "GPT-4.1 Mini",
provider: AIProviderName.OPENAI,
description: "Fast GPT-4.1 variant with 1M context for efficient coding",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.0004,
outputCostPer1K: 0.0016,
currency: "USD",
},
performance: {
speed: "fast",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 1000000,
maxOutputTokens: 128000,
maxRequestsPerMinute: 500,
},
useCases: {
coding: 9,
creative: 7,
analysis: 8,
conversation: 8,
reasoning: 8,
translation: 8,
summarization: 9,
},
aliases: ["gpt-4.1-mini", "gpt41-mini"],
deprecated: false,
isLocal: false,
releaseDate: "2025-04-14",
category: "coding",
},
[OpenAIModels.GPT_4_1_NANO]: {
id: OpenAIModels.GPT_4_1_NANO,
name: "GPT-4.1 Nano",
provider: AIProviderName.OPENAI,
description: "Most cost-effective GPT-4.1 variant with 1M context",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.0001,
outputCostPer1K: 0.0004,
currency: "USD",
},
performance: {
speed: "fast",
quality: "medium",
accuracy: "medium",
},
limits: {
maxContextTokens: 1000000,
maxOutputTokens: 128000,
maxRequestsPerMinute: 1000,
},
useCases: {
coding: 7,
creative: 6,
analysis: 7,
conversation: 7,
reasoning: 7,
translation: 7,
summarization: 8,
},
aliases: ["gpt-4.1-nano", "gpt41-nano"],
deprecated: false,
isLocal: false,
releaseDate: "2025-04-14",
category: "coding",
},
// OpenAI O-Series Additional Models
[OpenAIModels.O3_PRO]: {
id: OpenAIModels.O3_PRO,
name: "O3 Pro",
provider: AIProviderName.OPENAI,
description: "Most powerful reasoning model for complex scientific and coding tasks",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.03,
outputCostPer1K: 0.12,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 100000,
maxRequestsPerMinute: 50,
},
useCases: {
coding: 10,
creative: 7,
analysis: 10,
conversation: 6,
reasoning: 10,
translation: 6,
summarization: 7,
},
aliases: ["o3-pro", "o3-professional"],
deprecated: false,
isLocal: false,
releaseDate: "2025-04-16",
category: "reasoning",
},
[OpenAIModels.O4_MINI]: {
id: OpenAIModels.O4_MINI,
name: "O4 Mini",
provider: AIProviderName.OPENAI,
description: "Fast reasoning model optimized for math, coding, and visual tasks",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.003,
outputCostPer1K: 0.012,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 100000,
maxRequestsPerMinute: 200,
},
useCases: {
coding: 9,
creative: 6,
analysis: 9,
conversation: 7,
reasoning: 10,
translation: 6,
summarization: 7,
},
aliases: ["o4-mini", "o4-fast"],
deprecated: false,
isLocal: false,
releaseDate: "2025-04-16",
category: "reasoning",
},
[OpenAIModels.O1]: {
id: OpenAIModels.O1,
name: "O1",
provider: AIProviderName.OPENAI,
description: "Premium reasoning model with highest capability for mission-critical tasks",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.15,
outputCostPer1K: 0.6,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 128000,
maxOutputTokens: 32768,
maxRequestsPerMinute: 50,
},
useCases: {
coding: 10,
creative: 7,
analysis: 10,
conversation: 6,
reasoning: 10,
translation: 6,
summarization: 7,
},
aliases: ["o1-full", "o1-premium"],
deprecated: false,
isLocal: false,
releaseDate: "2024-09-12",
category: "reasoning",
},
[OpenAIModels.O1_PREVIEW]: {
id: OpenAIModels.O1_PREVIEW,
name: "O1 Preview",
provider: AIProviderName.OPENAI,
description: "Preview version of O1 reasoning model",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.015,
outputCostPer1K: 0.06,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 128000,
maxOutputTokens: 32768,
maxRequestsPerMinute: 100,
},
useCases: {
coding: 9,
creative: 6,
analysis: 9,
conversation: 6,
reasoning: 9,
translation: 5,
summarization: 6,
},
aliases: ["o1-preview"],
deprecated: false,
isLocal: false,
releaseDate: "2024-09-12",
category: "reasoning",
},
[OpenAIModels.O1_MINI]: {
id: OpenAIModels.O1_MINI,
name: "O1 Mini",
provider: AIProviderName.OPENAI,
description: "Cost-effective O1 variant with strong reasoning capabilities",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.003,
outputCostPer1K: 0.012,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 128000,
maxOutputTokens: 65536,
maxRequestsPerMinute: 200,
},
useCases: {
coding: 8,
creative: 5,
analysis: 8,
conversation: 6,
reasoning: 8,
translation: 5,
summarization: 6,
},
aliases: ["o1-mini", "o1-budget"],
deprecated: false,
isLocal: false,
releaseDate: "2024-09-12",
category: "reasoning",
},
// OpenAI Legacy Models
[OpenAIModels.GPT_4]: {
id: OpenAIModels.GPT_4,
name: "GPT-4",
provider: AIProviderName.OPENAI,
description: "Previous generation flagship model (legacy)",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.03,
outputCostPer1K: 0.06,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 8192,
maxOutputTokens: 4096,
maxRequestsPerMinute: 200,
},
useCases: {
coding: 8,
creative: 8,
analysis: 8,
conversation: 8,
reasoning: 8,
translation: 8,
summarization: 8,
},
aliases: ["gpt4", "gpt-4-base"],
deprecated: true,
isLocal: false,
releaseDate: "2023-03-14",
category: "general",
},
[OpenAIModels.GPT_4_TURBO]: {
id: OpenAIModels.GPT_4_TURBO,
name: "GPT-4 Turbo",
provider: AIProviderName.OPENAI,
description: "Faster GPT-4 variant with extended context (legacy)",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.01,
outputCostPer1K: 0.03,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 128000,
maxOutputTokens: 4096,
maxRequestsPerMinute: 500,
},
useCases: {
coding: 8,
creative: 8,
analysis: 9,
conversation: 8,
reasoning: 8,
translation: 8,
summarization: 8,
},
aliases: ["gpt4-turbo", "gpt-4-turbo-preview"],
deprecated: true,
isLocal: false,
releaseDate: "2024-04-09",
category: "general",
},
[OpenAIModels.GPT_3_5_TURBO]: {
id: OpenAIModels.GPT_3_5_TURBO,
name: "GPT-3.5 Turbo",
provider: AIProviderName.OPENAI,
description: "Fast and cost-effective model for simpler tasks (legacy)",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: false,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.0005,
outputCostPer1K: 0.0015,
currency: "USD",
},
performance: {
speed: "fast",
quality: "medium",
accuracy: "medium",
},
limits: {
maxContextTokens: 16385,
maxOutputTokens: 4096,
maxRequestsPerMinute: 3500,
},
useCases: {
coding: 6,
creative: 6,
analysis: 6,
conversation: 7,
reasoning: 5,
translation: 7,
summarization: 7,
},
aliases: ["gpt35", "gpt-3.5", "chatgpt"],
deprecated: true,
isLocal: false,
releaseDate: "2023-03-01",
category: "general",
},
// Google AI Studio Models
[GoogleAIModels.GEMINI_2_5_PRO]: {
id: GoogleAIModels.GEMINI_2_5_PRO,
name: "Gemini 2.5 Pro",
provider: AIProviderName.GOOGLE_AI,
description: "Google's most capable multimodal model with large context window",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.00125,
outputCostPer1K: 0.005,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 2097152, // 2M tokens
maxOutputTokens: 8192,
maxRequestsPerMinute: 360,
},
useCases: {
coding: 9,
creative: 8,
analysis: 10,
conversation: 8,
reasoning: 9,
translation: 9,
summarization: 9,
},
aliases: ["gemini-pro", "google-flagship", "best-analysis"],
deprecated: false,
isLocal: false, // Cloud-based model
releaseDate: "2024-12-11",
category: "reasoning",
},
[GoogleAIModels.GEMINI_2_5_FLASH]: {
id: GoogleAIModels.GEMINI_2_5_FLASH,
name: "Gemini 2.5 Flash",
provider: AIProviderName.GOOGLE_AI,
description: "Fast and efficient multimodal model with large context",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.000075,
outputCostPer1K: 0.0003,
currency: "USD",
},
performance: {
speed: "fast",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 1048576, // 1M tokens
maxOutputTokens: 8192,
maxRequestsPerMinute: 1000,
},
useCases: {
coding: 8,
creative: 7,
analysis: 9,
conversation: 8,
reasoning: 8,
translation: 8,
summarization: 9,
},
aliases: ["gemini-flash", "google-fast", "best-value"],
deprecated: false,
isLocal: false, // Cloud-based model
releaseDate: "2024-12-11",
category: "general",
},
// Anthropic Models
[AnthropicModels.CLAUDE_OPUS_4_5]: {
id: AnthropicModels.CLAUDE_OPUS_4_5,
name: "Claude Opus 4.5",
provider: AIProviderName.ANTHROPIC,
description: "Anthropic's most capable model with exceptional reasoning, coding, and multimodal capabilities",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: false,
},
pricing: {
inputCostPer1K: 0.015,
outputCostPer1K: 0.075,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 64000,
maxRequestsPerMinute: 50,
},
useCases: {
coding: 10,
creative: 10,
analysis: 10,
conversation: 9,
reasoning: 10,
translation: 9,
summarization: 9,
},
aliases: [
"claude-4.5-opus",
"claude-opus-latest",
"opus-4.5",
"anthropic-flagship",
],
deprecated: false,
isLocal: false,
releaseDate: "2025-11-24",
category: "reasoning",
},
[AnthropicModels.CLAUDE_SONNET_4_5]: {
id: AnthropicModels.CLAUDE_SONNET_4_5,
name: "Claude Sonnet 4.5",
provider: AIProviderName.ANTHROPIC,
description: "Balanced Claude model with excellent performance across all tasks including vision and reasoning",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: false,
},
pricing: {
inputCostPer1K: 0.003,
outputCostPer1K: 0.015,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 64000,
maxRequestsPerMinute: 100,
},
useCases: {
coding: 10,
creative: 9,
analysis: 9,
conversation: 9,
reasoning: 10,
translation: 8,
summarization: 8,
},
aliases: ["claude-4.5-sonnet", "claude-sonnet-latest", "sonnet-4.5"],
deprecated: false,
isLocal: false,
releaseDate: "2025-09-29",
category: "coding",
},
[AnthropicModels.CLAUDE_4_5_HAIKU]: {
id: AnthropicModels.CLAUDE_4_5_HAIKU,
name: "Claude 4.5 Haiku",
provider: AIProviderName.ANTHROPIC,
description: "Latest fast and efficient Claude model with vision support",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: false,
},
pricing: {
inputCostPer1K: 0.001,
outputCostPer1K: 0.005,
currency: "USD",
},
performance: {
speed: "fast",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 64000,
maxRequestsPerMinute: 100,
},
useCases: {
coding: 8,
creative: 8,
analysis: 8,
conversation: 9,
reasoning: 8,
translation: 8,
summarization: 9,
},
aliases: ["claude-4.5-haiku", "claude-haiku-latest", "haiku-4.5"],
deprecated: false,
isLocal: false,
releaseDate: "2025-10-15",
category: "general",
},
[AnthropicModels.CLAUDE_3_5_SONNET]: {
id: AnthropicModels.CLAUDE_3_5_SONNET,
name: "Claude 3.5 Sonnet",
provider: AIProviderName.ANTHROPIC,
description: "Anthropic's most capable model with excellent reasoning and coding",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: false,
},
pricing: {
inputCostPer1K: 0.003,
outputCostPer1K: 0.015,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 8192,
maxRequestsPerMinute: 50,
},
useCases: {
coding: 10,
creative: 9,
analysis: 9,
conversation: 9,
reasoning: 10,
translation: 8,
summarization: 8,
},
aliases: [
"claude-3.5-sonnet",
"claude-sonnet",
"best-coding",
"claude-latest",
],
deprecated: false,
isLocal: false, // Cloud-based model
releaseDate: "2024-10-22",
category: "coding",
},
[AnthropicModels.CLAUDE_3_5_HAIKU]: {
id: AnthropicModels.CLAUDE_3_5_HAIKU,
name: "Claude 3.5 Haiku",
provider: AIProviderName.ANTHROPIC,
description: "Fast and efficient Claude model for quick tasks",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: false,
},
pricing: {
inputCostPer1K: 0.001,
outputCostPer1K: 0.005,
currency: "USD",
},
performance: {
speed: "fast",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 200000,
maxOutputTokens: 8192,
maxRequestsPerMinute: 100,
},
useCases: {
coding: 8,
creative: 7,
analysis: 8,
conversation: 8,
reasoning: 8,
translation: 8,
summarization: 9,
},
aliases: ["claude-3.5-haiku", "claude-haiku", "claude-fast"],
deprecated: false,
isLocal: false, // Cloud-based model
releaseDate: "2024-10-22",
category: "general",
},
// Mistral Models
[MistralModels.MISTRAL_LARGE_LATEST]: {
id: MistralModels.MISTRAL_LARGE_LATEST,
name: "Mistral Large",
provider: AIProviderName.MISTRAL,
description: "Mistral's flagship model with excellent reasoning and multilingual capabilities",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.002,
outputCostPer1K: 0.006,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 131072,
maxOutputTokens: 8192,
maxRequestsPerMinute: 100,
},
useCases: {
coding: 9,
creative: 8,
analysis: 9,
conversation: 8,
reasoning: 9,
translation: 9,
summarization: 8,
},
aliases: ["mistral-large", "mistral-flagship"],
deprecated: false,
isLocal: false,
releaseDate: "2025-12-01",
category: "reasoning",
},
[MistralModels.MISTRAL_SMALL_LATEST]: {
id: MistralModels.MISTRAL_SMALL_LATEST,
name: "Mistral Small",
provider: AIProviderName.MISTRAL,
description: "Efficient model for simple tasks and cost-sensitive applications",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.001,
outputCostPer1K: 0.003,
currency: "USD",
},
performance: {
speed: "fast",
quality: "medium",
accuracy: "medium",
},
limits: {
maxContextTokens: 32768,
maxOutputTokens: 8192,
maxRequestsPerMinute: 200,
},
useCases: {
coding: 6,
creative: 6,
analysis: 7,
conversation: 7,
reasoning: 6,
translation: 7,
summarization: 7,
},
aliases: ["mistral-small", "mistral-cheap"],
deprecated: false,
isLocal: false,
releaseDate: "2024-02-26",
category: "general",
},
[MistralModels.CODESTRAL_LATEST]: {
id: MistralModels.CODESTRAL_LATEST,
name: "Codestral",
provider: AIProviderName.MISTRAL,
description: "Specialized code generation model trained on 80+ programming languages",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.001,
outputCostPer1K: 0.003,
currency: "USD",
},
performance: {
speed: "fast",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 32768,
maxOutputTokens: 8192,
maxRequestsPerMinute: 200,
},
useCases: {
coding: 10,
creative: 5,
analysis: 7,
conversation: 5,
reasoning: 8,
translation: 5,
summarization: 6,
},
aliases: ["codestral", "mistral-code"],
deprecated: false,
isLocal: false,
releaseDate: "2024-05-29",
category: "coding",
},
[MistralModels.PIXTRAL_LARGE]: {
id: MistralModels.PIXTRAL_LARGE,
name: "Pixtral Large",
provider: AIProviderName.MISTRAL,
description: "Multimodal vision-language model for image understanding",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.002,
outputCostPer1K: 0.006,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 131072,
maxOutputTokens: 8192,
maxRequestsPerMinute: 100,
},
useCases: {
coding: 8,
creative: 8,
analysis: 9,
conversation: 7,
reasoning: 8,
translation: 7,
summarization: 8,
},
aliases: ["pixtral", "mistral-vision"],
deprecated: false,
isLocal: false,
releaseDate: "2024-09-01",
category: "vision",
},
// Ollama Models (local)
[OllamaModels.LLAMA4_LATEST]: {
id: OllamaModels.LLAMA4_LATEST,
name: "Llama 4",
provider: AIProviderName.OLLAMA,
description: "Latest Llama 4 with multimodal vision and tool capabilities, runs locally",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0,
outputCostPer1K: 0,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 131072,
maxOutputTokens: 8192,
},
useCases: {
coding: 9,
creative: 8,
analysis: 9,
conversation: 8,
reasoning: 9,
translation: 8,
summarization: 8,
},
aliases: ["llama4", "llama4-local"],
deprecated: false,
isLocal: true,
releaseDate: "2025-04-01",
category: "reasoning",
},
[OllamaModels.LLAMA3_3_LATEST]: {
id: OllamaModels.LLAMA3_3_LATEST,
name: "Llama 3.3",
provider: AIProviderName.OLLAMA,
description: "High-performance Llama 3.3 for local inference",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0,
outputCostPer1K: 0,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 131072,
maxOutputTokens: 8192,
},
useCases: {
coding: 8,
creative: 8,
analysis: 8,
conversation: 8,
reasoning: 8,
translation: 8,
summarization: 8,
},
aliases: ["llama3.3", "llama3.3-local"],
deprecated: false,
isLocal: true,
releaseDate: "2024-12-01",
category: "general",
},
[OllamaModels.LLAMA3_2_LATEST]: {
id: OllamaModels.LLAMA3_2_LATEST,
name: "Llama 3.2 Latest",
provider: AIProviderName.OLLAMA,
description: "Local Llama model for private, offline AI generation",
capabilities: {
vision: false,
functionCalling: false,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: false,
},
pricing: {
inputCostPer1K: 0,
outputCostPer1K: 0,
currency: "USD",
},
performance: {
speed: "fast",
quality: "medium",
accuracy: "medium",
},
limits: {
maxContextTokens: 131072,
maxOutputTokens: 8192,
},
useCases: {
coding: 6,
creative: 7,
analysis: 6,
conversation: 7,
reasoning: 6,
translation: 6,
summarization: 6,
},
aliases: ["llama3.2", "llama", "local", "offline"],
deprecated: false,
isLocal: true,
releaseDate: "2024-09-25",
category: "general",
},
[OllamaModels.DEEPSEEK_R1_70B]: {
id: OllamaModels.DEEPSEEK_R1_70B,
name: "DeepSeek-R1 70B",
provider: AIProviderName.OLLAMA,
description: "State-of-the-art reasoning model rivaling OpenAI O1, runs locally",
capabilities: {
vision: false,
functionCalling: false,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: false,
},
pricing: {
inputCostPer1K: 0,
outputCostPer1K: 0,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 65536,
maxOutputTokens: 8192,
},
useCases: {
coding: 10,
creative: 7,
analysis: 10,
conversation: 6,
reasoning: 10,
translation: 7,
summarization: 7,
},
aliases: ["deepseek-r1", "deepseek-reasoning", "local-reasoning"],
deprecated: false,
isLocal: true,
releaseDate: "2025-01-20",
category: "reasoning",
},
[OllamaModels.QWEN3_72B]: {
id: OllamaModels.QWEN3_72B,
name: "Qwen 3 72B",
provider: AIProviderName.OLLAMA,
description: "Advanced reasoning and multilingual model from Alibaba",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0,
outputCostPer1K: 0,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 131072,
maxOutputTokens: 8192,
},
useCases: {
coding: 9,
creative: 8,
analysis: 9,
conversation: 8,
reasoning: 9,
translation: 9,
summarization: 8,
},
aliases: ["qwen3", "qwen3-72b-local"],
deprecated: false,
isLocal: true,
releaseDate: "2025-04-01",
category: "reasoning",
},
[OllamaModels.MISTRAL_LARGE_LATEST]: {
id: OllamaModels.MISTRAL_LARGE_LATEST,
name: "Mistral Large (Local)",
provider: AIProviderName.OLLAMA,
description: "Mistral Large model for local inference",
capabilities: {
vision: false,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: false,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0,
outputCostPer1K: 0,
currency: "USD",
},
performance: {
speed: "slow",
quality: "high",
accuracy: "high",
},
limits: {
maxContextTokens: 131072,
maxOutputTokens: 8192,
},
useCases: {
coding: 8,
creative: 8,
analysis: 8,
conversation: 8,
reasoning: 8,
translation: 9,
summarization: 8,
},
aliases: ["mistral-large-local"],
deprecated: false,
isLocal: true,
releaseDate: "2024-02-26",
category: "general",
},
// Bedrock Models
[BedrockModels.NOVA_PREMIER]: {
id: BedrockModels.NOVA_PREMIER,
name: "Amazon Nova Premier",
provider: AIProviderName.BEDROCK,
description: "Amazon's most capable foundation model with advanced multimodal capabilities",
capabilities: {
vision: true,
functionCalling: true,
codeGeneration: true,
reasoning: true,
multimodal: true,
streaming: true,
jsonMode: true,
},
pricing: {
inputCostPer1K: 0.0025,
outputCostPer1K: 0.0125,
currency: "USD",
},
performance: {
speed: "medium",
quality: "high",
accuracy: "high",
},
limits: {