UNPKG

@juspay/neurolink

Version:

Universal AI Development Platform with working MCP integration, multi-provider support, voice (TTS/STT/realtime), and professional CLI. 58+ external MCP servers discoverable, multimodal file processing, RAG pipelines. Build, test, and deploy AI applicatio

github.com/juspay/neurolink

juspay/neurolink

249 lines (248 loc) • 9.22 kB

JavaScript

import { modelConfig } from "./modelConfiguration.js"; const PERFORMANCE_THRESHOLDS = { EXCELLENT_SUCCESS_RATE: 0.95, EXCELLENT_RESPONSE_TIME_MS: 2000, GOOD_SUCCESS_RATE: 0.9, FAIR_SUCCESS_RATE: 0.8, }; const providerMetrics = new Map(); /** * Convert new configuration format to legacy format for backwards compatibility */ function convertToLegacyFormat(config) { return { provider: config.provider, models: Object.keys(config.models || {}), costPerToken: config.defaultCost, requiresApiKey: config.requiredEnvVars, performance: config.performance, }; } /** * Get all provider configurations using the new configuration system * Replaces hardcoded EVALUATION_PROVIDER_CONFIGS with configurable system */ function getEvaluationProviderConfigs() { const configs = {}; const allConfigs = modelConfig.getAllConfigurations(); for (const [provider, config] of allConfigs) { configs[provider] = convertToLegacyFormat(config); } return configs; } /** * Dynamic provider configurations for evaluation * Now uses configurable system instead of hardcoded values */ export const EVALUATION_PROVIDER_CONFIGS = getEvaluationProviderConfigs(); /** * Get provider configuration by name * Now uses the configurable system */ export function getProviderConfig(providerName) { const config = modelConfig.getProviderConfiguration(providerName); return config ? convertToLegacyFormat(config) : null; } /** * Get all available providers with required API keys present * Now uses the configurable system */ export function getAvailableProviders() { return modelConfig .getAvailableProviders() .map((config) => convertToLegacyFormat(config)); } /** * Sort providers by preference (cost, speed, quality) */ export function sortProvidersByPreference(providers, preferCheap = true) { return [...providers].sort((a, b) => { const aPerf = a.performance || { cost: 0, speed: 0, quality: 0 }; const bPerf = b.performance || { cost: 0, speed: 0, quality: 0 }; if (preferCheap) { // Cost > Speed > Quality for cheap preference if ((aPerf.cost || 0) !== (bPerf.cost || 0)) { return (bPerf.cost || 0) - (aPerf.cost || 0); } if ((aPerf.speed || 0) !== (bPerf.speed || 0)) { return (bPerf.speed || 0) - (aPerf.speed || 0); } return (bPerf.quality || 0) - (aPerf.quality || 0); } else { // Quality > Speed > Cost for quality preference if ((aPerf.quality || 0) !== (bPerf.quality || 0)) { return (bPerf.quality || 0) - (aPerf.quality || 0); } if ((aPerf.speed || 0) !== (bPerf.speed || 0)) { return (bPerf.speed || 0) - (aPerf.speed || 0); } return (bPerf.cost || 0) - (aPerf.cost || 0); } }); } /** * Estimate cost for a specific provider and token usage * Now uses the configurable system */ export function estimateProviderCost(providerName, input, output) { const costInfo = modelConfig.getCostInfo(providerName); if (!costInfo) { return 0; } return input * costInfo.input + output * costInfo.output; } /** * Check if a provider is available (has required API keys) * Now uses the configurable system */ export function isProviderAvailable(providerName) { return modelConfig.isProviderAvailable(providerName); } /** * Get the best available provider based on preference */ export function getBestAvailableProvider(preferCheap = true) { const availableProviders = getAvailableProviders(); if (availableProviders.length === 0) { return null; } const sortedProviders = sortProvidersByPreference(availableProviders, preferCheap); return sortedProviders[0]; } /** Record actual provider performance for optimization */ export function recordProviderPerformanceFromMetrics(providerName, metrics) { const existing = providerMetrics.get(providerName) || { responseTime: [], successRate: 0, tokenThroughput: 0, costEfficiency: 0, lastUpdated: new Date(), sampleCount: 0, }; // Keep rolling window of last 50 response times existing.responseTime.push(metrics.responseTime); if (existing.responseTime.length > 50) { existing.responseTime.shift(); } // Update success rate const totalSamples = existing.sampleCount + 1; existing.successRate = (existing.successRate * existing.sampleCount + (metrics.success ? 1 : 0)) / totalSamples; // Update throughput (tokens per second) if (metrics.responseTime > 0) { const tokensPerSecond = metrics.tokensGenerated / (metrics.responseTime / 1000); existing.tokenThroughput = (existing.tokenThroughput * existing.sampleCount + tokensPerSecond) / totalSamples; } // If responseTime is 0, skip updating tokenThroughput for this sample // but still update other metrics // Update cost efficiency (tokens per dollar) if (metrics.cost > 0) { const tokensPerDollar = metrics.tokensGenerated / metrics.cost; existing.costEfficiency = (existing.costEfficiency * existing.sampleCount + tokensPerDollar) / totalSamples; } existing.sampleCount = totalSamples; existing.lastUpdated = new Date(); providerMetrics.set(providerName, existing); } /** * Get performance-optimized provider based on real metrics */ export function getPerformanceOptimizedProvider(priority = "speed") { const availableProviders = getAvailableProviders(); if (availableProviders.length === 0) { return null; } // Score providers based on real performance data. // Only consider providers that have runtime metrics (sampleCount >= 3). // Providers without metrics are excluded to avoid misleading recommendations // (e.g. ollama appearing as "recommended" when it has no requiredEnvVars and // thus always passes the "available" check, even when not actually in use). const scoredProviders = []; for (const provider of availableProviders) { const metrics = providerMetrics.get(provider.provider); if (!metrics || metrics.sampleCount < 3) { // Skip providers without sufficient runtime data continue; } let score = 0; switch (priority) { case "speed": { const avgResponseTime = metrics.responseTime.reduce((a, b) => a + b, 0) / metrics.responseTime.length; score = metrics.tokenThroughput * 0.6 + (5000 / Math.max(avgResponseTime, 100)) * 0.4; break; } case "cost": { score = metrics.costEfficiency * 0.7 + metrics.successRate * 0.3; break; } case "reliability": { score = metrics.successRate * 0.8 + (metrics.sampleCount / 100) * 0.2; break; } } scoredProviders.push({ provider, score }); } if (scoredProviders.length === 0) { // No providers have sufficient runtime data to make a recommendation return null; } // Sort by score and return best scoredProviders.sort((a, b) => b.score - a.score); return scoredProviders[0].provider; } export function getProviderPerformanceAnalytics() { const analytics = {}; for (const [providerName, metrics] of providerMetrics.entries()) { if (metrics.sampleCount === 0) { continue; } const avgResponseTime = metrics.responseTime.reduce((a, b) => a + b, 0) / metrics.responseTime.length; let recommendation; if (metrics.successRate > PERFORMANCE_THRESHOLDS.EXCELLENT_SUCCESS_RATE && avgResponseTime < PERFORMANCE_THRESHOLDS.EXCELLENT_RESPONSE_TIME_MS) { recommendation = "Excellent - Recommended for production"; } else if (metrics.successRate > PERFORMANCE_THRESHOLDS.GOOD_SUCCESS_RATE) { recommendation = "Good - Suitable for most tasks"; } else if (metrics.successRate > PERFORMANCE_THRESHOLDS.FAIR_SUCCESS_RATE) { recommendation = "Fair - Monitor closely"; } else { recommendation = "Poor - Consider alternative providers"; } analytics[providerName] = { avgResponseTime, successRate: metrics.successRate, tokenThroughput: metrics.tokenThroughput, costEfficiency: metrics.costEfficiency, recommendation, sampleCount: metrics.sampleCount, }; } return analytics; } /** * Reset performance metrics for a provider or all providers. * @param providerName - (Optional) The name of the provider to reset. If omitted, resets all providers. */ export function resetProviderMetrics(providerName) { if (providerName) { providerMetrics.delete(providerName); } else { providerMetrics.clear(); } }