// llmpool: production-ready LLM API pool manager with load balancing,
// failover, and dynamic configuration.
// Jest test suite covering the pool, providers, config manager, and error types.
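//
// Typical call sequence exercised throughout this suite (config path illustrative):
//
//   const pool = new LLMPool({ configPath: './providers.json' });
//   await pool.initialize();
//   const res = await pool.chat({ messages: [createTextMessage('user', 'Hi')] });
//   // res.content, res.provider, res.usage
//   await pool.shutdown();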
const {
LLMPool,
ConfigManager,
Provider,
ProviderError,
ConfigurationError,
RateLimitError,
PROVIDERS,
createTextMessage,
createImageMessage
} = require('../src/llm-pool');
const fs = require('fs').promises;
const path = require('path');
// Mock axios for testing
jest.mock('axios');
const axios = require('axios');
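// axios is mocked for the whole suite, so no test performs real network I/O;
// each test scripts provider behavior via mockResolvedValue/mockImplementation.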
describe('LLM Pool Manager', () => {
let testConfigPath;
let validConfig;
beforeAll(async () => {
testConfigPath = path.join(__dirname, 'test-config.json');
validConfig = {
providers: [
{
name: 'test-openai',
type: 'openai',
api_key: 'test-key',
base_url: 'https://api.openai.com/v1',
model: 'gpt-3.5-turbo',
priority: 1,
requests_per_minute: 100,
requests_per_day: 1000
},
{
name: 'test-anthropic',
type: 'anthropic',
api_key: 'test-key-2',
base_url: 'https://api.anthropic.com/v1',
model: 'claude-3-sonnet-20240229',
priority: 2,
requests_per_minute: 50,
requests_per_day: 500
}
]
};
await fs.writeFile(testConfigPath, JSON.stringify(validConfig));
});
afterAll(async () => {
try {
await fs.unlink(testConfigPath);
} catch (error) {
// Ignore if file doesn't exist
}
});
describe('Provider Class', () => {
test('should create valid provider', () => {
const config = validConfig.providers[0];
const provider = new Provider(config);
expect(provider.name).toBe(config.name);
expect(provider.type).toBe(config.type);
expect(provider.model).toBe(config.model);
expect(provider.canUse()).toBe(true);
});
test('should validate required fields', () => {
const invalidConfig = { name: 'test' }; // Missing required fields
expect(() => new Provider(invalidConfig)).toThrow(ConfigurationError);
});
test('should handle rate limiting', () => {
const config = { ...validConfig.providers[0], requests_per_minute: 1 };
const provider = new Provider(config);
expect(provider.canUse()).toBe(true);
// Simulate one request; from usage here and below, recordRequest's signature
// appears to be (success, responseTimeMs, tokens, cost) with the last two optional
provider.recordRequest(true, 100, 10, 0.001);
expect(provider.canUse()).toBe(false);
// Reset rate limit (simulate time passing)
provider.lastReset = new Date(Date.now() - 61000); // 61 seconds ago
expect(provider.canUse()).toBe(true);
});
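// With circuit_breaker_threshold: 2, two consecutive failures should trip the
// breaker and take the provider out of rotation.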
test('should handle circuit breaker', () => {
const config = { ...validConfig.providers[0], circuit_breaker_threshold: 2 };
const provider = new Provider(config);
// Record failures
provider.recordRequest(false, 100);
provider.recordRequest(false, 100);
expect(provider.isCircuitBreakerOpen).toBe(true);
expect(provider.canUse()).toBe(false);
});
test('should calculate success rate', () => {
const provider = new Provider(validConfig.providers[0]);
provider.recordRequest(true, 100);
provider.recordRequest(true, 100);
provider.recordRequest(false, 100);
expect(provider.getSuccessRate()).toBeCloseTo(200 / 3, 10); // 2 of 3 succeeded; avoid exact float equality
});
test('should track response times', () => {
const provider = new Provider(validConfig.providers[0]);
provider.recordRequest(true, 100);
provider.recordRequest(true, 200);
provider.recordRequest(true, 300);
expect(provider.getAverageResponseTime()).toBe(200);
});
});
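// ConfigManager loads provider config from a local path or a remote URL,
// validates it, and tracks a checksum so configuration changes can be detected.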
describe('ConfigManager Class', () => {
test('should load local configuration', async () => {
const configManager = new ConfigManager({ configPath: testConfigPath });
const config = await configManager.loadConfig();
expect(config).toEqual(validConfig);
});
test('should validate configuration', async () => {
const invalidConfigPath = path.join(__dirname, 'invalid-config.json');
const invalidConfig = { providers: [{ name: 'invalid' }] };
await fs.writeFile(invalidConfigPath, JSON.stringify(invalidConfig));
const configManager = new ConfigManager({ configPath: invalidConfigPath });
await expect(configManager.loadConfig()).rejects.toThrow(ConfigurationError);
await fs.unlink(invalidConfigPath);
});
test('should detect configuration changes', async () => {
const configManager = new ConfigManager({ configPath: testConfigPath });
// Load initial config
await configManager.loadConfig();
const initialChecksum = configManager.currentChecksum;
// Modify config
const modifiedConfig = {
...validConfig,
providers: [...validConfig.providers, {
name: 'new-provider',
type: 'groq',
api_key: 'new-key',
base_url: 'https://api.groq.com/openai/v1',
model: 'mixtral-8x7b-32768',
priority: 3,
requests_per_minute: 30
}]
};
await fs.writeFile(testConfigPath, JSON.stringify(modifiedConfig));
// Load modified config
await configManager.loadConfig();
expect(configManager.currentChecksum).not.toBe(initialChecksum);
// Restore original config
await fs.writeFile(testConfigPath, JSON.stringify(validConfig));
});
test('should handle remote configuration', async () => {
const mockResponse = { data: validConfig };
axios.get.mockResolvedValue(mockResponse);
const configManager = new ConfigManager({
configUrl: 'https://example.com/config.json'
});
const config = await configManager.loadConfig();
expect(config).toEqual(validConfig);
expect(axios.get).toHaveBeenCalledWith(
'https://example.com/config.json',
expect.any(Object)
);
});
test('should handle remote configuration errors', async () => {
axios.get.mockRejectedValue(new Error('Network error'));
const configManager = new ConfigManager({
configUrl: 'https://example.com/invalid-config.json'
});
await expect(configManager.loadConfig()).rejects.toThrow(ConfigurationError);
});
});
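// LLMPool routes each chat() call to the highest-priority usable provider,
// reformats the request for that provider's API, and fails over on errors.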
describe('LLMPool Class', () => {
let pool;
beforeEach(async () => {
pool = new LLMPool({ configPath: testConfigPath });
await pool.initialize();
});
afterEach(async () => {
await pool.shutdown();
});
test('should initialize with providers', async () => {
expect(pool.providers.size).toBe(2);
expect(pool.providers.has('test-openai')).toBe(true);
expect(pool.providers.has('test-anthropic')).toBe(true);
});
test('should select provider by priority', () => {
const provider = pool.selectProvider();
expect(provider.name).toBe('test-openai'); // Priority 1
});
test('should exclude rate-limited providers', () => {
const provider1 = pool.providers.get('test-openai');
provider1.requestCount = provider1.requestsPerMinute; // Max out requests
const provider = pool.selectProvider();
expect(provider.name).toBe('test-anthropic');
});
test('should format requests for different providers', () => {
const request = {
messages: [createTextMessage('user', 'Hello')],
temperature: 0.7,
max_tokens: 100
};
const openaiProvider = pool.providers.get('test-openai');
const openaiRequest = pool.formatRequestForProvider(openaiProvider, request);
expect(openaiRequest).toHaveProperty('messages');
expect(openaiRequest).toHaveProperty('model', 'gpt-3.5-turbo');
const anthropicProvider = pool.providers.get('test-anthropic');
const anthropicRequest = pool.formatRequestForProvider(anthropicProvider, request);
expect(anthropicRequest).toHaveProperty('messages');
expect(anthropicRequest).toHaveProperty('model', 'claude-3-sonnet-20240229');
});
test('should handle successful requests', async () => {
const mockResponse = {
data: {
id: 'test-id',
choices: [{ message: { content: 'Hello world' } }],
usage: { prompt_tokens: 10, completion_tokens: 2, total_tokens: 12 },
model: 'gpt-3.5-turbo'
}
};
axios.post.mockResolvedValue({ status: 200, ...mockResponse });
const response = await pool.chat({
messages: [createTextMessage('user', 'Hello')]
});
expect(response.content).toBe('Hello world');
expect(response.provider).toBe('test-openai');
expect(response.usage.total_tokens).toBe(12);
});
test('should handle provider failures and retry', async () => {
let callCount = 0;
axios.post.mockImplementation(() => {
callCount++;
if (callCount === 1) {
return Promise.reject(new Error('Network error'));
}
return Promise.resolve({
status: 200,
data: {
id: 'test-id',
choices: [{ message: { content: 'Success on retry' } }],
usage: { prompt_tokens: 10, completion_tokens: 3, total_tokens: 13 }
}
});
});
const response = await pool.chat({
messages: [createTextMessage('user', 'Hello')]
});
expect(response.content).toBe('Success on retry');
expect(callCount).toBe(2); // First call failed, second succeeded
});
test('should handle rate limit errors', async () => {
axios.post.mockResolvedValue({
status: 429,
headers: { 'retry-after': '60' },
data: { error: { message: 'Rate limit exceeded' } }
});
await expect(pool.chat({
messages: [createTextMessage('user', 'Hello')]
})).rejects.toThrow(RateLimitError);
});
test('should get provider statistics', () => {
const stats = pool.getProviderStats();
expect(stats).toHaveProperty('test-openai');
expect(stats).toHaveProperty('test-anthropic');
expect(stats['test-openai']).toHaveProperty('health');
expect(stats['test-openai']).toHaveProperty('usage');
expect(stats['test-openai']).toHaveProperty('performance');
});
test('should get pool health', () => {
const health = pool.getPoolHealth();
expect(health).toHaveProperty('totalProviders', 2);
expect(health).toHaveProperty('availableProviders');
expect(health).toHaveProperty('healthy');
expect(health).toHaveProperty('providers');
});
});
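// The message helpers emit OpenAI-style message shapes: a plain string for
// text-only content, and a content-parts array (text + image_url) for images.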
describe('Message Helpers', () => {
test('should create text message', () => {
const message = createTextMessage('user', 'Hello world');
expect(message).toEqual({
role: 'user',
content: 'Hello world'
});
});
test('should create image message', () => {
const message = createImageMessage('user', 'What is this?', 'data:image/jpeg;base64,abc123');
expect(message).toEqual({
role: 'user',
content: [
{ type: 'text', text: 'What is this?' },
{ type: 'image_url', image_url: { url: 'data:image/jpeg;base64,abc123' } }
]
});
});
});
describe('Error Handling', () => {
test('should create ProviderError with correct properties', () => {
const error = new ProviderError('Test error', 'test-provider', 500, true);
expect(error.name).toBe('ProviderError');
expect(error.message).toBe('Test error');
expect(error.provider).toBe('test-provider');
expect(error.statusCode).toBe(500);
expect(error.retryable).toBe(true);
});
test('should create RateLimitError with reset time', () => {
const error = new RateLimitError('Rate limited', 'test-provider', 60);
expect(error.name).toBe('RateLimitError');
expect(error.provider).toBe('test-provider');
expect(error.resetTime).toBe(60);
});
test('should create ConfigurationError', () => {
const error = new ConfigurationError('Invalid config');
expect(error.name).toBe('ConfigurationError');
expect(error.message).toBe('Invalid config');
});
});
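// Token estimates are heuristic, so these tests only assert a positive count
// rather than an exact value.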
describe('Token Estimation', () => {
let pool;
beforeEach(async () => {
pool = new LLMPool({
configPath: testConfigPath,
useTokenCounting: true
});
await pool.initialize();
});
afterEach(async () => {
await pool.shutdown();
});
test('should estimate tokens for text messages', () => {
const messages = [
createTextMessage('user', 'Hello world'),
createTextMessage('assistant', 'Hi there!')
];
const tokens = pool.estimateTokens(messages);
expect(tokens).toBeGreaterThan(0);
});
test('should handle mixed content messages', () => {
const messages = [
createImageMessage('user', 'What is this?', 'data:image/jpeg;base64,abc123')
];
const tokens = pool.estimateTokens(messages);
expect(tokens).toBeGreaterThan(0);
});
});
describe('Cost Calculation', () => {
test('should calculate request cost', () => {
const provider = new Provider({
...validConfig.providers[0],
input_token_price: 0.5, // $0.5 per 1M tokens
output_token_price: 1.5 // $1.5 per 1M tokens
});
const pool = new LLMPool({ configPath: testConfigPath });
const usage = {
prompt_tokens: 100,
completion_tokens: 50,
total_tokens: 150
};
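// Expected: (100 * 0.5 + 50 * 1.5) / 1e6 = 125 / 1e6 = $0.000125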
const cost = pool.calculateCost(provider, usage);
expect(cost).toBeCloseTo((100 * 0.5 + 50 * 1.5) / 1000000, 12); // tolerate float rounding in calculateCost
});
});
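// Promise.allSettled keeps a single failed request from rejecting the whole
// batch, so partial success can still be asserted.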
describe('Integration Tests', () => {
test('should handle concurrent requests', async () => {
const pool = new LLMPool({ configPath: testConfigPath });
await pool.initialize();
// Mock successful responses
axios.post.mockResolvedValue({
status: 200,
data: {
id: 'test-id',
choices: [{ message: { content: 'Concurrent response' } }],
usage: { prompt_tokens: 10, completion_tokens: 2, total_tokens: 12 }
}
});
const promises = Array(10).fill(0).map((_, i) =>
pool.chat({
messages: [createTextMessage('user', `Request ${i}`)]
})
);
const responses = await Promise.allSettled(promises);
const successful = responses.filter(r => r.status === 'fulfilled').length;
expect(successful).toBeGreaterThan(0);
await pool.shutdown();
});
});
});
// Test utilities
class TestUtils {
static createMockProvider(name, type = 'openai', overrides = {}) {
return {
name,
type,
api_key: 'test-key',
base_url: 'https://api.test.com/v1',
model: 'test-model',
priority: 1,
requests_per_minute: 100,
requests_per_day: 1000,
...overrides
};
}
static createMockResponse(content = 'Test response', provider = 'openai') {
const responses = {
openai: {
status: 200,
data: {
id: 'test-id',
choices: [{ message: { content } }],
usage: { prompt_tokens: 10, completion_tokens: 2, total_tokens: 12 },
model: 'gpt-3.5-turbo'
}
},
anthropic: {
status: 200,
data: {
id: 'test-id',
content: [{ text: content }],
usage: { input_tokens: 10, output_tokens: 2 },
model: 'claude-3-sonnet-20240229'
}
}
};
return responses[provider] || responses.openai;
}
static async createTestConfig(providers = null) {
const config = {
providers: providers || [
TestUtils.createMockProvider('test-provider-1'),
TestUtils.createMockProvider('test-provider-2', 'anthropic', { priority: 2 })
]
};
const configPath = path.join(__dirname, `test-config-${Date.now()}.json`);
await fs.writeFile(configPath, JSON.stringify(config));
return { config, configPath };
}
static async cleanupTestConfig(configPath) {
try {
await fs.unlink(configPath);
} catch (error) {
// Ignore if file doesn't exist
}
}
static mockAxiosResponse(responses) {
let callCount = 0;
axios.post.mockImplementation(() => {
// For an array, replay entries in order and stick on the last once exhausted
const response = Array.isArray(responses)
? responses[Math.min(callCount++, responses.length - 1)]
: responses;
if (response instanceof Error) {
return Promise.reject(response);
}
return Promise.resolve(response);
});
}
}
// Performance Tests
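// Thresholds below are deliberately loose smoke-test bounds (at least 50%
// success, under 30 s for 100 requests), not performance benchmarks.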
describe('Performance Tests', () => {
let pool;
let configPath;
beforeEach(async () => {
// Destructure to a distinct name so the `path` module import isn't shadowed
const { configPath: createdPath } = await TestUtils.createTestConfig([
TestUtils.createMockProvider('fast-provider', 'openai', { priority: 1 }),
TestUtils.createMockProvider('slow-provider', 'anthropic', { priority: 2 }),
TestUtils.createMockProvider('backup-provider', 'groq', { priority: 3 })
]);
configPath = createdPath;
pool = new LLMPool({ configPath });
await pool.initialize();
});
afterEach(async () => {
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
test('should handle high throughput requests', async () => {
TestUtils.mockAxiosResponse(TestUtils.createMockResponse('Fast response'));
const startTime = Date.now();
const promises = Array(100).fill(0).map((_, i) =>
pool.chat({
messages: [createTextMessage('user', `High throughput test ${i}`)]
}).catch(() => null) // Don't fail the test on individual request failures
);
const results = await Promise.allSettled(promises);
const duration = Date.now() - startTime;
const successCount = results.filter(r => r.status === 'fulfilled' && r.value !== null).length;
console.log(`Processed ${successCount}/100 requests in ${duration}ms`);
expect(successCount).toBeGreaterThan(50); // At least 50% success rate
expect(duration).toBeLessThan(30000); // Complete within 30 seconds
});
test('should maintain performance under provider failures', async () => {
// First provider fails, others succeed
let callCount = 0;
axios.post.mockImplementation(() => {
callCount++;
if (callCount <= 10) {
return Promise.reject(new Error('Provider temporarily down'));
}
return Promise.resolve(TestUtils.createMockResponse('Backup success'));
});
const promises = Array(20).fill(0).map((_, i) =>
pool.chat({
messages: [createTextMessage('user', `Failover test ${i}`)]
}).catch(() => null)
);
const results = await Promise.allSettled(promises);
const successCount = results.filter(r => r.status === 'fulfilled' && r.value !== null).length;
expect(successCount).toBeGreaterThan(5); // Some requests should succeed via fallback
});
});
// Security Tests
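// The sanitization check serializes the pool's public provider view and
// asserts the raw API key string never appears in the output.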
describe('Security Tests', () => {
test('should sanitize API keys in provider stats', async () => {
const pool = new LLMPool();
const provider = new Provider({
name: 'security-test',
type: 'openai',
api_key: 'very-secret-key-12345',
base_url: 'https://api.openai.com/v1',
model: 'gpt-3.5-turbo'
});
pool.providers.set('security-test', provider);
const publicProviders = typeof pool.getProviders === 'function' ? pool.getProviders() : Array.from(pool.providers.values());
// API keys should be hidden in any public interface
expect(JSON.stringify(publicProviders)).not.toContain('very-secret-key-12345');
});
test('should validate request inputs', async () => {
const { configPath } = await TestUtils.createTestConfig();
const pool = new LLMPool({ configPath });
await pool.initialize();
// Test with invalid messages
await expect(pool.chat({ messages: null })).rejects.toThrow();
await expect(pool.chat({ messages: 'invalid' })).rejects.toThrow();
await expect(pool.chat({})).rejects.toThrow();
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
test('should handle malformed configuration gracefully', async () => {
const malformedConfig = {
providers: [
{
name: 'malformed',
type: 'unknown-provider', // Invalid provider type
api_key: 'test',
base_url: 'invalid-url',
model: 'test'
}
]
};
const configPath = path.join(__dirname, 'malformed-config.json');
await fs.writeFile(configPath, JSON.stringify(malformedConfig));
const configManager = new ConfigManager({ configPath });
await expect(configManager.loadConfig()).rejects.toThrow(ConfigurationError);
await TestUtils.cleanupTestConfig(configPath);
});
});
// Edge Cases
describe('Edge Cases', () => {
test('should handle empty provider list', async () => {
const emptyConfig = { providers: [] };
const configPath = path.join(__dirname, 'empty-config.json');
await fs.writeFile(configPath, JSON.stringify(emptyConfig));
const pool = new LLMPool({ configPath });
await pool.initialize();
await expect(pool.chat({
messages: [createTextMessage('user', 'Hello')]
})).rejects.toThrow();
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
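// requests_per_minute: 0 makes canUse() false from the first call, so the
// pool should report zero available providers.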
test('should handle all providers rate-limited', async () => {
const { configPath } = await TestUtils.createTestConfig([
TestUtils.createMockProvider('limited-1', 'openai', { requests_per_minute: 0 }),
TestUtils.createMockProvider('limited-2', 'anthropic', { requests_per_minute: 0 })
]);
const pool = new LLMPool({ configPath });
await pool.initialize();
// All providers should be rate-limited
const health = pool.getPoolHealth();
expect(health.availableProviders).toBe(0);
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
test('should handle network timeouts', async () => {
const { configPath } = await TestUtils.createTestConfig();
const pool = new LLMPool({
configPath,
timeout: 100 // Very short timeout
});
await pool.initialize();
// Mock a valid response that arrives only after the 100 ms timeout has elapsed
axios.post.mockImplementation(() =>
new Promise(resolve => setTimeout(() => resolve(TestUtils.createMockResponse('Too late')), 1000))
);
await expect(pool.chat({
messages: [createTextMessage('user', 'Hello')]
})).rejects.toThrow();
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
test('should handle very large messages', async () => {
const { configPath } = await TestUtils.createTestConfig();
const pool = new LLMPool({ configPath });
await pool.initialize();
TestUtils.mockAxiosResponse(TestUtils.createMockResponse('Response to large message'));
const largeMessage = 'x'.repeat(100000); // 100K characters
const response = await pool.chat({
messages: [createTextMessage('user', largeMessage)]
});
expect(response.content).toBe('Response to large message');
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
test('should handle special characters in messages', async () => {
const { configPath } = await TestUtils.createTestConfig();
const pool = new LLMPool({ configPath });
await pool.initialize();
TestUtils.mockAxiosResponse(TestUtils.createMockResponse('Handled special chars'));
const specialMessage = '🚀 Hello! @#$%^&*()_+ 中文 العربية 🎉';
const response = await pool.chat({
messages: [createTextMessage('user', specialMessage)]
});
expect(response.content).toBe('Handled special chars');
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
});
// Real-world Scenarios
describe('Real-world Scenarios', () => {
test('should handle provider maintenance windows', async () => {
const { configPath } = await TestUtils.createTestConfig([
// Distinct base_urls so the URL-based mock below can tell the providers apart
TestUtils.createMockProvider('primary', 'openai', { priority: 1, base_url: 'https://api.openai.com/v1' }),
TestUtils.createMockProvider('backup', 'anthropic', { priority: 2, base_url: 'https://api.anthropic.com/v1' })
]);
const pool = new LLMPool({ configPath, maxRetries: 3 });
await pool.initialize();
// Simulate primary provider down for maintenance
axios.post.mockImplementation((url) => {
if (url.includes('openai')) {
return Promise.reject(new Error('Service temporarily unavailable'));
}
return Promise.resolve(TestUtils.createMockResponse('Backup response', 'anthropic'));
});
const response = await pool.chat({
messages: [createTextMessage('user', 'Hello during maintenance')]
});
expect(response.content).toBe('Backup response');
expect(response.provider).toBe('backup');
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
test('should recover from temporary network issues', async () => {
const { configPath } = await TestUtils.createTestConfig();
const pool = new LLMPool({ configPath, maxRetries: 3, retryDelay: 100 });
await pool.initialize();
// First two attempts fail, third succeeds
let attemptCount = 0;
axios.post.mockImplementation(() => {
attemptCount++;
if (attemptCount <= 2) {
return Promise.reject(new Error('ECONNRESET'));
}
return Promise.resolve(TestUtils.createMockResponse('Recovered successfully'));
});
const response = await pool.chat({
messages: [createTextMessage('user', 'Network recovery test')]
});
expect(response.content).toBe('Recovered successfully');
expect(attemptCount).toBe(3);
await pool.shutdown();
await TestUtils.cleanupTestConfig(configPath);
});
});
// Export test utilities for external use
module.exports = {
TestUtils
};