// @aj-archipelago/cortex — vision plugin message-conversion tests.
// Cortex is a GraphQL API for AI. It provides a simple, extensible
// interface for using AI services from OpenAI, Azure and others.
import test from 'ava';
import OpenAIVisionPlugin from '../server/plugins/openAiVisionPlugin.js';
import Claude3VertexPlugin from '../server/plugins/claude3VertexPlugin.js';
import Gemini15VisionPlugin from '../server/plugins/gemini15VisionPlugin.js';
import GeminiVisionPlugin from '../server/plugins/geminiVisionPlugin.js';
// Mock pathway and model for plugin initialization — the minimal object
// shapes the plugin constructors need for these conversion-only tests.
const mockPathway = { name: 'test', temperature: 0.7 };
const mockModel = { name: 'test-model' };
/**
 * Validate that a base64 string decodes to data starting with a known
 * image-format signature (JPEG, PNG, GIF, or WEBP).
 *
 * Fix: the previous version treated ANY RIFF container (WAV, AVI, ...) as a
 * WEBP image because it only checked the generic 4-byte "RIFF" magic. WEBP
 * additionally requires the ASCII "WEBP" tag at bytes 8-11, which is now
 * verified. Also uses subarray() instead of the deprecated Buffer.slice().
 *
 * @param {string} base64Data - Base64-encoded binary data (no data: prefix).
 * @returns {boolean} true when the decoded bytes match a known image header.
 */
function validateBase64Image(base64Data) {
    // Decode enough bytes to cover the longest signature we check:
    // WEBP needs bytes 0-3 ("RIFF") plus bytes 8-11 ("WEBP").
    const decoded = Buffer.from(base64Data, 'base64').subarray(0, 12);
    // True when `decoded` contains exactly `bytes` starting at `offset`.
    const matchesAt = (bytes, offset = 0) =>
        decoded.length >= offset + bytes.length &&
        decoded.subarray(offset, offset + bytes.length).equals(Buffer.from(bytes));
    return (
        matchesAt([0xFF, 0xD8, 0xFF]) ||                 // JPEG
        matchesAt([0x89, 0x50, 0x4E, 0x47]) ||           // PNG
        matchesAt([0x47, 0x49, 0x46]) ||                 // GIF
        (matchesAt([0x52, 0x49, 0x46, 0x46]) &&          // RIFF container...
         matchesAt([0x57, 0x45, 0x42, 0x50], 8))         // ...tagged WEBP
    );
}
// Build a fresh instance of every vision plugin under test, keyed by a
// short provider name, so each test starts from clean plugin state.
const createPlugins = () => {
    return {
        openai: new OpenAIVisionPlugin(mockPathway, mockModel),
        claude: new Claude3VertexPlugin(mockPathway, mockModel),
        gemini15: new Gemini15VisionPlugin(mockPathway, mockModel),
        gemini: new GeminiVisionPlugin(mockPathway, mockModel),
    };
};
// Sample base64 image data: a deliberately truncated JPEG data URL.
// Only the leading bytes matter — '/9j/' decodes to the JPEG magic
// (FF D8 FF), which is what the header-validation helper inspects.
const sampleBase64Image = 'data:image/jpeg;base64,/9j/4AAQSkZJRgABAQEASABIAAD/2wBDAA...';
// Test OpenAI to Claude conversion when the image arrives as an inline
// base64 data URL.
test('OpenAI to Claude conversion data url', async (t) => {
    const { openai, claude } = createPlugins();
    const openaiMessages = [
        { role: 'system', content: 'You are a helpful assistant.' },
        { role: 'user', content: [
            { type: 'text', text: 'What\'s in this image?' },
            { type: 'image_url', image_url: { url: sampleBase64Image } }
        ]}
    ];
    const parsedOpenAI = await openai.tryParseMessages(openaiMessages);
    const { system, modifiedMessages } = await claude.convertMessagesToClaudeVertex(parsedOpenAI);
    // The system message is hoisted out of the list into `system`,
    // leaving only the user message.
    t.is(modifiedMessages.length, 1);
    t.is(system, 'You are a helpful assistant.');
    t.is(modifiedMessages[0].role, 'user');
    t.true(modifiedMessages[0].content[0].type === 'text');
    t.is(modifiedMessages[0].content[0].text, 'What\'s in this image?');
    // The data URL becomes Claude's { type: 'image', source: { type: 'base64', ... } } shape.
    t.true(modifiedMessages[0].content[1].type === 'image');
    t.true(modifiedMessages[0].content[1].source.type === 'base64');
    t.true(validateBase64Image(modifiedMessages[0].content[1].source.data), 'Base64 data should be a valid image');
});
// Test OpenAI to Claude conversion with a regular (remote) image url.
// NOTE(review): this fetches a live URL from static.toiimg.com, so the
// test depends on network access — confirm this is intended for CI.
test('OpenAI to Claude conversion image url', async (t) => {
    const { openai, claude } = createPlugins();
    const openaiMessages = [
        { role: 'system', content: 'You are a helpful assistant.' },
        { role: 'user', content: [
            { type: 'text', text: 'What\'s in this image?' },
            { type: 'image_url', image_url: { url: "https://static.toiimg.com/thumb/msid-102827471,width-1280,height-720,resizemode-4/102827471.jpg" } }
        ]}
    ];
    const parsedOpenAI = await openai.tryParseMessages(openaiMessages);
    const { system, modifiedMessages } = await claude.convertMessagesToClaudeVertex(parsedOpenAI);
    t.is(modifiedMessages.length, 1);
    t.is(system, 'You are a helpful assistant.');
    t.is(modifiedMessages[0].role, 'user');
    t.true(modifiedMessages[0].content[0].type === 'text');
    t.is(modifiedMessages[0].content[0].text, 'What\'s in this image?');
    // The remote image is expected to be downloaded and inlined as base64.
    t.true(modifiedMessages[0].content[1].type === 'image');
    t.true(validateBase64Image(modifiedMessages[0].content[1].source.data), 'Base64 data should be a valid image');
});
// Test OpenAI to Gemini conversion. Gemini (1.0) folds the system message
// into the first user turn's parts; Gemini 1.5 returns it separately as
// a `system` instruction object.
test('OpenAI to Gemini conversion', async (t) => {
    const { gemini, gemini15 } = createPlugins();
    const openaiMessages = [
        { role: 'system', content: 'You are a helpful assistant.' },
        { role: 'user', content: [
            { type: 'text', text: 'Describe this image:' },
            { type: 'image_url', image_url: { url: 'gs://my-bucket/image.jpg' } }
        ]}
    ];
    const { modifiedMessages, system } = gemini.convertMessagesToGemini(openaiMessages);
    const { modifiedMessages: modifiedMessages15, system: system15 } = gemini15.convertMessagesToGemini(openaiMessages);
    // Gemini: system text is prepended as the first part of the user turn.
    t.is(modifiedMessages.length, 1);
    t.is(modifiedMessages[0].role, 'user');
    t.is(modifiedMessages[0].parts.length, 3);
    t.is(modifiedMessages[0].parts[0].text, 'You are a helpful assistant.');
    t.is(modifiedMessages[0].parts[1].text, 'Describe this image:');
    t.is(modifiedMessages[0].parts[2].fileData.fileUri, 'gs://my-bucket/image.jpg');
    // Gemini 1.5: system text lives in its own `system.parts` object.
    t.is(system15.parts.length, 1);
    t.is(modifiedMessages15.length, 1);
    t.is(modifiedMessages15[0].role, 'user');
    t.is(modifiedMessages15[0].parts.length, 2);
    t.is(modifiedMessages15[0].parts[0].text, 'Describe this image:');
    t.is(modifiedMessages15[0].parts[1].fileData.fileUri, 'gs://my-bucket/image.jpg');
    t.is(system15.parts[0].text, 'You are a helpful assistant.');
});
// Test special Cortex properties (gcs and url): a content item carrying both
// a `gcs` URI and a fallback `url`. Claude (no GCS access) should fetch the
// URL and inline base64; the Gemini variants should pass the GCS URI through.
// Fix: dropped the unused `openai` plugin and the unused `system` results
// from the destructuring patterns.
test('Cortex special properties conversion', async (t) => {
    const { claude, gemini, gemini15 } = createPlugins();
    const cortexMessages = [
        { role: 'user', content: [
            { type: 'text', text: 'Analyze this image:' },
            { type: 'image_url', gcs: 'gs://cortex-bucket/special-image.png', url: 'https://static.toiimg.com/thumb/msid-102827471,width-1280,height-720,resizemode-4/102827471.jpg' }
        ]}
    ];
    const { modifiedMessages: claudeMessages } = await claude.convertMessagesToClaudeVertex(cortexMessages);
    const { modifiedMessages: geminiMessages } = gemini.convertMessagesToGemini(cortexMessages);
    const { modifiedMessages: geminiMessages15 } = gemini15.convertMessagesToGemini(cortexMessages);
    // Check Claude conversion: the fetched JPEG starts with the /9j/ base64 magic.
    t.true(claudeMessages[0].content[1].source.data.startsWith('/9j/4AAQ'));
    // Check Gemini conversion: both versions reference the GCS URI directly.
    t.is(geminiMessages[0].parts[1].fileData.fileUri, 'gs://cortex-bucket/special-image.png');
    t.is(geminiMessages15[0].parts[1].fileData.fileUri, 'gs://cortex-bucket/special-image.png');
});
// Test mixed content types: plain-string messages interleaved with
// multimodal (text + image) array content across system/user/assistant roles.
// Fix: dropped the unused `openai` plugin from the destructuring pattern
// (this test feeds the raw messages straight to the converters).
test('Mixed content types conversion', async (t) => {
    const { claude, gemini, gemini15 } = createPlugins();
    const mixedMessages = [
        { role: 'system', content: 'You are a vision analysis AI.' },
        { role: 'user', content: 'What do you see?' },
        { role: 'assistant', content: 'I need an image to analyze.' },
        { role: 'user', content: [
            { type: 'text', text: 'Here\'s an image:' },
            { type: 'image_url', image_url: { url: sampleBase64Image } },
            { type: 'text', text: 'And another one:' },
            { type: 'image_url', gcs: 'gs://cortex-bucket/another-image.jpg', url: 'https://static.toiimg.com/thumb/msid-102827471,width-1280,height-720,resizemode-4/102827471.jpg' }
        ]}
    ];
    const { system: claudeSystem, modifiedMessages: claudeMessages } = await claude.convertMessagesToClaudeVertex(mixedMessages);
    const { modifiedMessages } = gemini.convertMessagesToGemini(mixedMessages);
    const { modifiedMessages: modifiedMessages15, system: system15 } = gemini15.convertMessagesToGemini(mixedMessages);
    // Check Claude conversion: both images end up as inline base64 sources.
    t.is(claudeMessages.length, 3);
    t.true(claudeMessages[2].content[0].text.includes('Here\'s an image:'));
    t.true(claudeMessages[2].content[1].source.type === 'base64');
    t.true(validateBase64Image(claudeMessages[2].content[1].source.data), 'First image should be valid');
    t.true(claudeMessages[2].content[2].text.includes('And another one:'));
    t.true(claudeMessages[2].content[3].source.type === 'base64');
    t.true(validateBase64Image(claudeMessages[2].content[3].source.data), 'Second image should be valid');
    t.is(claudeSystem, 'You are a vision analysis AI.');
    // Check Gemini conversion: system text merges into the first user turn;
    // the data URL becomes inlineData, the GCS item becomes fileData.
    t.is(modifiedMessages.length, 3);
    t.is(modifiedMessages[0].parts.length, 2);
    t.is(modifiedMessages[0].parts[0].text, 'You are a vision analysis AI.');
    t.is(modifiedMessages[0].parts[1].text, 'What do you see?');
    t.is(modifiedMessages[1].parts[0].text, 'I need an image to analyze.');
    t.is(modifiedMessages[2].parts.length, 4);
    t.is(modifiedMessages[2].parts[0].text, 'Here\'s an image:');
    t.true('inlineData' in modifiedMessages[2].parts[1]);
    t.is(modifiedMessages[2].parts[2].text, 'And another one:');
    t.is(modifiedMessages[2].parts[3].fileData.fileUri, 'gs://cortex-bucket/another-image.jpg');
    // Check Gemini 1.5 conversion: same parts, but the system text is separate.
    t.is(modifiedMessages15.length, 3);
    t.is(modifiedMessages15[2].parts.length, 4);
    t.is(modifiedMessages15[2].parts[0].text, 'Here\'s an image:');
    t.true('inlineData' in modifiedMessages15[2].parts[1]);
    t.is(modifiedMessages15[2].parts[2].text, 'And another one:');
    t.is(modifiedMessages15[2].parts[3].fileData.fileUri, 'gs://cortex-bucket/another-image.jpg');
    t.is(system15.parts[0].text, 'You are a vision analysis AI.');
});
// Test unsupported mime types (e.g., PDF for Claude): the converter should
// not emit an image block for a PDF; the item is passed through as text.
// Fix: dropped the unused `system` binding from the destructuring pattern.
test('Unsupported mime type conversion', async (t) => {
    const { openai, claude } = createPlugins();
    const pdfMessage = [
        { role: 'user', content: [
            { type: 'text', text: 'Can you analyze this PDF?' },
            { type: 'image_url', image_url: { url: 'https://www.w3.org/WAI/ER/tests/xhtml/testfiles/resources/pdf/dummy.pdf' } }
        ]}
    ];
    const parsedOpenAI = await openai.tryParseMessages(pdfMessage);
    const { modifiedMessages } = await claude.convertMessagesToClaudeVertex(parsedOpenAI);
    t.is(modifiedMessages[0].content.length, 2);
    t.is(modifiedMessages[0].content[0].text, 'Can you analyze this PDF?');
    // The unsupported item survives as text mentioning 'image_url' rather
    // than being converted to an image block.
    t.true(modifiedMessages[0].content[1].text.includes('image_url'));
});
// Test pathological cases: repeated roles, a mid-conversation system message,
// empty-string contents, and consecutive user messages that converters must
// merge into single turns.
test('Pathological cases', async (t) => {
    const { openai, claude, gemini, gemini15 } = createPlugins();
    const pathologicalMessages = [
        { role: 'system', content: 'You are a helpful assistant.' },
        { role: 'user', content: 'Hello' },
        { role: 'user', content: 'Another greeting' },
        { role: 'assistant', content: 'Hi there!' },
        { role: 'system', content: 'You are also very knowledgeable.' },
        { role: 'user', content: '' },
        { role: 'assistant', content: '' },
        { role: 'user', content: 'How are you?' },
        { role: 'user', content: [
            { type: 'text', text: 'What\'s this?' },
            { type: 'image_url', image_url: { url: sampleBase64Image } }
        ]},
        { role: 'user', content: 'Another question' },
    ];
    const parsedOpenAI = await openai.tryParseMessages(pathologicalMessages);
    // Test Claude conversion: both system messages are joined with a newline,
    // empty messages are dropped, and adjacent same-role turns are merged.
    const { system: claudeSystem, modifiedMessages: claudeMessages } = await claude.convertMessagesToClaudeVertex(parsedOpenAI);
    t.is(claudeSystem, 'You are a helpful assistant.\nYou are also very knowledgeable.');
    t.is(claudeMessages.length, 3);
    t.is(claudeMessages[0].role, 'user');
    t.is(claudeMessages[0].content[0].text, 'Hello\nAnother greeting');
    t.is(claudeMessages[1].role, 'assistant');
    t.is(claudeMessages[1].content[0].text, 'Hi there!');
    t.is(claudeMessages[2].role, 'user');
    t.true(Array.isArray(claudeMessages[2].content));
    t.is(claudeMessages[2].content[0].text, 'How are you?');
    t.is(claudeMessages[2].content[1].text, 'What\'s this?');
    t.is(claudeMessages[2].content[2].type, 'image');
    t.true(claudeMessages[2].content[2].source.data.startsWith('/9j/4AAQ'));
    t.is(claudeMessages[2].content[3].text, 'Another question');
    // Test Gemini conversion: system messages stay in-line as parts of the
    // nearest user turn rather than being hoisted.
    const { modifiedMessages: geminiMessages } = gemini.convertMessagesToGemini(parsedOpenAI);
    t.is(geminiMessages.length, 3);
    t.is(geminiMessages[0].role, 'user');
    t.is(geminiMessages[0].parts[0].text, 'You are a helpful assistant.');
    t.is(geminiMessages[0].parts[1].text, 'Hello');
    t.is(geminiMessages[0].parts[2].text, 'Another greeting');
    t.is(geminiMessages[1].parts[0].text, 'Hi there!');
    t.is(geminiMessages[2].parts[0].text, 'You are also very knowledgeable.');
    t.is(geminiMessages[2].parts[1].text, 'How are you?');
    t.is(geminiMessages[2].parts[2].text, 'What\'s this?');
    t.true('inlineData' in geminiMessages[2].parts[3]);
    t.is(geminiMessages[2].parts[4].text, 'Another question');
    // Test Gemini 1.5 conversion: both system messages collect into the
    // separate system object, one part each.
    const { modifiedMessages: geminiMessages15, system: geminiSystem15 } = gemini15.convertMessagesToGemini(parsedOpenAI);
    t.is(geminiSystem15.parts[0].text, 'You are a helpful assistant.');
    t.is(geminiSystem15.parts[1].text, 'You are also very knowledgeable.');
    t.is(geminiMessages15.length, 3);
    // First user message combines "Hello" and "Another greeting"
    t.is(geminiMessages15[0].role, 'user');
    t.is(geminiMessages15[0].parts[0].text, 'Hello');
    t.is(geminiMessages15[0].parts[1].text, 'Another greeting');
    // Assistant message "Hi there!"
    t.is(geminiMessages15[1].role, 'assistant');
    t.is(geminiMessages15[1].parts[0].text, 'Hi there!');
    // Final user message combines "How are you?", image content, and "Another question"
    t.is(geminiMessages15[2].role, 'user');
    t.is(geminiMessages15[2].parts[0].text, 'How are you?');
    t.is(geminiMessages15[2].parts[1].text, 'What\'s this?');
    t.true('inlineData' in geminiMessages15[2].parts[2]);
    t.is(geminiMessages15[2].parts[3].text, 'Another question');
});
// Test empty message array: every converter must return empty results
// without throwing. Note Claude yields an empty string for `system`,
// while Gemini 1.5 yields null.
test('Empty message array', async (t) => {
    const { openai, claude, gemini, gemini15 } = createPlugins();
    const emptyMessages = [];
    const parsedOpenAI = await openai.tryParseMessages(emptyMessages);
    // Test Claude conversion
    const { system: claudeSystem, modifiedMessages: claudeMessages } = await claude.convertMessagesToClaudeVertex(parsedOpenAI);
    t.is(claudeSystem, '');
    t.is(claudeMessages.length, 0);
    // Test Gemini conversion
    const { modifiedMessages: geminiMessages } = gemini.convertMessagesToGemini(parsedOpenAI);
    t.is(geminiMessages.length, 0);
    // Test Gemini 1.5 conversion
    const { modifiedMessages: geminiMessages15, system: geminiSystem15 } = gemini15.convertMessagesToGemini(parsedOpenAI);
    t.is(geminiSystem15, null);
    t.is(geminiMessages15.length, 0);
});
// Test simple string array content: bare strings inside a content array
// (no { type: ... } wrapper) must become plain text parts for Gemini 1.5.
test('Simple string array content', async (t) => {
    const { gemini15 } = createPlugins();
    const messages = [
        { role: 'user', content: "Initial message" },
        { role: 'assistant', content: [
            "\"Searchin' for my lost shaker of salt...\"\n",
        ]},
        { role: 'user', content: [
            "Here's another simple string in an array",
        ]}
    ];
    const { modifiedMessages } = gemini15.convertMessagesToGemini(messages);
    t.is(modifiedMessages.length, 3);
    t.is(modifiedMessages[0].role, 'user');
    t.is(modifiedMessages[0].parts.length, 1);
    t.is(modifiedMessages[0].parts[0].text, "Initial message");
    t.is(modifiedMessages[1].role, 'assistant');
    t.is(modifiedMessages[1].parts.length, 1);
    // The string is preserved verbatim, including quotes and trailing newline.
    t.is(modifiedMessages[1].parts[0].text, "\"Searchin' for my lost shaker of salt...\"\n");
    t.is(modifiedMessages[2].role, 'user');
    t.is(modifiedMessages[2].parts.length, 1);
    t.is(modifiedMessages[2].parts[0].text, "Here's another simple string in an array");
});
// Test string-encoded multimodal content: content items delivered as
// JSON strings (not objects) should be parsed and converted as if they
// had arrived as { type: 'text' | 'image_url', ... } objects.
test('String-encoded multimodal content', async (t) => {
    const { gemini15 } = createPlugins();
    const messages = [
        { role: 'user', content: [
            JSON.stringify({
                type: 'text',
                text: 'What is in this image?'
            }),
            JSON.stringify({
                type: 'image_url',
                image_url: { url: 'gs://my-bucket/image.jpg' }
            })
        ]},
        { role: 'assistant', content: [
            JSON.stringify({
                type: 'text',
                text: 'I see a cat.'
            })
        ]},
        { role: 'user', content: [
            JSON.stringify({
                type: 'text',
                text: 'Is it a big cat?'
            })
        ]}
    ];
    const { modifiedMessages } = gemini15.convertMessagesToGemini(messages);
    t.is(modifiedMessages.length, 3);
    t.is(modifiedMessages[0].role, 'user');
    t.is(modifiedMessages[0].parts.length, 2);
    t.is(modifiedMessages[0].parts[0].text, 'What is in this image?');
    // The stringified image_url with a GCS URI becomes a fileData part.
    t.true('fileData' in modifiedMessages[0].parts[1]);
    t.is(modifiedMessages[0].parts[1].fileData.fileUri, 'gs://my-bucket/image.jpg');
    t.is(modifiedMessages[1].role, 'assistant');
    t.is(modifiedMessages[1].parts.length, 1);
    t.is(modifiedMessages[1].parts[0].text, 'I see a cat.');
    t.is(modifiedMessages[2].role, 'user');
    t.is(modifiedMessages[2].parts.length, 1);
    t.is(modifiedMessages[2].parts[0].text, 'Is it a big cat?');
});
// Test messages with only system messages: Claude joins them into its
// system string (no turns left), plain Gemini keeps them as a single user
// turn with one part each, Gemini 1.5 moves them all into `system.parts`.
test('Only system messages', async (t) => {
    const { openai, claude, gemini, gemini15 } = createPlugins();
    const onlySystemMessages = [
        { role: 'system', content: 'You are an AI assistant.' },
        { role: 'system', content: 'You are helpful and friendly.' },
    ];
    const parsedOpenAI = await openai.tryParseMessages(onlySystemMessages);
    // Test Claude conversion
    const { system: claudeSystem, modifiedMessages: claudeMessages } = await claude.convertMessagesToClaudeVertex(parsedOpenAI);
    t.is(claudeSystem, 'You are an AI assistant.\nYou are helpful and friendly.');
    t.is(claudeMessages.length, 0);
    // Test Gemini conversion
    const { modifiedMessages: geminiMessages } = gemini.convertMessagesToGemini(parsedOpenAI);
    t.is(geminiMessages.length, 1);
    t.is(geminiMessages[0].parts[0].text, 'You are an AI assistant.');
    t.is(geminiMessages[0].parts[1].text, 'You are helpful and friendly.');
    // Test Gemini 1.5 conversion
    const { modifiedMessages: geminiMessages15, system: geminiSystem15 } = gemini15.convertMessagesToGemini(parsedOpenAI);
    t.is(geminiSystem15.parts[0].text, 'You are an AI assistant.');
    t.is(geminiSystem15.parts[1].text, 'You are helpful and friendly.');
    t.is(geminiMessages15.length, 0);
});
// Test different image URL types for Gemini 1.5: GCS URIs map to fileData,
// data URLs map to inlineData, and plain HTTP(S) URLs (including Azure
// blob URLs) are silently dropped.
test('Gemini 1.5 image URL type handling', t => {
    const { gemini15 } = createPlugins();
    const messages = [
        { role: 'user', content: [
            { type: 'text', text: 'Process these images:' },
            // GCS URL - should be converted to fileData
            { type: 'image_url', image_url: { url: 'gs://my-bucket/image1.jpg' } },
            // Base64 URL - should be converted to inlineData
            { type: 'image_url', image_url: { url: 'data:image/jpeg;base64,/9j/4AAQSkZJRg...' } },
            // Regular HTTP URL - should be dropped (return null)
            { type: 'image_url', image_url: { url: 'https://example.com/image.jpg' } },
            // Azure blob URL - should be dropped (return null)
            { type: 'image_url', image_url: { url: 'https://myaccount.blob.core.windows.net/container/image.jpg' } }
        ]}
    ];
    const { modifiedMessages } = gemini15.convertMessagesToGemini(messages);
    t.is(modifiedMessages.length, 1);
    t.is(modifiedMessages[0].parts.length, 3); // text + gcs + base64 (2 urls dropped)
    // Check text part
    t.is(modifiedMessages[0].parts[0].text, 'Process these images:');
    // Check GCS URL handling: mimeType is inferred (image/jpeg for .jpg).
    t.true('fileData' in modifiedMessages[0].parts[1]);
    t.is(modifiedMessages[0].parts[1].fileData.fileUri, 'gs://my-bucket/image1.jpg');
    t.is(modifiedMessages[0].parts[1].fileData.mimeType, 'image/jpeg');
    // Check base64 URL handling: the data: prefix is stripped, payload kept verbatim.
    t.true('inlineData' in modifiedMessages[0].parts[2]);
    t.is(modifiedMessages[0].parts[2].inlineData.mimeType, 'image/jpeg');
    t.is(modifiedMessages[0].parts[2].inlineData.data, '/9j/4AAQSkZJRg...');
});
// Test edge cases for image URLs in Gemini 1.5: every malformed or missing
// URL must be filtered out, leaving only the text part.
test('Gemini 1.5 image URL edge cases', t => {
    const { gemini15 } = createPlugins();
    const messages = [
        { role: 'user', content: [
            { type: 'text', text: 'Process these edge cases:' },
            // Empty URL
            { type: 'image_url', image_url: { url: '' } },
            // Malformed base64
            { type: 'image_url', image_url: { url: 'data:image/jpeg;base64,' } },
            // Malformed GCS URL
            { type: 'image_url', image_url: { url: 'gs://' } },
            // Missing URL property
            { type: 'image_url', image_url: {} },
            // Null URL
            { type: 'image_url', image_url: { url: null } }
        ]}
    ];
    const { modifiedMessages } = gemini15.convertMessagesToGemini(messages);
    // Verify basic message structure
    t.is(modifiedMessages.length, 1);
    t.true(Array.isArray(modifiedMessages[0].parts));
    // Check each part to ensure no invalid images were converted
    modifiedMessages[0].parts.forEach(part => {
        if (part.text) {
            t.is(part.text, 'Process these edge cases:', 'Only expected text content should be present');
        } else {
            t.fail('Found non-text part that should have been filtered out: ' + JSON.stringify(part));
        }
    });
    // Verify we only have one part (the text)
    t.is(modifiedMessages[0].parts.length, 1, 'Should only have the text part');
});
// Test multiple images in single message for Claude.
// NOTE(review): the input has 5 content items but only 4 are asserted —
// the final gcs-only item (no image_url/url fallback) is apparently
// dropped by the Claude converter; confirm that is the intended behavior.
test('Multiple images in single Claude message', async (t) => {
    const { claude } = createPlugins();
    const multiImageMessage = [
        { role: 'user', content: [
            { type: 'text', text: 'Compare these images:' },
            { type: 'image_url', image_url: { url: sampleBase64Image } },
            { type: 'text', text: 'with this one:' },
            { type: 'image_url', image_url: { url: sampleBase64Image } },
            { type: 'image_url', gcs: 'gs://cortex-bucket/image.jpg' }
        ]}
    ];
    const { modifiedMessages } = await claude.convertMessagesToClaudeVertex(multiImageMessage);
    t.is(modifiedMessages.length, 1);
    t.is(modifiedMessages[0].role, 'user');
    t.is(modifiedMessages[0].content.length, 4);
    t.is(modifiedMessages[0].content[0].text, 'Compare these images:');
    t.true(modifiedMessages[0].content[1].source.type === 'base64');
    t.is(modifiedMessages[0].content[2].text, 'with this one:');
    t.true(modifiedMessages[0].content[3].source.type === 'base64');
});
// Test conversation history with mixed image types: alternating turns where
// one user message carries an inline data URL and another carries a GCS URI.
test('Conversation history with mixed image types', async (t) => {
    const { claude, gemini15 } = createPlugins();
    const conversationHistory = [
        { role: 'system', content: 'You are a visual analysis assistant.' },
        { role: 'user', content: [
            { type: 'text', text: 'What\'s in this image?' },
            { type: 'image_url', image_url: { url: sampleBase64Image } }
        ]},
        { role: 'assistant', content: 'I see a landscape.' },
        { role: 'user', content: [
            { type: 'text', text: 'Compare it with this:' },
            { type: 'image_url', gcs: 'gs://cortex-bucket/image2.jpg' }
        ]},
        { role: 'assistant', content: 'The second image shows a different scene.' },
        { role: 'user', content: 'Which one do you prefer?' }
    ];
    // Test Claude conversion: system hoisted, 5 alternating turns remain.
    const { system: claudeSystem, modifiedMessages: claudeMessages } = await claude.convertMessagesToClaudeVertex(conversationHistory);
    t.is(claudeSystem, 'You are a visual analysis assistant.');
    t.is(claudeMessages.length, 5);
    t.is(claudeMessages[1].content[0].text, 'I see a landscape.');
    t.is(claudeMessages[3].content[0].text, 'The second image shows a different scene.');
    t.is(claudeMessages[4].content[0].text, 'Which one do you prefer?');
    // Test Gemini 1.5 conversion: data URL -> inlineData, GCS URI -> fileData.
    const { system: geminiSystem15, modifiedMessages: geminiMessages15 } = gemini15.convertMessagesToGemini(conversationHistory);
    t.is(geminiSystem15.parts[0].text, 'You are a visual analysis assistant.');
    t.is(geminiMessages15.length, 5);
    t.true('inlineData' in geminiMessages15[0].parts[1]);
    t.is(geminiMessages15[1].parts[0].text, 'I see a landscape.');
    t.true('fileData' in geminiMessages15[2].parts[1]);
    t.is(geminiMessages15[2].parts[1].fileData.fileUri, 'gs://cortex-bucket/image2.jpg');
    t.is(geminiMessages15[3].parts[0].text, 'The second image shows a different scene.');
    t.is(geminiMessages15[4].parts[0].text, 'Which one do you prefer?');
});
// Test handling of large images: a >10MB data URL must not crash either
// converter. Only the text part is asserted — the image may be rejected,
// dropped, or passed through per each model's own limits.
test('Large image handling', async (t) => {
    const { claude, gemini15 } = createPlugins();
    // Create a large base64 string (>10MB); the payload is not valid JPEG
    // data, it only exercises size handling.
    const largeSampleImage = 'data:image/jpeg;base64,' + 'A'.repeat(10 * 1024 * 1024);
    const largeImageMessage = [
        { role: 'user', content: [
            { type: 'text', text: 'Check this large image:' },
            { type: 'image_url', image_url: { url: largeSampleImage } }
        ]}
    ];
    // Both Claude and Gemini should handle or reject oversized images gracefully
    const { modifiedMessages: claudeMessages } = await claude.convertMessagesToClaudeVertex(largeImageMessage);
    const { modifiedMessages: geminiMessages } = gemini15.convertMessagesToGemini(largeImageMessage);
    // Verify both models handle the oversized image appropriately
    // (The exact behavior - rejection vs. compression - should match the model's specifications)
    t.is(claudeMessages[0].content[0].text, 'Check this large image:');
    t.is(geminiMessages[0].parts[0].text, 'Check this large image:');
});