UNPKG

@llumiverse/drivers

Version:

LLM driver implementations. Currently supported are: openai, huggingface, bedrock, replicate.

github.com/vertesia/llumiverse

vertesia/llumiverse

261 lines • 9.93 kB

JavaScript

import { ModelType, PromptRole, readStreamAsBase64 } from "@llumiverse/core";
import { asyncMap } from "@llumiverse/core/async";

/** Image MIME types accepted when building `image` content blocks. */
const SUPPORTED_IMAGE_TYPES = ["image/png", "image/jpeg", "image/gif", "image/webp"];

/** Value of `model_options._option_id` that this model definition expects. */
const EXPECTED_OPTION_ID = "vertexai-claude";

/** Thinking budget used when thinking is enabled without an explicit budget. */
const DEFAULT_THINKING_BUDGET_TOKENS = 1024;

/**
 * Map a Claude stop reason to the finish reason reported to callers.
 *
 * @param {string|undefined|null} reason - Stop reason from the Claude response.
 * @returns {string|undefined} "stop" for `end_turn`, "length" for `max_tokens`,
 *   `undefined` for an empty reason, otherwise the reason unchanged.
 */
function claudeFinishReason(reason) {
    if (!reason) {
        return undefined;
    }
    switch (reason) {
        case 'end_turn':
            return "stop";
        case 'max_tokens':
            return "length";
        default:
            return reason; // e.g. stop_sequence
    }
}

/**
 * Join the `text` of every content block that has one, separated by newlines.
 *
 * @param {Array<object>} content - Content blocks of a response.
 * @returns {string} The concatenated text ('' when no block carries text).
 */
function collectTextParts(content) {
    const out = [];
    for (const block of content) {
        if (block?.text) {
            out.push(block.text);
        }
    }
    return out.join('\n');
}

/**
 * Resolve the `max_tokens` value to send.
 *
 * @param {number|undefined} max_tokens - Caller supplied limit; any falsy value
 *   (including 0) selects the default.
 * @param {string} model - Model name.
 * @returns {number} The caller's limit, or 8192 when the model name contains
 *   "claude-3-5", or 4096 otherwise.
 */
function maxToken(max_tokens, model) {
    if (max_tokens) {
        return max_tokens;
    }
    return model.includes("claude-3-5") ? 8192 : 4096;
}

/**
 * Append content blocks for the files attached to a prompt segment.
 *
 * Files with an `image/*` MIME type become base64 `image` blocks; files with a
 * `text/*` MIME type become plain-text `document` blocks. Other files are ignored.
 *
 * @param {object} segment - Prompt segment; `segment.files` may be absent.
 * @param {Array<object>} contentBlocks - Array the new blocks are pushed onto.
 * @returns {Promise<void>} Resolves once every file has been read and appended.
 * @throws {Error} When an image file has a MIME type outside SUPPORTED_IMAGE_TYPES.
 */
async function collectImageBlocks(segment, contentBlocks) {
    for (const file of segment.files || []) {
        const mimeType = file.mime_type;
        if (mimeType?.startsWith("image/")) {
            if (!SUPPORTED_IMAGE_TYPES.includes(mimeType)) {
                throw new Error(`Unsupported image type: ${mimeType}`);
            }
            contentBlocks.push({
                type: 'image',
                source: {
                    type: 'base64',
                    data: await readStreamAsBase64(await file.getStream()),
                    media_type: String(mimeType),
                },
            });
        } else if (mimeType?.startsWith("text/")) {
            // A document source of type 'text' carries the text itself, not a
            // base64 payload, so decode what readStreamAsBase64 produced.
            const encoded = await readStreamAsBase64(await file.getStream());
            contentBlocks.push({
                type: 'document',
                source: {
                    type: 'text',
                    data: Buffer.from(encoded, 'base64').toString('utf8'),
                    media_type: 'text/plain',
                },
            });
        }
    }
}

/**
 * Return the last "/"-separated component of a model identifier.
 *
 * @param {string} model - Model identifier, possibly a path.
 * @returns {string} The final path component.
 */
function resolveModelName(model) {
    const parts = model.split("/");
    return parts[parts.length - 1];
}

/**
 * Log a warning when the model options were not built for this model definition.
 *
 * @param {object} driver - Driver exposing `logger.warn`.
 * @param {object|undefined} modelOptions - The `model_options` of the request.
 */
function warnOnUnexpectedOptions(driver, modelOptions) {
    if (modelOptions?._option_id !== EXPECTED_OPTION_ID) {
        driver.logger.warn("Invalid model options", { options: modelOptions });
    }
}

/**
 * Build the payload shared by the blocking and the streaming message calls.
 *
 * @param {object} base - Object spread first into the payload (messages, system).
 * @param {object} options - Execution options (`tools`, `model_options`).
 * @param {string} modelName - Model name as returned by resolveModelName.
 * @returns {object} Payload for `client.messages.create` / `client.messages.stream`.
 */
function buildRequestPayload(base, options, modelName) {
    const modelOptions = options.model_options;
    return {
        ...base, // messages, system
        tools: options.tools, // we are using the same shape as claude for tools
        temperature: modelOptions?.temperature,
        model: modelName,
        max_tokens: maxToken(modelOptions?.max_tokens, modelName),
        top_p: modelOptions?.top_p,
        top_k: modelOptions?.top_k,
        stop_sequences: modelOptions?.stop_sequence,
        thinking: modelOptions?.thinking_mode
            ? {
                budget_tokens: modelOptions?.thinking_budget_tokens ?? DEFAULT_THINKING_BUDGET_TOKENS,
                type: "enabled",
            }
            : { type: "disabled" },
    };
}

/**
 * Model definition that sends prompts to Claude through the driver's Anthropic client.
 */
export class ClaudeModelDefinition {
    model;

    /**
     * @param {string} modelId - Used as both the id and the name of the model.
     */
    constructor(modelId) {
        this.model = {
            id: modelId,
            name: modelId,
            provider: 'vertexai',
            type: ModelType.Text,
            can_stream: true,
        };
    }

    /**
     * Convert prompt segments to the `{ messages, system }` shape used by the Claude API.
     *
     * System segments come first in `system`, followed by safety segments and,
     * when `options.result_schema` is set, an instruction to answer with JSON
     * matching that schema. Tool segments become `tool_result` user messages;
     * every other segment becomes a user or assistant message.
     *
     * @param {object} _driver - Unused.
     * @param {Array<object>} segments - Prompt segments.
     * @param {object} options - Execution options; `result_schema` is read.
     * @returns {Promise<{messages: Array<object>, system: Array<object>}>}
     * @throws {Error} When a tool segment has no `tool_use_id`, or an attached
     *   image has an unsupported MIME type.
     */
    async createPrompt(_driver, segments, options) {
        const toTextBlock = (segment) => ({ text: segment.content, type: 'text' });
        const systemSegments = segments
            .filter((segment) => segment.role === PromptRole.system)
            .map(toTextBlock);
        const safetySegments = segments
            .filter((segment) => segment.role === PromptRole.safety)
            .map(toTextBlock);
        if (options.result_schema) {
            safetySegments.push({
                text: "The answer must be a JSON object using the following JSON Schema:\n" + JSON.stringify(options.result_schema),
                type: 'text',
            });
        }

        const messages = [];
        for (const segment of segments) {
            if (segment.role === PromptRole.system || segment.role === PromptRole.safety) {
                continue;
            }
            if (segment.role === PromptRole.tool) {
                if (!segment.tool_use_id) {
                    throw new Error("Tool prompt segment must have a tool_use_id");
                }
                const fileBlocks = [];
                await collectImageBlocks(segment, fileBlocks);
                messages.push({
                    role: 'user',
                    content: [{
                        type: 'tool_result',
                        tool_use_id: segment.tool_use_id,
                        content: [{ type: 'text', text: segment.content || '' }, ...fileBlocks],
                    }],
                });
            } else {
                const contentBlocks = [];
                // Must be awaited: otherwise the attachments are appended at some
                // later time (after the text block, possibly after the request was
                // sent) and a rejected read becomes an unhandled rejection.
                await collectImageBlocks(segment, contentBlocks);
                if (segment.content) {
                    contentBlocks.push({ type: 'text', text: segment.content });
                }
                messages.push({
                    role: segment.role === PromptRole.assistant ? 'assistant' : 'user',
                    content: contentBlocks,
                });
            }
        }

        return {
            messages: messages,
            system: systemSegments.concat(safetySegments),
        };
    }

    /**
     * Run a non-streaming completion and return the result with the updated conversation.
     *
     * @param {object} driver - Driver exposing `getAnthropicClient()` and `logger`.
     * @param {object} prompt - Prompt as produced by createPrompt.
     * @param {object} options - Execution options (`model`, `model_options`,
     *   `tools`, `conversation`).
     * @returns {Promise<object>} Completion with `chat`, `result`, `tool_use`,
     *   `token_usage`, `finish_reason` and `conversation`.
     */
    async requestTextCompletion(driver, prompt, options) {
        const client = driver.getAnthropicClient();
        const modelName = resolveModelName(options.model);
        warnOnUnexpectedOptions(driver, options.model_options);

        let conversation = updateConversation(options.conversation, prompt);
        const result = await client.messages.create(buildRequestPayload(conversation, options, modelName));

        const text = collectTextParts(result.content);
        const tool_use = collectTools(result.content);
        conversation = updateConversation(conversation, createPromptFromResponse(result));

        return {
            chat: [prompt, { role: result.role, content: result.content }],
            result: text ?? '',
            tool_use,
            token_usage: {
                prompt: result?.usage.input_tokens,
                result: result?.usage.output_tokens,
                total: result?.usage.input_tokens + result?.usage.output_tokens,
            },
            // make sure we set finish_reason to the correct value (claude is normally setting this by itself)
            finish_reason: tool_use ? "tool_use" : claudeFinishReason(result?.stop_reason ?? ''),
            conversation,
        };
    }

    /**
     * Run a streaming completion.
     *
     * The request is built from `prompt` alone; `options.conversation` is not read here.
     *
     * @param {object} driver - Driver exposing `getAnthropicClient()` and `logger`.
     * @param {object} prompt - Prompt as produced by createPrompt.
     * @param {object} options - Execution options (`model`, `model_options`, `tools`).
     * @returns {Promise<object>} The result of `asyncMap` over the response
     *   stream, yielding one `{ result, token_usage, finish_reason }` chunk per event.
     */
    async requestTextCompletionStream(driver, prompt, options) {
        const client = driver.getAnthropicClient();
        const modelName = resolveModelName(options.model);
        warnOnUnexpectedOptions(driver, options.model_options);

        const response_stream = await client.messages.stream(buildRequestPayload(prompt, options, modelName));

        return asyncMap(response_stream, async (item) => {
            if (item.type === "message_start") {
                // The first event carries the usage of the message being started.
                return {
                    result: '',
                    token_usage: {
                        prompt: item?.message?.usage?.input_tokens,
                        result: item?.message?.usage?.output_tokens,
                    },
                    finish_reason: undefined,
                };
            }
            return {
                result: item?.delta?.text ?? '',
                token_usage: { result: item?.usage?.output_tokens },
                finish_reason: claudeFinishReason(item?.delta?.stop_reason ?? ''),
            };
        });
    }
}

/**
 * Extract the tool invocations from response content blocks.
 *
 * @param {Array<object>} content - Content blocks of a response.
 * @returns {Array<{id: *, tool_name: *, tool_input: *}>|undefined} One entry per
 *   `tool_use` block, or `undefined` when there is none.
 */
export function collectTools(content) {
    const out = [];
    for (const block of content) {
        if (block?.type === "tool_use") {
            out.push({
                id: block.id,
                tool_name: block.name,
                tool_input: block.input,
            });
        }
    }
    return out.length > 0 ? out : undefined;
}

/**
 * Wrap a response as a prompt holding a single assistant message.
 *
 * @param {object} response - Response whose `content` becomes the message content.
 * @returns {{messages: Array<object>, system: Array<object>}}
 */
function createPromptFromResponse(response) {
    return {
        messages: [{
            role: PromptRole.assistant,
            content: response.content,
        }],
        system: [],
    };
}

/**
 * Append a prompt to a conversation, returning a new conversation object.
 *
 * @param {{messages?: Array<object>, system?: Array<object>}|undefined|null} conversation
 *   Existing conversation; missing parts are treated as empty.
 * @param {{messages?: Array<object>, system?: Array<object>}} prompt
 *   Prompt whose messages and system blocks are appended.
 * @returns {{messages: Array<object>, system: Array<object>}}
 */
function updateConversation(conversation, prompt) {
    const baseSystemMessages = conversation?.system ?? [];
    const baseMessages = conversation?.messages ?? [];
    return {
        messages: baseMessages.concat(prompt.messages || []),
        system: baseSystemMessages.concat(prompt.system || []),
    };
}
//# sourceMappingURL=claude.js.map