UNPKG

documind2

Version:
89 lines (79 loc) 2.56 kB
import axios from "axios"; import type { CompletionArgs, CompletionResponse } from "./types"; import { convertKeysToSnakeCase, encodeImageToBase64 } from "./utils"; export const getCompletion = async ({ apiKey, imagePath, llmParams, maintainFormat, model, priorPage, }: CompletionArgs): Promise<CompletionResponse> => { const validModelsForCustomBaseUrl = ["llava", "llama3.2-vision"]; const validModelsForOpenAi = ["gpt-4o", "gpt-4o-mini"]; const baseUrl = process.env.BASE_URL || "https://api.openai.com/v1"; if (baseUrl !== "https://api.openai.com/v1") { if (!validModelsForCustomBaseUrl.includes(model as any)) { throw new Error( `Invalid model "${model}" for custom base URL. Valid options are: ${validModelsForCustomBaseUrl.join(", ")}.`, ); } } else { if (!validModelsForOpenAi.includes(model as any)) { throw new Error( `Invalid model "${model}" for OpenAI. Valid options are: ${validModelsForOpenAi.join(", ")}.`, ); } } const systemPrompt = ` Convert the following image/document to markdown. Return only the markdown with no explanation text. Do not include deliminators like '''markdown. You must include all information on the page. Do not exclude headers, footers, or subtext. `; // Default system message. const messages: any = [{ role: "system", content: systemPrompt }]; // If content has already been generated, add it to context. // This helps maintain the same format across pages if (maintainFormat && priorPage && priorPage.length) { messages.push({ role: "system", content: `Markdown must maintain consistent formatting with the following page: \n\n """${priorPage}"""`, }); } // Add Image to request const base64Image = await encodeImageToBase64(imagePath); messages.push({ role: "user", content: [ { type: "image_url", image_url: { url: `data:image/png;base64,${base64Image}` }, }, ], }); try { const response = await axios.post( `${baseUrl}/chat/completions`, { messages, model, ...convertKeysToSnakeCase(llmParams ?? null), }, { headers: { Authorization: `Bearer ${apiKey}`, "Content-Type": "application/json", }, }, ); const data = response.data; return { content: data.choices[0].message.content, inputTokens: data.usage.prompt_tokens, outputTokens: data.usage.completion_tokens, }; } catch (err) { console.error("Error in OpenAI completion", err); throw err; } };