@llumiverse/drivers
Version:
LLM driver implementations. Currently supported are: openai, huggingface, bedrock, replicate.
55 lines (44 loc) • 1.47 kB
text/typescript
import { EmbeddingsResult } from '@llumiverse/core';
import { VertexAIDriver } from '../index.js';
/**
 * Options for generating embeddings for a single text via Vertex AI.
 * Besides the driver-level `model` override, the fields mirror one
 * request "instance" of the `:predict` text-embeddings endpoint.
 */
export interface TextEmbeddingsOptions {
    // Model id to use; when omitted the driver falls back to its default.
    model?: string;
    // Downstream use of the embedding; passed through to the API as-is.
    task_type?: "RETRIEVAL_QUERY" | "RETRIEVAL_DOCUMENT" | "SEMANTIC_SIMILARITY" | "CLASSIFICATION" | "CLUSTERING",
    title?: string, // the title for the embedding
    content: string // the text to generate embeddings for
}
// Request body for the `:predict` endpoint: one entry in `instances`
// per text to embed (this module always sends exactly one).
interface EmbeddingsForTextPrompt {
    instances: TextEmbeddingsOptions[]
}
/**
 * Raw response shape of the Vertex AI text-embeddings `:predict` call.
 * The endpoint returns one prediction per request instance, so
 * `predictions` is modeled as an array. (The previous type `[{...}]`
 * was a one-element *tuple*, which only held because this module sends
 * a single instance.)
 */
interface TextEmbeddingsResult {
    predictions: {
        embeddings: TextEmbeddings
    }[]
}
/**
 * Embedding payload inside each prediction. Field names use snake_case
 * to match the wire format returned by the API.
 */
interface TextEmbeddings {
    statistics: {
        // NOTE(review): presumably true when the input was truncated to the
        // model's token limit — confirm against the API docs.
        truncated: boolean,
        token_count: number
    },
    // Fixed: `[number]` was a one-element tuple type; an embedding is a
    // full vector of numbers.
    values: number[]
}
/**
 * Generate embeddings for a single text using a Vertex AI embeddings model.
 *
 * @param driver - the VertexAI driver supplying the authenticated fetch client
 * @param options - the text content plus optional model, task type and title
 * @returns the first prediction's embeddings (values + statistics) augmented
 *          with the model id and a top-level `token_count`
 * @throws Error when the API response contains no predictions
 */
export async function getEmbeddingsForText(driver: VertexAIDriver, options: TextEmbeddingsOptions): Promise<EmbeddingsResult> {
    const prompt = {
        instances: [{
            task_type: options.task_type,
            title: options.title,
            content: options.content
        }]
    } satisfies EmbeddingsForTextPrompt;
    // Default model; callers may override via options.model.
    const model = options.model || "gemini-embedding-001";
    const client = driver.getFetchClient();
    const result = await client.post(`/publishers/google/models/${model}:predict`, {
        payload: prompt
    }) as TextEmbeddingsResult;
    // Guard against an empty/malformed response rather than failing with an
    // opaque TypeError on `predictions[0]` below.
    const prediction = result.predictions?.[0];
    if (!prediction) {
        throw new Error(`No embeddings returned by model ${model}`);
    }
    return {
        ...prediction.embeddings,
        model,
        token_count: prediction.embeddings.statistics?.token_count
    };
}