
@llumiverse/core


Provides a universal API to LLMs. Support for additional LLMs can be added by writing a driver.
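The streaming helpers in CompletionStream.js below hint at the surface a driver must expose: every property the file reads on this.driver is part of that contract (a logger, a provider name, requestTextCompletionStream() for streaming, _execute() for blocking execution, and validateResult()). As a rough sketch inferred from those call sites only — the authoritative contract is the package's TypeScript driver interface, and the EchoDriver name and method bodies here are purely illustrative:

// Hypothetical minimal driver shape, inferred from the calls made in
// CompletionStream.js below. Real drivers implement the package's
// driver interface; this echo driver exists only to show the shape.
class EchoDriver {
    provider = 'echo'; // used as the prefix in debug log messages
    logger = console;  // must expose debug()

    // Streaming entry point: returns an async iterable yielding plain
    // strings and/or chunk objects carrying result/finish_reason/token_usage.
    async requestTextCompletionStream(prompt, _options) {
        async function* stream() {
            yield { result: [{ type: 'text', value: String(prompt) }] };
            yield { finish_reason: 'stop', token_usage: { prompt: 1, result: 1 } };
        }
        return stream();
    }

    // Blocking entry point used by FallbackCompletionStream.
    async _execute(prompt, _options) {
        return { result: [{ type: 'text', value: String(prompt) }], finish_reason: 'stop' };
    }

    // Hook for validating the final completion; a no-op in this sketch.
    validateResult(_completion, _options) { }
}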

CompletionStream.js — 174 lines, 8.95 kB
export class DefaultCompletionStream {
    driver;
    prompt;
    options;
    chunks; // Counter for number of chunks instead of storing strings
    completion;

    constructor(driver, prompt, options) {
        this.driver = driver;
        this.prompt = prompt;
        this.options = options;
        this.chunks = 0;
    }

    async *[Symbol.asyncIterator]() {
        // reset state
        this.completion = undefined;
        this.chunks = 0;
        const accumulatedResults = []; // Accumulate CompletionResult[] from chunks
        this.driver.logger.debug(`[${this.driver.provider}] Streaming Execution of ${this.options.model} with prompt`);
        const start = Date.now();
        let finish_reason = undefined;
        let promptTokens = 0;
        let resultTokens = undefined;
        try {
            const stream = await this.driver.requestTextCompletionStream(this.prompt, this.options);
            for await (const chunk of stream) {
                if (chunk) {
                    if (typeof chunk === 'string') {
                        this.chunks++;
                        yield chunk;
                    }
                    else {
                        if (chunk.finish_reason) {
                            // Do not replace non-null values with null values.
                            // Used to skip empty finish_reason chunks coming after "stop" or "length".
                            finish_reason = chunk.finish_reason;
                        }
                        if (chunk.token_usage) {
                            // Tokens returned include prior parts of the stream,
                            // so overwrite rather than accumulate.
                            // Math.max used as some models report the final token count at the beginning of the stream.
                            promptTokens = Math.max(promptTokens, chunk.token_usage.prompt ?? 0);
                            resultTokens = Math.max(resultTokens ?? 0, chunk.token_usage.result ?? 0);
                        }
                        if (Array.isArray(chunk.result) && chunk.result.length > 0) {
                            // Process each result in the chunk, combining consecutive text/JSON
                            for (const result of chunk.result) {
                                // Check if we can combine with the last accumulated result
                                const lastResult = accumulatedResults[accumulatedResults.length - 1];
                                if (lastResult &&
                                    ((lastResult.type === 'text' && result.type === 'text') ||
                                        (lastResult.type === 'json' && result.type === 'json'))) {
                                    // Combine consecutive text or JSON results
                                    if (result.type === 'text') {
                                        lastResult.value += result.value;
                                    }
                                    else if (result.type === 'json') {
                                        // For JSON, combine the parsed objects directly
                                        try {
                                            const lastParsed = lastResult.value;
                                            const currentParsed = result.value;
                                            if (lastParsed !== null && typeof lastParsed === 'object' &&
                                                currentParsed !== null && typeof currentParsed === 'object') {
                                                const combined = { ...lastParsed, ...currentParsed };
                                                lastResult.value = combined;
                                            }
                                            else {
                                                // If not objects, convert to string and concatenate
                                                const lastStr = typeof lastParsed === 'string' ? lastParsed : JSON.stringify(lastParsed);
                                                const currentStr = typeof currentParsed === 'string' ? currentParsed : JSON.stringify(currentParsed);
                                                lastResult.value = lastStr + currentStr;
                                            }
                                        }
                                        catch {
                                            // If anything fails, just concatenate string representations
                                            lastResult.value = String(lastResult.value) + String(result.value);
                                        }
                                    }
                                }
                                else {
                                    // Add as new result
                                    accumulatedResults.push(result);
                                }
                            }
                            // Convert CompletionResult[] to string for streaming.
                            // Only yield if we have results to show.
                            const resultText = chunk.result.map(r => {
                                switch (r.type) {
                                    case 'text':
                                        return r.value;
                                    case 'json':
                                        return JSON.stringify(r.value);
                                    case 'image': {
                                        // Show truncated image placeholder for streaming
                                        const truncatedValue = typeof r.value === 'string'
                                            ? r.value.slice(0, 10)
                                            : String(r.value).slice(0, 10);
                                        return `\n[Image: ${truncatedValue}...]\n`;
                                    }
                                    default:
                                        return String(r.value || '');
                                }
                            }).join('');
                            if (resultText) {
                                this.chunks++;
                                yield resultText;
                            }
                        }
                    }
                }
            }
        }
        catch (error) {
            error.prompt = this.prompt;
            throw error;
        }
        // Return undefined for the ExecutionTokenUsage object if there is nothing to fill it with.
        // Allows checking truthiness of token_usage, rather than its internals, for testing and downstream usage.
        const tokens = resultTokens
            ? {
                prompt: promptTokens,
                result: resultTokens,
                total: resultTokens + promptTokens,
            }
            : undefined;
        this.completion = {
            result: accumulatedResults, // Return the accumulated CompletionResult[] instead of text
            prompt: this.prompt,
            execution_time: Date.now() - start,
            token_usage: tokens,
            finish_reason: finish_reason,
            chunks: this.chunks,
        };
        try {
            if (this.completion) {
                this.driver.validateResult(this.completion, this.options);
            }
        }
        catch (error) {
            error.prompt = this.prompt;
            throw error;
        }
    }
}

export class FallbackCompletionStream {
    driver;
    prompt;
    options;
    completion;

    constructor(driver, prompt, options) {
        this.driver = driver;
        this.prompt = prompt;
        this.options = options;
    }

    async *[Symbol.asyncIterator]() {
        // reset state
        this.completion = undefined;
        this.driver.logger.debug(`[${this.driver.provider}] Streaming is not supported, falling back to blocking execution`);
        try {
            const completion = await this.driver._execute(this.prompt, this.options);
            // For fallback streaming, yield the text content but keep the original completion
            const content = completion.result.map(r => {
                switch (r.type) {
                    case 'text':
                        return r.value;
                    case 'json':
                        return JSON.stringify(r.value);
                    case 'image': {
                        // Show truncated image placeholder for streaming
                        const truncatedValue = typeof r.value === 'string'
                            ? r.value.slice(0, 10)
                            : String(r.value).slice(0, 10);
                        return `[Image: ${truncatedValue}...]`;
                    }
                    default:
                        return String(r.value || '');
                }
            }).join('');
            yield content;
            this.completion = completion; // Return the original completion with untouched CompletionResult[]
        }
        catch (error) {
            error.prompt = this.prompt;
            throw error;
        }
    }
}
//# sourceMappingURL=CompletionStream.js.map
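Both classes are async iterables: iterating yields incremental text chunks, and once iteration finishes the accumulated result is available on the completion property. A minimal consumption sketch, assuming the hypothetical EchoDriver shown earlier and that DefaultCompletionStream is reachable from the package's root export:

import { DefaultCompletionStream } from '@llumiverse/core';

async function main() {
    const driver = new EchoDriver(); // hypothetical driver sketched above
    const stream = new DefaultCompletionStream(driver, 'Hello', { model: 'echo-1' });
    for await (const text of stream) {
        process.stdout.write(text); // incremental text rendered from each chunk
    }
    // After iteration completes, the accumulated completion is available:
    console.log(stream.completion.finish_reason); // 'stop'
    console.log(stream.completion.token_usage);   // { prompt: 1, result: 1, total: 2 }
    console.log(stream.completion.chunks);        // number of chunks actually yielded
}

main();

FallbackCompletionStream is consumed the same way; it simply performs one blocking _execute() call and yields the whole rendered text as a single chunk, so drivers without native streaming support still work behind the same iteration API.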