UNPKG

llamaindex

Version:

<p align="center"> <img height="100" width="100" alt="LlamaIndex logo" src="https://ts.llamaindex.ai/square.svg" /> </p> <h1 align="center">LlamaIndex.TS</h1> <h3 align="center"> Data framework for your LLM application. </h3>

86 lines (85 loc) 2.91 kB
import { PromptMixin } from "@llamaindex/core/prompts"; import { MetadataMode } from "@llamaindex/core/schema"; import { extractText } from "@llamaindex/core/utils"; import { Settings } from "../Settings.js"; import { defaultCorrectnessSystemPrompt, defaultUserPrompt } from "./prompts.js"; import { defaultEvaluationParser } from "./utils.js"; /** Correctness Evaluator */ export class CorrectnessEvaluator extends PromptMixin { scoreThreshold; parserFunction; llm; correctnessPrompt = defaultCorrectnessSystemPrompt; constructor(params){ super(); this.llm = Settings.llm; this.correctnessPrompt = defaultCorrectnessSystemPrompt; this.scoreThreshold = params?.scoreThreshold ?? 4.0; this.parserFunction = params?.parserFunction ?? defaultEvaluationParser; } _getPrompts() { return { correctnessPrompt: this.correctnessPrompt }; } _getPromptModules() { return {}; } _updatePrompts(prompts) { if ("correctnessPrompt" in prompts) { this.correctnessPrompt = prompts["correctnessPrompt"]; } } /** * * @param query Query to evaluate * @param response Response to evaluate * @param contexts Array of contexts * @param reference Reference response */ async evaluate({ query, response, contexts, reference }) { if (query === null || response === null) { throw new Error("query, and response must be provided"); } const messages = [ { role: "system", content: this.correctnessPrompt.format() }, { role: "user", content: defaultUserPrompt.format({ query: extractText(query), generatedAnswer: response, referenceAnswer: reference || "(NO REFERENCE ANSWER SUPPLIED)" }) } ]; const evalResponse = await this.llm.chat({ messages }); const [score, reasoning] = this.parserFunction(extractText(evalResponse.message.content)); return { query: query, response: response, passing: score >= this.scoreThreshold || score === null, score: score, feedback: reasoning }; } /** * @param query Query to evaluate * @param response Response to evaluate */ async evaluateResponse({ query, response }) { const responseStr = extractText(response?.message.content); const contexts = []; if (response) { for (const node of response.sourceNodes || []){ contexts.push(node.node.getContent(MetadataMode.ALL)); } } return this.evaluate({ query, response: responseStr, contexts }); } }