@future-agi/ai-evaluation

Version:

We help GenAI teams maintain high accuracy for their models in production.

67 lines • 2.56 kB

TypeScript

import { APIKeyAuth, ResponseHandler } from '@future-agi/sdk';
import { AxiosResponse } from 'axios';
import { EvalTemplate } from './templates';
import { BatchRunResult } from './types';
/**
 * Handles responses for evaluation requests.
 *
 * Specializes `ResponseHandler` from `@future-agi/sdk` with `BatchRunResult`
 * as its first type argument.
 * NOTE(review): the second type argument is `any`; its meaning is defined by
 * the SDK and is not visible in this declaration file.
 */
export declare class EvalResponseHandler extends ResponseHandler<BatchRunResult, any> {
    /**
     * Success-path parser: turns an Axios response into a `BatchRunResult`.
     * @param response - The Axios response to parse.
     * @returns The parsed batch result.
     */
    static _parseSuccess(response: AxiosResponse): BatchRunResult;
    /**
     * Error-path handler. Typed as returning `never`, so it does not return
     * normally (presumably it throws; the implementation is not visible here).
     * @param response - The Axios response describing the failure.
     */
    static _handleError(response: AxiosResponse): never;
}
/**
 * Handles responses for evaluation info requests.
 *
 * Specializes `ResponseHandler` with a string-keyed record of untyped values
 * as its first type argument.
 */
export declare class EvalInfoResponseHandler extends ResponseHandler<Record<string, any>, any> {
    /**
     * Success-path parser: turns an Axios response into a string-keyed record.
     * @param response - The Axios response to parse.
     * @returns The parsed record; its value types are not constrained (`any`).
     */
    static _parseSuccess(response: AxiosResponse): Record<string, any>;
    /**
     * Error-path handler. Typed as returning `never`, so it does not return
     * normally (presumably it throws; the implementation is not visible here).
     * @param response - The Axios response describing the failure.
     */
    static _handleError(response: AxiosResponse): never;
}
/**
 * Client for evaluating LLM test cases.
 *
 * Extends `APIKeyAuth` from `@future-agi/sdk`.
 */
export declare class Evaluator extends APIKeyAuth {
    // Private members are declared without types here, so their shapes and
    // semantics cannot be read from this file.
    private readonly maxWorkers;
    private evalInfoCache;
    /**
     * Creates an evaluator client.
     * @param options - Optional settings object; every field in it is optional.
     *   NOTE(review): field semantics, units (e.g. of `timeout`) and defaults
     *   are defined by the implementation and are not visible here. Presumably
     *   `fiApiKey` / `fiSecretKey` / `fiBaseUrl` configure API access; confirm.
     */
    constructor(options?: {
        fiApiKey?: string;
        fiSecretKey?: string;
        fiBaseUrl?: string;
        timeout?: number;
        maxQueue?: number;
        maxWorkers?: number;
    });
    /**
     * Runs one or more evaluations against the given inputs.
     * @param evalTemplates - A template name, an `EvalTemplate`, or an array
     *   mixing names and `EvalTemplate` values.
     * @param inputs - Dictionary whose values are a string or a list of strings.
     * @param options - Evaluation parameters. The object itself is required
     *   because `modelName` is required; all other fields are optional.
     * @returns A promise resolving to a `BatchRunResult`.
     */
    evaluate(evalTemplates: string | EvalTemplate | (string | EvalTemplate)[], inputs: Record<string, string | string[]>, options: {
        timeout?: number;
        modelName: string;
        customEvalName?: string;
        traceEval?: boolean;
    }): Promise<BatchRunResult>;
    // Private helper; its signature is not exposed by this declaration.
    private _get_eval_info;
    /**
     * Resolves to an array of string-keyed records.
     * NOTE(review): presumably one record per available evaluation template,
     * matching the exported `list_evaluations` function; confirm.
     * @returns A promise resolving to the list of records.
     */
    list_evaluations(): Promise<Record<string, any>[]>;
}
/**
 * Convenience function to run a single or batch of evaluations.
 * @param evalTemplates - Evaluation name string (e.g., "Factual Accuracy"), an
 *   `EvalTemplate`, or a list mixing names and templates.
 * @param inputs - Test-case inputs as a dictionary whose values are a string
 *   or a list of strings.
 *   NOTE(review): this was previously documented as also accepting a list of
 *   test cases, but the declared type accepts only a single dictionary;
 *   presumably list-valued fields carry the batch. Confirm.
 * @param options - Parameters for the evaluation. The object is required
 *   because `modelName` is required; all other fields are optional.
 * @returns A promise resolving to a `BatchRunResult` containing evaluation
 *   results.
 */
export declare const evaluate: (evalTemplates: string | EvalTemplate | (string | EvalTemplate)[], inputs: Record<string, string | string[]>, options: {
    fiApiKey?: string;
    fiSecretKey?: string;
    fiBaseUrl?: string;
    timeout?: number;
    modelName: string;
    customEvalName?: string;
    traceEval?: boolean;
}) => Promise<BatchRunResult>;
/**
 * Convenience function to fetch information about all available evaluation
 * templates.
 * @param options - Optional settings object; every field in it is optional.
 *   NOTE(review): presumably API credentials and a base-URL override; confirm.
 * @returns A promise resolving to a list of evaluation template information
 *   dictionaries.
 */
export declare const list_evaluations: (options?: {
    fiApiKey?: string;
    fiSecretKey?: string;
    fiBaseUrl?: string;
}) => Promise<Record<string, any>[]>;
//# sourceMappingURL=evaluator.d.ts.map