// Package: zon-format
// Version: (not specified)
// ZON: The most token-efficient serialization format for LLMs - beats CSV, TOON, JSON, and all competitors
// 49 lines (48 loc) • 1.35 kB
// Language: TypeScript
/**
* Core ZON LLM Evaluation Framework
*
* Provides automated testing and regression detection for LLM interactions.
*/
import type { EvalConfig, EvalResult, Regression } from './types';
/**
* Main evaluation engine for ZON LLM testing.
*
* This is an ambient (`declare`) class: only the type surface is described
* here, not the implementation. The public surface consists of
* `registerMetric`, `run` and `compare`. Members marked `private` appear by
* name only; their types and signatures are not part of this declaration.
*/
export declare class ZonEvaluator {
/**
* Internal metric storage. Its type is not visible in this declaration;
* presumably it holds the metrics passed to `registerMetric` (confirm
* against the implementation).
*/
private metrics;
/**
* Creates an evaluator. Takes no arguments.
*/
constructor();
/**
* Register a metric for use in evaluations.
*
* NOTE(review): `metric` is typed `any`, so the compiler does not check its
* shape at call sites. The expected metric interface is not visible in this
* declaration; consider narrowing the type in the source module.
*
* @param name - Name under which the metric is registered
* @param metric - The metric to register (unchecked, see note above)
*/
registerMetric(name: string, metric: any): void;
/**
* Run an evaluation with the given configuration.
*
* Asynchronous: the result is delivered through the returned promise.
*
* @param config - Evaluation configuration
* @returns Promise resolving to the evaluation results
*/
run(config: EvalConfig): Promise<EvalResult>;
/**
* Evaluates a single dataset against a model.
*
* Private helper; its signature is not exposed by this declaration.
*/
private evaluateDataset;
/**
* Compare current results with baseline to detect regressions.
*
* Asynchronous: the list is delivered through the returned promise.
*
* @param baseline - Baseline evaluation result
* @param current - Current evaluation result
* @returns Promise resolving to the list of detected regressions
*/
compare(baseline: EvalResult, current: EvalResult): Promise<Regression[]>;
/**
* Check if results meet configured thresholds.
*
* Private helper; its signature is not exposed by this declaration.
*/
private checkThresholds;
/**
* Determine severity of a regression based on magnitude.
*
* Private helper; its signature is not exposed by this declaration.
*/
private determineSeverity;
}
/**
* Global evaluator instance.
*
* Exported as a `const` binding of type `ZonEvaluator`. Presumably intended
* as a shared default instance; where it is constructed is not visible in
* this declaration (confirm against the implementation).
*/
export declare const globalEvaluator: ZonEvaluator;