UNPKG

zon-format

Version:

ZON: The most token-efficient serialization format for LLMs - beats CSV, TOON, JSON, and all competitors

49 lines (48 loc) 1.35 kB
/**
 * Core ZON LLM Evaluation Framework
 *
 * Type declarations for the evaluation engine, which offers automated
 * testing and regression detection for LLM interactions.
 */
import type { EvalConfig, EvalResult, Regression } from './types';

/**
 * Main evaluation engine for ZON LLM testing.
 *
 * Only the public surface is typed here; private members are listed by
 * name without types, so their shapes cannot be determined from this file.
 */
export declare class ZonEvaluator {
  /** Creates an evaluator; the constructor takes no arguments. */
  constructor();

  /**
   * Registers a metric so it can be used in evaluations.
   *
   * @param name - Name under which the metric is registered.
   * @param metric - The metric to register. Declared as `any`, so the
   *   expected shape is not checked by the compiler.
   *   NOTE(review): confirm the required metric contract against the
   *   implementation.
   */
  registerMetric(name: string, metric: any): void;

  /**
   * Runs an evaluation using the supplied configuration.
   *
   * @param config - Evaluation configuration.
   * @returns A promise resolving to the evaluation results.
   */
  run(config: EvalConfig): Promise<EvalResult>;

  /**
   * Compares the current results against a baseline to detect regressions.
   *
   * @param baseline - Baseline evaluation result.
   * @param current - Current evaluation result.
   * @returns A promise resolving to the list of detected regressions.
   */
  compare(baseline: EvalResult, current: EvalResult): Promise<Regression[]>;

  /** Storage for registered metrics (type not exposed in this declaration). */
  private metrics;

  /** Evaluates a single dataset against a model. */
  private evaluateDataset;

  /** Checks whether results meet the configured thresholds. */
  private checkThresholds;

  /** Determines the severity of a regression based on its magnitude. */
  private determineSeverity;
}

/**
 * Global evaluator instance.
 */
export declare const globalEvaluator: ZonEvaluator;