UNPKG

llmverify

Version:

AI Output Verification Toolkit — Local-first LLM safety, hallucination detection, PII redaction, prompt injection defense, and runtime monitoring. Zero telemetry. OWASP LLM Top 10 aligned.

124 lines 12.9 kB
"use strict"; /** * Baseline Engine * * Maintains and updates baseline metrics for drift detection. * Uses exponential moving average for stability. * * WHAT THIS DOES: * ✅ Tracks average latency, token rate, similarity * ✅ Maintains response fingerprint baseline * ✅ Uses EMA for smooth baseline updates * * WHAT THIS DOES NOT DO: * ❌ Persist baselines across sessions (in-memory only) * ❌ Account for intentional model changes * ❌ Distinguish normal variation from anomalies * * @module engines/runtime/baseline * @author Haiec * @license MIT */ Object.defineProperty(exports, "__esModule", { value: true }); exports.BaselineEngine = void 0; /** * Manages baseline state for LLM monitoring. * * @example * const baseline = new BaselineEngine(); * * // After each call * baseline.update(callRecord, fingerprint, similarity); * * // Get current baseline * const state = baseline.get(); */ class BaselineEngine { /** * Creates a new BaselineEngine. * * @param learningRate - EMA learning rate (0-1, default: 0.1) * @param minSamples - Minimum samples before baseline is stable (default: 5) */ constructor(learningRate = 0.1, minSamples = 5) { this.learningRate = Math.max(0.01, Math.min(1, learningRate)); this.minSamples = minSamples; this.baseline = { avgLatencyMs: 0, avgTokensPerSecond: 0, avgSimilarity: 0.85, fingerprint: {}, sampleCount: 0 }; } /** * Updates baseline with new call data. * * @param call - The call record * @param fingerprint - Response fingerprint * @param similarity - Similarity score (0-1) */ update(call, fingerprint, similarity = 1) { const alpha = this.learningRate; const tps = call.responseTokens / Math.max(call.latencyMs / 1000, 0.001); if (this.baseline.sampleCount === 0) { // First sample - initialize directly this.baseline.avgLatencyMs = call.latencyMs; this.baseline.avgTokensPerSecond = tps; this.baseline.fingerprint = fingerprint; this.baseline.avgSimilarity = similarity; } else { // EMA update this.baseline.avgLatencyMs = alpha * call.latencyMs + (1 - alpha) * this.baseline.avgLatencyMs; this.baseline.avgTokensPerSecond = alpha * tps + (1 - alpha) * this.baseline.avgTokensPerSecond; this.baseline.avgSimilarity = alpha * similarity + (1 - alpha) * this.baseline.avgSimilarity; // Update fingerprint with EMA if (this.baseline.fingerprint && 'tokens' in this.baseline.fingerprint) { const fp = this.baseline.fingerprint; this.baseline.fingerprint = { tokens: alpha * fingerprint.tokens + (1 - alpha) * fp.tokens, sentences: alpha * fingerprint.sentences + (1 - alpha) * fp.sentences, avgSentLength: alpha * fingerprint.avgSentLength + (1 - alpha) * fp.avgSentLength, entropy: alpha * fingerprint.entropy + (1 - alpha) * fp.entropy }; } else { this.baseline.fingerprint = fingerprint; } } this.baseline.sampleCount++; } /** * Gets current baseline state. */ get() { return { ...this.baseline }; } /** * Checks if baseline has enough samples to be stable. */ isStable() { return this.baseline.sampleCount >= this.minSamples; } /** * Resets baseline to initial state. */ reset() { this.baseline = { avgLatencyMs: 0, avgTokensPerSecond: 0, avgSimilarity: 0.85, fingerprint: {}, sampleCount: 0 }; } /** * Gets sample count. */ getSampleCount() { return this.baseline.sampleCount; } } exports.BaselineEngine = BaselineEngine; //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"baseline.js","sourceRoot":"","sources":["../../../src/engines/runtime/baseline.ts"],"names":[],"mappings":";AAAA;;;;;;;;;;;;;;;;;;;GAmBG;;;AAIH;;;;;;;;;;;GAWG;AACH,MAAa,cAAc;IAKzB;;;;;OAKG;IACH,YAAY,eAAuB,GAAG,EAAE,aAAqB,CAAC;QAC5D,IAAI,CAAC,YAAY,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,EAAE,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,YAAY,CAAC,CAAC,CAAC;QAC9D,IAAI,CAAC,UAAU,GAAG,UAAU,CAAC;QAC7B,IAAI,CAAC,QAAQ,GAAG;YACd,YAAY,EAAE,CAAC;YACf,kBAAkB,EAAE,CAAC;YACrB,aAAa,EAAE,IAAI;YACnB,WAAW,EAAE,EAAE;YACf,WAAW,EAAE,CAAC;SACf,CAAC;IACJ,CAAC;IAED;;;;;;OAMG;IACH,MAAM,CAAC,IAAgB,EAAE,WAAgC,EAAE,aAAqB,CAAC;QAC/E,MAAM,KAAK,GAAG,IAAI,CAAC,YAAY,CAAC;QAChC,MAAM,GAAG,GAAG,IAAI,CAAC,cAAc,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,SAAS,GAAG,IAAI,EAAE,KAAK,CAAC,CAAC;QAEzE,IAAI,IAAI,CAAC,QAAQ,CAAC,WAAW,KAAK,CAAC,EAAE,CAAC;YACpC,qCAAqC;YACrC,IAAI,CAAC,QAAQ,CAAC,YAAY,GAAG,IAAI,CAAC,SAAS,CAAC;YAC5C,IAAI,CAAC,QAAQ,CAAC,kBAAkB,GAAG,GAAG,CAAC;YACvC,IAAI,CAAC,QAAQ,CAAC,WAAW,GAAG,WAAW,CAAC;YACxC,IAAI,CAAC,QAAQ,CAAC,aAAa,GAAG,UAAU,CAAC;QAC3C,CAAC;aAAM,CAAC;YACN,aAAa;YACb,IAAI,CAAC,QAAQ,CAAC,YAAY,GAAG,KAAK,GAAG,IAAI,CAAC,SAAS,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,IAAI,CAAC,QAAQ,CAAC,YAAY,CAAC;YAC/F,IAAI,CAAC,QAAQ,CAAC,kBAAkB,GAAG,KAAK,GAAG,GAAG,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,IAAI,CAAC,QAAQ,CAAC,kBAAkB,CAAC;YAChG,IAAI,CAAC,QAAQ,CAAC,aAAa,GAAG,KAAK,GAAG,UAAU,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,IAAI,CAAC,QAAQ,CAAC,aAAa,CAAC;YAE7F,8BAA8B;YAC9B,IAAI,IAAI,CAAC,QAAQ,CAAC,WAAW,IAAI,QAAQ,IAAI,IAAI,CAAC,QAAQ,CAAC,WAAW,EAAE,CAAC;gBACvE,MAAM,EAAE,GAAG,IAAI,CAAC,QAAQ,CAAC,WAAkC,CAAC;gBAC5D,IAAI,CAAC,QAAQ,CAAC,WAAW,GAAG;oBAC1B,MAAM,EAAE,KAAK,GAAG,WAAW,CAAC,MAAM,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,EAAE,CAAC,MAAM;oBAC5D,SAAS,EAAE,KAAK,GAAG,WAAW,CAAC,SAAS,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,EAAE,CAAC,SAAS;oBACrE,aAAa,EAAE,KAAK,GAAG,WAAW,CAAC,aAAa,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,EAAE,CAAC,aAAa;oBACjF,OAAO,EAAE,KAAK,GAAG,WAAW,CAAC,OAAO,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,GAAG,EAAE,CAAC,OAAO;iBAChE,CAAC;YACJ,CAAC;iBAAM,CAAC;gBACN,IAAI,CAAC,QAAQ,CAAC,WAAW,GAAG,WAAW,CAAC;YAC1C,CAAC;QACH,CAAC;QAED,IAAI,CAAC,QAAQ,CAAC,WAAW,EAAE,CAAC;IAC9B,CAAC;IAED;;OAEG;IACH,GAAG;QACD,OAAO,EAAE,GAAG,IAAI,CAAC,QAAQ,EAAE,CAAC;IAC9B,CAAC;IAED;;OAEG;IACH,QAAQ;QACN,OAAO,IAAI,CAAC,QAAQ,CAAC,WAAW,IAAI,IAAI,CAAC,UAAU,CAAC;IACtD,CAAC;IAED;;OAEG;IACH,KAAK;QACH,IAAI,CAAC,QAAQ,GAAG;YACd,YAAY,EAAE,CAAC;YACf,kBAAkB,EAAE,CAAC;YACrB,aAAa,EAAE,IAAI;YACnB,WAAW,EAAE,EAAE;YACf,WAAW,EAAE,CAAC;SACf,CAAC;IACJ,CAAC;IAED;;OAEG;IACH,cAAc;QACZ,OAAO,IAAI,CAAC,QAAQ,CAAC,WAAW,CAAC;IACnC,CAAC;CACF;AAhGD,wCAgGC","sourcesContent":["/**\n * Baseline Engine\n * \n * Maintains and updates baseline metrics for drift detection.\n * Uses exponential moving average for stability.\n * \n * WHAT THIS DOES:\n * ✅ Tracks average latency, token rate, similarity\n * ✅ Maintains response fingerprint baseline\n * ✅ Uses EMA for smooth baseline updates\n * \n * WHAT THIS DOES NOT DO:\n * ❌ Persist baselines across sessions (in-memory only)\n * ❌ Account for intentional model changes\n * ❌ Distinguish normal variation from anomalies\n * \n * @module engines/runtime/baseline\n * @author Haiec\n * @license MIT\n */\n\nimport { CallRecord, BaselineState, ResponseFingerprint } from '../../types/runtime';\n\n/**\n * Manages baseline state for LLM monitoring.\n * \n * @example\n * const baseline = new BaselineEngine();\n * \n * // After each call\n * baseline.update(callRecord, fingerprint, similarity);\n * \n * // Get current baseline\n * const state = baseline.get();\n */\nexport class BaselineEngine {\n  private baseline: BaselineState;\n  private readonly learningRate: number;\n  private readonly minSamples: number;\n\n  /**\n   * Creates a new BaselineEngine.\n   * \n   * @param learningRate - EMA learning rate (0-1, default: 0.1)\n   * @param minSamples - Minimum samples before baseline is stable (default: 5)\n   */\n  constructor(learningRate: number = 0.1, minSamples: number = 5) {\n    this.learningRate = Math.max(0.01, Math.min(1, learningRate));\n    this.minSamples = minSamples;\n    this.baseline = {\n      avgLatencyMs: 0,\n      avgTokensPerSecond: 0,\n      avgSimilarity: 0.85,\n      fingerprint: {},\n      sampleCount: 0\n    };\n  }\n\n  /**\n   * Updates baseline with new call data.\n   * \n   * @param call - The call record\n   * @param fingerprint - Response fingerprint\n   * @param similarity - Similarity score (0-1)\n   */\n  update(call: CallRecord, fingerprint: ResponseFingerprint, similarity: number = 1): void {\n    const alpha = this.learningRate;\n    const tps = call.responseTokens / Math.max(call.latencyMs / 1000, 0.001);\n\n    if (this.baseline.sampleCount === 0) {\n      // First sample - initialize directly\n      this.baseline.avgLatencyMs = call.latencyMs;\n      this.baseline.avgTokensPerSecond = tps;\n      this.baseline.fingerprint = fingerprint;\n      this.baseline.avgSimilarity = similarity;\n    } else {\n      // EMA update\n      this.baseline.avgLatencyMs = alpha * call.latencyMs + (1 - alpha) * this.baseline.avgLatencyMs;\n      this.baseline.avgTokensPerSecond = alpha * tps + (1 - alpha) * this.baseline.avgTokensPerSecond;\n      this.baseline.avgSimilarity = alpha * similarity + (1 - alpha) * this.baseline.avgSimilarity;\n\n      // Update fingerprint with EMA\n      if (this.baseline.fingerprint && 'tokens' in this.baseline.fingerprint) {\n        const fp = this.baseline.fingerprint as ResponseFingerprint;\n        this.baseline.fingerprint = {\n          tokens: alpha * fingerprint.tokens + (1 - alpha) * fp.tokens,\n          sentences: alpha * fingerprint.sentences + (1 - alpha) * fp.sentences,\n          avgSentLength: alpha * fingerprint.avgSentLength + (1 - alpha) * fp.avgSentLength,\n          entropy: alpha * fingerprint.entropy + (1 - alpha) * fp.entropy\n        };\n      } else {\n        this.baseline.fingerprint = fingerprint;\n      }\n    }\n\n    this.baseline.sampleCount++;\n  }\n\n  /**\n   * Gets current baseline state.\n   */\n  get(): BaselineState {\n    return { ...this.baseline };\n  }\n\n  /**\n   * Checks if baseline has enough samples to be stable.\n   */\n  isStable(): boolean {\n    return this.baseline.sampleCount >= this.minSamples;\n  }\n\n  /**\n   * Resets baseline to initial state.\n   */\n  reset(): void {\n    this.baseline = {\n      avgLatencyMs: 0,\n      avgTokensPerSecond: 0,\n      avgSimilarity: 0.85,\n      fingerprint: {},\n      sampleCount: 0\n    };\n  }\n\n  /**\n   * Gets sample count.\n   */\n  getSampleCount(): number {\n    return this.baseline.sampleCount;\n  }\n}\n"]}