UNPKG

llmverify

Version:

AI Output Verification Toolkit — Local-first LLM safety, hallucination detection, PII redaction, prompt injection defense, and runtime monitoring. Zero telemetry. OWASP LLM Top 10 aligned.

111 lines 14.4 kB
"use strict"; /** * Hallucination Engine * * Identifies risk indicators in AI outputs. * Does NOT definitively detect hallucinations - that requires ground truth. * * @module engines/hallucination * @author Haiec * @license MIT */ Object.defineProperty(exports, "__esModule", { value: true }); exports.HallucinationEngine = void 0; const claim_extractor_1 = require("./claim-extractor"); const risk_analyzer_1 = require("./risk-analyzer"); class HallucinationEngine { constructor(config) { this.config = config; this.LIMITATIONS = [ 'Pattern-based detection only (free tier)', 'Cannot verify factual accuracy without ground truth sources', 'English language only', 'Context-dependent false positives possible', 'Novel phrasings may not be detected', 'Requires human validation for production use' ]; this.METHODOLOGY = 'Risk indicator identification using linguistic pattern analysis. ' + 'Analyzes claim specificity, citation presence, language patterns, and ' + 'contradiction signals. Does NOT verify factual accuracy. ' + 'Results indicate likelihood that claims need human review.'; } async detect(content) { // Step 1: Extract claims let claims = (0, claim_extractor_1.extractClaims)(content); // Step 2: Analyze risk indicators for each claim claims = claims.map(claim => (0, risk_analyzer_1.analyzeRiskIndicators)(claim, this.config)); // Step 3: Check for contradictions claims = (0, risk_analyzer_1.checkContradictions)(claims); // Step 4: Identify suspicious claims const suspiciousClaims = claims.filter(claim => { const totalRisk = this.calculateClaimRisk(claim); return totalRisk > 0.5; }); // Step 5: Calculate overall risk score const riskScore = this.calculateRiskScore(claims); // Step 6: Calculate risk indicators summary const riskIndicators = this.summarizeRiskIndicators(claims); // Step 7: Calculate confidence const confidence = this.calculateConfidence(claims); return { claims, suspiciousClaims, riskScore, confidence, riskIndicators, limitations: this.LIMITATIONS, methodology: this.METHODOLOGY }; } calculateClaimRisk(claim) { return (claim.riskIndicators.lackOfSpecificity * 0.3 + (claim.riskIndicators.missingCitation ? 0.3 : 0) + (claim.riskIndicators.vagueLanguage ? 0.2 : 0) + (claim.riskIndicators.contradictionSignal ? 0.2 : 0)); } calculateRiskScore(claims) { if (claims.length === 0) return 0; const totalRisk = claims.reduce((sum, claim) => { return sum + this.calculateClaimRisk(claim); }, 0); return Math.min(totalRisk / claims.length, 1.0); } summarizeRiskIndicators(claims) { if (claims.length === 0) { return { lackOfSpecificity: 0, missingCitations: 0, vagueLanguage: 0, contradictionSignals: 0 }; } return { lackOfSpecificity: claims.reduce((sum, c) => sum + c.riskIndicators.lackOfSpecificity, 0) / claims.length, missingCitations: claims.filter(c => c.riskIndicators.missingCitation).length, vagueLanguage: claims.filter(c => c.riskIndicators.vagueLanguage).length, contradictionSignals: claims.filter(c => c.riskIndicators.contradictionSignal).length }; } calculateConfidence(claims) { const sampleSize = claims.length; const baseLine = Math.min(sampleSize / 10, 1.0); const value = sampleSize < 3 ? baseLine * 0.5 : baseLine; const margin = 0.2 * (1 - value); return { value: Math.max(0.3, value), interval: [ Math.max(0, value - margin), Math.min(1, value + margin) ], method: 'heuristic', factors: { patternStrength: value, contextClarity: value, historicalAccuracy: 0.7 } }; } } exports.HallucinationEngine = HallucinationEngine; //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/engines/hallucination/index.ts"],"names":[],"mappings":";AAAA;;;;;;;;;GASG;;;AAIH,uDAAkD;AAClD,mDAA6E;AAE7E,MAAa,mBAAmB;IAgB9B,YAAoB,MAAc;QAAd,WAAM,GAAN,MAAM,CAAQ;QAfjB,gBAAW,GAAG;YAC7B,0CAA0C;YAC1C,6DAA6D;YAC7D,uBAAuB;YACvB,4CAA4C;YAC5C,qCAAqC;YACrC,8CAA8C;SAC/C,CAAC;QAEe,gBAAW,GAC1B,mEAAmE;YACnE,wEAAwE;YACxE,2DAA2D;YAC3D,4DAA4D,CAAC;IAE1B,CAAC;IAEtC,KAAK,CAAC,MAAM,CAAC,OAAe;QAC1B,yBAAyB;QACzB,IAAI,MAAM,GAAG,IAAA,+BAAa,EAAC,OAAO,CAAC,CAAC;QAEpC,iDAAiD;QACjD,MAAM,GAAG,MAAM,CAAC,GAAG,CAAC,KAAK,CAAC,EAAE,CAC1B,IAAA,qCAAqB,EAAC,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,CAC1C,CAAC;QAEF,mCAAmC;QACnC,MAAM,GAAG,IAAA,mCAAmB,EAAC,MAAM,CAAC,CAAC;QAErC,qCAAqC;QACrC,MAAM,gBAAgB,GAAG,MAAM,CAAC,MAAM,CAAC,KAAK,CAAC,EAAE;YAC7C,MAAM,SAAS,GAAG,IAAI,CAAC,kBAAkB,CAAC,KAAK,CAAC,CAAC;YACjD,OAAO,SAAS,GAAG,GAAG,CAAC;QACzB,CAAC,CAAC,CAAC;QAEH,uCAAuC;QACvC,MAAM,SAAS,GAAG,IAAI,CAAC,kBAAkB,CAAC,MAAM,CAAC,CAAC;QAElD,4CAA4C;QAC5C,MAAM,cAAc,GAAG,IAAI,CAAC,uBAAuB,CAAC,MAAM,CAAC,CAAC;QAE5D,+BAA+B;QAC/B,MAAM,UAAU,GAAG,IAAI,CAAC,mBAAmB,CAAC,MAAM,CAAC,CAAC;QAEpD,OAAO;YACL,MAAM;YACN,gBAAgB;YAChB,SAAS;YACT,UAAU;YACV,cAAc;YACd,WAAW,EAAE,IAAI,CAAC,WAAW;YAC7B,WAAW,EAAE,IAAI,CAAC,WAAW;SAC9B,CAAC;IACJ,CAAC;IAEO,kBAAkB,CAAC,KAAY;QACrC,OAAO,CACL,KAAK,CAAC,cAAc,CAAC,iBAAiB,GAAG,GAAG;YAC5C,CAAC,KAAK,CAAC,cAAc,CAAC,eAAe,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC;YAChD,CAAC,KAAK,CAAC,cAAc,CAAC,aAAa,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC;YAC9C,CAAC,KAAK,CAAC,cAAc,CAAC,mBAAmB,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CACrD,CAAC;IACJ,CAAC;IAEO,kBAAkB,CAAC,MAAe;QACxC,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC;YAAE,OAAO,CAAC,CAAC;QAElC,MAAM,SAAS,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,KAAK,EAAE,EAAE;YAC7C,OAAO,GAAG,GAAG,IAAI,CAAC,kBAAkB,CAAC,KAAK,CAAC,CAAC;QAC9C,CAAC,EAAE,CAAC,CAAC,CAAC;QAEN,OAAO,IAAI,CAAC,GAAG,CAAC,SAAS,GAAG,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;IAClD,CAAC;IAEO,uBAAuB,CAAC,MAAe;QAC7C,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YACxB,OAAO;gBACL,iBAAiB,EAAE,CAAC;gBACpB,gBAAgB,EAAE,CAAC;gBACnB,aAAa,EAAE,CAAC;gBAChB,oBAAoB,EAAE,CAAC;aACxB,CAAC;QACJ,CAAC;QAED,OAAO;YACL,iBAAiB,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAC1C,GAAG,GAAG,CAAC,CAAC,cAAc,CAAC,iBAAiB,EAAE,CAAC,CAAC,GAAG,MAAM,CAAC,MAAM;YAC9D,gBAAgB,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAClC,CAAC,CAAC,cAAc,CAAC,eAAe,CAAC,CAAC,MAAM;YAC1C,aAAa,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAC/B,CAAC,CAAC,cAAc,CAAC,aAAa,CAAC,CAAC,MAAM;YACxC,oBAAoB,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CACtC,CAAC,CAAC,cAAc,CAAC,mBAAmB,CAAC,CAAC,MAAM;SAC/C,CAAC;IACJ,CAAC;IAEO,mBAAmB,CAAC,MAAe;QACzC,MAAM,UAAU,GAAG,MAAM,CAAC,MAAM,CAAC;QACjC,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC,UAAU,GAAG,EAAE,EAAE,GAAG,CAAC,CAAC;QAEhD,MAAM,KAAK,GAAG,UAAU,GAAG,CAAC,CAAC,CAAC,CAAC,QAAQ,GAAG,GAAG,CAAC,CAAC,CAAC,QAAQ,CAAC;QACzD,MAAM,MAAM,GAAG,GAAG,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,CAAC;QAEjC,OAAO;YACL,KAAK,EAAE,IAAI,CAAC,GAAG,CAAC,GAAG,EAAE,KAAK,CAAC;YAC3B,QAAQ,EAAE;gBACR,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,GAAG,MAAM,CAAC;gBAC3B,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,GAAG,MAAM,CAAC;aAC5B;YACD,MAAM,EAAE,WAAW;YACnB,OAAO,EAAE;gBACP,eAAe,EAAE,KAAK;gBACtB,cAAc,EAAE,KAAK;gBACrB,kBAAkB,EAAE,GAAG;aACxB;SACF,CAAC;IACJ,CAAC;CACF;AAtHD,kDAsHC","sourcesContent":["/**\n * Hallucination Engine\n * \n * Identifies risk indicators in AI outputs.\n * Does NOT definitively detect hallucinations - that requires ground truth.\n * \n * @module engines/hallucination\n * @author Haiec\n * @license MIT\n */\n\nimport { Config } from '../../types/config';\nimport { HallucinationResult, Claim, ConfidenceScore } from '../../types/results';\nimport { extractClaims } from './claim-extractor';\nimport { analyzeRiskIndicators, checkContradictions } from './risk-analyzer';\n\nexport class HallucinationEngine {\n  private readonly LIMITATIONS = [\n    'Pattern-based detection only (free tier)',\n    'Cannot verify factual accuracy without ground truth sources',\n    'English language only',\n    'Context-dependent false positives possible',\n    'Novel phrasings may not be detected',\n    'Requires human validation for production use'\n  ];\n  \n  private readonly METHODOLOGY = \n    'Risk indicator identification using linguistic pattern analysis. ' +\n    'Analyzes claim specificity, citation presence, language patterns, and ' +\n    'contradiction signals. Does NOT verify factual accuracy. ' +\n    'Results indicate likelihood that claims need human review.';\n  \n  constructor(private config: Config) {}\n  \n  async detect(content: string): Promise<HallucinationResult> {\n    // Step 1: Extract claims\n    let claims = extractClaims(content);\n    \n    // Step 2: Analyze risk indicators for each claim\n    claims = claims.map(claim => \n      analyzeRiskIndicators(claim, this.config)\n    );\n    \n    // Step 3: Check for contradictions\n    claims = checkContradictions(claims);\n    \n    // Step 4: Identify suspicious claims\n    const suspiciousClaims = claims.filter(claim => {\n      const totalRisk = this.calculateClaimRisk(claim);\n      return totalRisk > 0.5;\n    });\n    \n    // Step 5: Calculate overall risk score\n    const riskScore = this.calculateRiskScore(claims);\n    \n    // Step 6: Calculate risk indicators summary\n    const riskIndicators = this.summarizeRiskIndicators(claims);\n    \n    // Step 7: Calculate confidence\n    const confidence = this.calculateConfidence(claims);\n    \n    return {\n      claims,\n      suspiciousClaims,\n      riskScore,\n      confidence,\n      riskIndicators,\n      limitations: this.LIMITATIONS,\n      methodology: this.METHODOLOGY\n    };\n  }\n  \n  private calculateClaimRisk(claim: Claim): number {\n    return (\n      claim.riskIndicators.lackOfSpecificity * 0.3 +\n      (claim.riskIndicators.missingCitation ? 0.3 : 0) +\n      (claim.riskIndicators.vagueLanguage ? 0.2 : 0) +\n      (claim.riskIndicators.contradictionSignal ? 0.2 : 0)\n    );\n  }\n  \n  private calculateRiskScore(claims: Claim[]): number {\n    if (claims.length === 0) return 0;\n    \n    const totalRisk = claims.reduce((sum, claim) => {\n      return sum + this.calculateClaimRisk(claim);\n    }, 0);\n    \n    return Math.min(totalRisk / claims.length, 1.0);\n  }\n  \n  private summarizeRiskIndicators(claims: Claim[]) {\n    if (claims.length === 0) {\n      return {\n        lackOfSpecificity: 0,\n        missingCitations: 0,\n        vagueLanguage: 0,\n        contradictionSignals: 0\n      };\n    }\n    \n    return {\n      lackOfSpecificity: claims.reduce((sum, c) => \n        sum + c.riskIndicators.lackOfSpecificity, 0) / claims.length,\n      missingCitations: claims.filter(c => \n        c.riskIndicators.missingCitation).length,\n      vagueLanguage: claims.filter(c => \n        c.riskIndicators.vagueLanguage).length,\n      contradictionSignals: claims.filter(c => \n        c.riskIndicators.contradictionSignal).length\n    };\n  }\n  \n  private calculateConfidence(claims: Claim[]): ConfidenceScore {\n    const sampleSize = claims.length;\n    const baseLine = Math.min(sampleSize / 10, 1.0);\n    \n    const value = sampleSize < 3 ? baseLine * 0.5 : baseLine;\n    const margin = 0.2 * (1 - value);\n    \n    return {\n      value: Math.max(0.3, value),\n      interval: [\n        Math.max(0, value - margin),\n        Math.min(1, value + margin)\n      ],\n      method: 'heuristic',\n      factors: {\n        patternStrength: value,\n        contextClarity: value,\n        historicalAccuracy: 0.7\n      }\n    };\n  }\n}\n"]}