llmverify
Version:
AI Output Verification Toolkit — Local-first LLM safety, hallucination detection, PII redaction, prompt injection defense, and runtime monitoring. Zero telemetry. OWASP LLM Top 10 aligned.
111 lines • 14.4 kB
JavaScript
;
/**
* Hallucination Engine
*
* Identifies risk indicators in AI outputs.
* Does NOT definitively detect hallucinations - that requires ground truth.
*
* @module engines/hallucination
* @author Haiec
* @license MIT
*/
Object.defineProperty(exports, "__esModule", { value: true });
exports.HallucinationEngine = void 0;
const claim_extractor_1 = require("./claim-extractor");
const risk_analyzer_1 = require("./risk-analyzer");
class HallucinationEngine {
constructor(config) {
this.config = config;
this.LIMITATIONS = [
'Pattern-based detection only (free tier)',
'Cannot verify factual accuracy without ground truth sources',
'English language only',
'Context-dependent false positives possible',
'Novel phrasings may not be detected',
'Requires human validation for production use'
];
this.METHODOLOGY = 'Risk indicator identification using linguistic pattern analysis. ' +
'Analyzes claim specificity, citation presence, language patterns, and ' +
'contradiction signals. Does NOT verify factual accuracy. ' +
'Results indicate likelihood that claims need human review.';
}
async detect(content) {
// Step 1: Extract claims
let claims = (0, claim_extractor_1.extractClaims)(content);
// Step 2: Analyze risk indicators for each claim
claims = claims.map(claim => (0, risk_analyzer_1.analyzeRiskIndicators)(claim, this.config));
// Step 3: Check for contradictions
claims = (0, risk_analyzer_1.checkContradictions)(claims);
// Step 4: Identify suspicious claims
const suspiciousClaims = claims.filter(claim => {
const totalRisk = this.calculateClaimRisk(claim);
return totalRisk > 0.5;
});
// Step 5: Calculate overall risk score
const riskScore = this.calculateRiskScore(claims);
// Step 6: Calculate risk indicators summary
const riskIndicators = this.summarizeRiskIndicators(claims);
// Step 7: Calculate confidence
const confidence = this.calculateConfidence(claims);
return {
claims,
suspiciousClaims,
riskScore,
confidence,
riskIndicators,
limitations: this.LIMITATIONS,
methodology: this.METHODOLOGY
};
}
calculateClaimRisk(claim) {
return (claim.riskIndicators.lackOfSpecificity * 0.3 +
(claim.riskIndicators.missingCitation ? 0.3 : 0) +
(claim.riskIndicators.vagueLanguage ? 0.2 : 0) +
(claim.riskIndicators.contradictionSignal ? 0.2 : 0));
}
calculateRiskScore(claims) {
if (claims.length === 0)
return 0;
const totalRisk = claims.reduce((sum, claim) => {
return sum + this.calculateClaimRisk(claim);
}, 0);
return Math.min(totalRisk / claims.length, 1.0);
}
summarizeRiskIndicators(claims) {
if (claims.length === 0) {
return {
lackOfSpecificity: 0,
missingCitations: 0,
vagueLanguage: 0,
contradictionSignals: 0
};
}
return {
lackOfSpecificity: claims.reduce((sum, c) => sum + c.riskIndicators.lackOfSpecificity, 0) / claims.length,
missingCitations: claims.filter(c => c.riskIndicators.missingCitation).length,
vagueLanguage: claims.filter(c => c.riskIndicators.vagueLanguage).length,
contradictionSignals: claims.filter(c => c.riskIndicators.contradictionSignal).length
};
}
calculateConfidence(claims) {
const sampleSize = claims.length;
const baseLine = Math.min(sampleSize / 10, 1.0);
const value = sampleSize < 3 ? baseLine * 0.5 : baseLine;
const margin = 0.2 * (1 - value);
return {
value: Math.max(0.3, value),
interval: [
Math.max(0, value - margin),
Math.min(1, value + margin)
],
method: 'heuristic',
factors: {
patternStrength: value,
contextClarity: value,
historicalAccuracy: 0.7
}
};
}
}
exports.HallucinationEngine = HallucinationEngine;
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/engines/hallucination/index.ts"],"names":[],"mappings":";AAAA;;;;;;;;;GASG;;;AAIH,uDAAkD;AAClD,mDAA6E;AAE7E,MAAa,mBAAmB;IAgB9B,YAAoB,MAAc;QAAd,WAAM,GAAN,MAAM,CAAQ;QAfjB,gBAAW,GAAG;YAC7B,0CAA0C;YAC1C,6DAA6D;YAC7D,uBAAuB;YACvB,4CAA4C;YAC5C,qCAAqC;YACrC,8CAA8C;SAC/C,CAAC;QAEe,gBAAW,GAC1B,mEAAmE;YACnE,wEAAwE;YACxE,2DAA2D;YAC3D,4DAA4D,CAAC;IAE1B,CAAC;IAEtC,KAAK,CAAC,MAAM,CAAC,OAAe;QAC1B,yBAAyB;QACzB,IAAI,MAAM,GAAG,IAAA,+BAAa,EAAC,OAAO,CAAC,CAAC;QAEpC,iDAAiD;QACjD,MAAM,GAAG,MAAM,CAAC,GAAG,CAAC,KAAK,CAAC,EAAE,CAC1B,IAAA,qCAAqB,EAAC,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,CAC1C,CAAC;QAEF,mCAAmC;QACnC,MAAM,GAAG,IAAA,mCAAmB,EAAC,MAAM,CAAC,CAAC;QAErC,qCAAqC;QACrC,MAAM,gBAAgB,GAAG,MAAM,CAAC,MAAM,CAAC,KAAK,CAAC,EAAE;YAC7C,MAAM,SAAS,GAAG,IAAI,CAAC,kBAAkB,CAAC,KAAK,CAAC,CAAC;YACjD,OAAO,SAAS,GAAG,GAAG,CAAC;QACzB,CAAC,CAAC,CAAC;QAEH,uCAAuC;QACvC,MAAM,SAAS,GAAG,IAAI,CAAC,kBAAkB,CAAC,MAAM,CAAC,CAAC;QAElD,4CAA4C;QAC5C,MAAM,cAAc,GAAG,IAAI,CAAC,uBAAuB,CAAC,MAAM,CAAC,CAAC;QAE5D,+BAA+B;QAC/B,MAAM,UAAU,GAAG,IAAI,CAAC,mBAAmB,CAAC,MAAM,CAAC,CAAC;QAEpD,OAAO;YACL,MAAM;YACN,gBAAgB;YAChB,SAAS;YACT,UAAU;YACV,cAAc;YACd,WAAW,EAAE,IAAI,CAAC,WAAW;YAC7B,WAAW,EAAE,IAAI,CAAC,WAAW;SAC9B,CAAC;IACJ,CAAC;IAEO,kBAAkB,CAAC,KAAY;QACrC,OAAO,CACL,KAAK,CAAC,cAAc,CAAC,iBAAiB,GAAG,GAAG;YAC5C,CAAC,KAAK,CAAC,cAAc,CAAC,eAAe,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC;YAChD,CAAC,KAAK,CAAC,cAAc,CAAC,aAAa,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC;YAC9C,CAAC,KAAK,CAAC,cAAc,CAAC,mBAAmB,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CACrD,CAAC;IACJ,CAAC;IAEO,kBAAkB,CAAC,MAAe;QACxC,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC;YAAE,OAAO,CAAC,CAAC;QAElC,MAAM,SAAS,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,KAAK,EAAE,EAAE;YAC7C,OAAO,GAAG,GAAG,IAAI,CAAC,kBAAkB,CAAC,KAAK,CAAC,CAAC;QAC9C,CAAC,EAAE,CAAC,CAAC,CAAC;QAEN,OAAO,IAAI,CAAC,GAAG,CAAC,SAAS,GAAG,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,CAAC;IAClD,CAAC;IAEO,uBAAuB,CAAC,MAAe;QAC7C,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;YACxB,OAAO;gBACL,iBAAiB,EAAE,CAAC;gBACpB,gBAAgB,EAAE,CAAC;gBACnB,aAAa,EAAE,CAAC;gBAChB,oBAAoB,EAAE,CAAC;aACxB,CAAC;QACJ,CAAC;QAED,OAAO;YACL,iBAAiB,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,GAAG,EAAE,CAAC,EAAE,EAAE,CAC1C,GAAG,GAAG,CAAC,CAAC,cAAc,CAAC,iBAAiB,EAAE,CAAC,CAAC,GAAG,MAAM,CAAC,MAAM;YAC9D,gBAAgB,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAClC,CAAC,CAAC,cAAc,CAAC,eAAe,CAAC,CAAC,MAAM;YAC1C,aAAa,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAC/B,CAAC,CAAC,cAAc,CAAC,aAAa,CAAC,CAAC,MAAM;YACxC,oBAAoB,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CACtC,CAAC,CAAC,cAAc,CAAC,mBAAmB,CAAC,CAAC,MAAM;SAC/C,CAAC;IACJ,CAAC;IAEO,mBAAmB,CAAC,MAAe;QACzC,MAAM,UAAU,GAAG,MAAM,CAAC,MAAM,CAAC;QACjC,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC,UAAU,GAAG,EAAE,EAAE,GAAG,CAAC,CAAC;QAEhD,MAAM,KAAK,GAAG,UAAU,GAAG,CAAC,CAAC,CAAC,CAAC,QAAQ,GAAG,GAAG,CAAC,CAAC,CAAC,QAAQ,CAAC;QACzD,MAAM,MAAM,GAAG,GAAG,GAAG,CAAC,CAAC,GAAG,KAAK,CAAC,CAAC;QAEjC,OAAO;YACL,KAAK,EAAE,IAAI,CAAC,GAAG,CAAC,GAAG,EAAE,KAAK,CAAC;YAC3B,QAAQ,EAAE;gBACR,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,GAAG,MAAM,CAAC;gBAC3B,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,KAAK,GAAG,MAAM,CAAC;aAC5B;YACD,MAAM,EAAE,WAAW;YACnB,OAAO,EAAE;gBACP,eAAe,EAAE,KAAK;gBACtB,cAAc,EAAE,KAAK;gBACrB,kBAAkB,EAAE,GAAG;aACxB;SACF,CAAC;IACJ,CAAC;CACF;AAtHD,kDAsHC","sourcesContent":["/**\n * Hallucination Engine\n * \n * Identifies risk indicators in AI outputs.\n * Does NOT definitively detect hallucinations - that requires ground truth.\n * \n * @module engines/hallucination\n * @author Haiec\n * @license MIT\n */\n\nimport { Config } from '../../types/config';\nimport { HallucinationResult, Claim, ConfidenceScore } from '../../types/results';\nimport { extractClaims } from './claim-extractor';\nimport { analyzeRiskIndicators, checkContradictions } from './risk-analyzer';\n\nexport class HallucinationEngine {\n  private readonly LIMITATIONS = [\n    'Pattern-based detection only (free tier)',\n    'Cannot verify factual accuracy without ground truth sources',\n    'English language only',\n    'Context-dependent false positives possible',\n    'Novel phrasings may not be detected',\n    'Requires human validation for production use'\n  ];\n  \n  private readonly METHODOLOGY = \n    'Risk indicator identification using linguistic pattern analysis. ' +\n    'Analyzes claim specificity, citation presence, language patterns, and ' +\n    'contradiction signals. Does NOT verify factual accuracy. ' +\n    'Results indicate likelihood that claims need human review.';\n  \n  constructor(private config: Config) {}\n  \n  async detect(content: string): Promise<HallucinationResult> {\n    // Step 1: Extract claims\n    let claims = extractClaims(content);\n    \n    // Step 2: Analyze risk indicators for each claim\n    claims = claims.map(claim => \n      analyzeRiskIndicators(claim, this.config)\n    );\n    \n    // Step 3: Check for contradictions\n    claims = checkContradictions(claims);\n    \n    // Step 4: Identify suspicious claims\n    const suspiciousClaims = claims.filter(claim => {\n      const totalRisk = this.calculateClaimRisk(claim);\n      return totalRisk > 0.5;\n    });\n    \n    // Step 5: Calculate overall risk score\n    const riskScore = this.calculateRiskScore(claims);\n    \n    // Step 6: Calculate risk indicators summary\n    const riskIndicators = this.summarizeRiskIndicators(claims);\n    \n    // Step 7: Calculate confidence\n    const confidence = this.calculateConfidence(claims);\n    \n    return {\n      claims,\n      suspiciousClaims,\n      riskScore,\n      confidence,\n      riskIndicators,\n      limitations: this.LIMITATIONS,\n      methodology: this.METHODOLOGY\n    };\n  }\n  \n  private calculateClaimRisk(claim: Claim): number {\n    return (\n      claim.riskIndicators.lackOfSpecificity * 0.3 +\n      (claim.riskIndicators.missingCitation ? 0.3 : 0) +\n      (claim.riskIndicators.vagueLanguage ? 0.2 : 0) +\n      (claim.riskIndicators.contradictionSignal ? 0.2 : 0)\n    );\n  }\n  \n  private calculateRiskScore(claims: Claim[]): number {\n    if (claims.length === 0) return 0;\n    \n    const totalRisk = claims.reduce((sum, claim) => {\n      return sum + this.calculateClaimRisk(claim);\n    }, 0);\n    \n    return Math.min(totalRisk / claims.length, 1.0);\n  }\n  \n  private summarizeRiskIndicators(claims: Claim[]) {\n    if (claims.length === 0) {\n      return {\n        lackOfSpecificity: 0,\n        missingCitations: 0,\n        vagueLanguage: 0,\n        contradictionSignals: 0\n      };\n    }\n    \n    return {\n      lackOfSpecificity: claims.reduce((sum, c) => \n        sum + c.riskIndicators.lackOfSpecificity, 0) / claims.length,\n      missingCitations: claims.filter(c => \n        c.riskIndicators.missingCitation).length,\n      vagueLanguage: claims.filter(c => \n        c.riskIndicators.vagueLanguage).length,\n      contradictionSignals: claims.filter(c => \n        c.riskIndicators.contradictionSignal).length\n    };\n  }\n  \n  private calculateConfidence(claims: Claim[]): ConfidenceScore {\n    const sampleSize = claims.length;\n    const baseLine = Math.min(sampleSize / 10, 1.0);\n    \n    const value = sampleSize < 3 ? baseLine * 0.5 : baseLine;\n    const margin = 0.2 * (1 - value);\n    \n    return {\n      value: Math.max(0.3, value),\n      interval: [\n        Math.max(0, value - margin),\n        Math.min(1, value + margin)\n      ],\n      method: 'heuristic',\n      factors: {\n        patternStrength: value,\n        contextClarity: value,\n        historicalAccuracy: 0.7\n      }\n    };\n  }\n}\n"]}