UNPKG

llmverify

Version:

AI Output Verification Toolkit — Local-first LLM safety, hallucination detection, PII redaction, prompt injection defense, and runtime monitoring. Zero telemetry. OWASP LLM Top 10 aligned.

197 lines 17.5 kB
"use strict"; /** * Intent Detection Module * * Detects the primary intent/purpose of LLM output. * * @module engines/classification/intent * @author Haiec * @license MIT */ Object.defineProperty(exports, "__esModule", { value: true }); exports.detectIntent = detectIntent; exports.getPrimaryIntent = getPrimaryIntent; const utils_1 = require("./utils"); /** * Intent detection patterns. */ const INTENT_PATTERNS = [ { tag: 'summary', patterns: [ /\b(in summary|to summarize|overall|in conclusion|key points?|main points?)\b/i, /\b(tldr|tl;dr|brief overview)\b/i ], weight: 1.0 }, { tag: 'explanation', patterns: [ /\b(because|therefore|this means|in other words|for example|such as)\b/i, /\b(the reason|explains?|due to|as a result)\b/i, /\b(works by|functions by|operates by)\b/i ], weight: 0.8 }, { tag: 'code', patterns: [ /```[\s\S]*```/, /\b(function|const|let|var|class|import|export|return|if|else|for|while)\b/, /[{}\[\]();]=>/, /\b(def|async|await|try|catch)\b/ ], weight: 1.0 }, { tag: 'list', patterns: [ /^[-*•]\s+/m, /^\d+[.)]\s+/m, /\b(here are|the following|steps?:|items?:)\b/i ], weight: 0.9 }, { tag: 'question', patterns: [ /\?$/m, /\b(what|why|how|when|where|who|which|would you|could you|can you)\b/i ], weight: 0.7 }, { tag: 'instruction', patterns: [ /\b(step \d|first,?|then,?|next,?|finally,?|make sure|ensure|remember to)\b/i, /\b(you should|you need to|you must|please|do not|don't)\b/i ], weight: 0.8 }, { tag: 'creative', patterns: [ /\b(once upon|imagine|picture this|in a world)\b/i, /\b(poem|story|tale|narrative|fiction)\b/i ], weight: 0.9 }, { tag: 'analysis', patterns: [ /\b(analysis|analyzing|examine|examining|evaluate|evaluating)\b/i, /\b(pros and cons|advantages|disadvantages|strengths|weaknesses)\b/i, /\b(factors|considerations|implications)\b/i ], weight: 0.8 }, { tag: 'comparison', patterns: [ /\b(compared to|versus|vs\.?|differ|difference|similar|unlike|whereas)\b/i, /\b(on the other hand|in contrast|alternatively)\b/i ], weight: 0.9 }, { tag: 'definition', patterns: [ /\b(is defined as|refers to|means|is a|are a)\b/i, /\b(definition|meaning|concept of)\b/i ], weight: 0.7 }, { tag: 'translation', patterns: [ /\b(translates? to|in [a-z]+ language|translation)\b/i ], weight: 1.0 }, { tag: 'conversation', patterns: [ /\b(hi|hello|hey|thanks|thank you|you're welcome|sure|okay|ok)\b/i, /\b(I think|I believe|in my opinion|personally)\b/i ], weight: 0.5 }, { tag: 'data', patterns: [ /\b(data|dataset|statistics|numbers|figures|metrics)\b/i, /\d+%|\d+\.\d+/, /\b(table|chart|graph)\b/i ], weight: 0.7 } ]; /** * Detects intent candidates from text. * * @param text - The text to analyze * @returns Array of intent candidates sorted by confidence */ function detectIntent(text) { const candidates = []; const words = (0, utils_1.tokenize)(text); const bullets = (0, utils_1.countBullets)(text); for (const { tag, patterns, weight } of INTENT_PATTERNS) { let matchCount = 0; const signals = []; for (const pattern of patterns) { if (pattern.test(text)) { matchCount++; signals.push(pattern.source.substring(0, 30)); } } if (matchCount > 0) { // Calculate confidence based on matches and text characteristics let confidence = (matchCount / patterns.length) * weight; // Boost for structural matches if (tag === 'list' && bullets >= 3) { confidence = Math.min(1, confidence + 0.3); } if (tag === 'code' && text.includes('```')) { confidence = Math.min(1, confidence + 0.4); } // Normalize by text length (longer text = more reliable) if (words.length < 20) { confidence *= 0.7; } else if (words.length > 100) { confidence = Math.min(1, confidence * 1.1); } candidates.push({ tag, confidence: Math.round(confidence * 100) / 100, signals }); } } // Sort by confidence descending candidates.sort((a, b) => b.confidence - a.confidence); // If no candidates, return unknown if (candidates.length === 0) { candidates.push({ tag: 'unknown', confidence: 0.5, signals: ['no_patterns_matched'] }); } return candidates; } /** * Gets the primary intent from candidates. */ function getPrimaryIntent(candidates) { if (candidates.length === 0) return null; const top = candidates[0]; // Only return if confidence is reasonable if (top.confidence >= 0.3) { return top.tag; } return null; } //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"intent.js","sourceRoot":"","sources":["../../../src/engines/classification/intent.ts"],"names":[],"mappings":";AAAA;;;;;;;;GAQG;;AAkIH,oCAwDC;AAKD,4CAUC;AAtMD,mCAAiD;AAEjD;;GAEG;AACH,MAAM,eAAe,GAIhB;IACH;QACE,GAAG,EAAE,SAAS;QACd,QAAQ,EAAE;YACR,+EAA+E;YAC/E,kCAAkC;SACnC;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,aAAa;QAClB,QAAQ,EAAE;YACR,wEAAwE;YACxE,gDAAgD;YAChD,0CAA0C;SAC3C;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,MAAM;QACX,QAAQ,EAAE;YACR,eAAe;YACf,2EAA2E;YAC3E,eAAe;YACf,iCAAiC;SAClC;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,MAAM;QACX,QAAQ,EAAE;YACR,YAAY;YACZ,cAAc;YACd,+CAA+C;SAChD;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,UAAU;QACf,QAAQ,EAAE;YACR,MAAM;YACN,sEAAsE;SACvE;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,aAAa;QAClB,QAAQ,EAAE;YACR,6EAA6E;YAC7E,4DAA4D;SAC7D;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,UAAU;QACf,QAAQ,EAAE;YACR,kDAAkD;YAClD,0CAA0C;SAC3C;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,UAAU;QACf,QAAQ,EAAE;YACR,iEAAiE;YACjE,oEAAoE;YACpE,4CAA4C;SAC7C;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,YAAY;QACjB,QAAQ,EAAE;YACR,0EAA0E;YAC1E,oDAAoD;SACrD;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,YAAY;QACjB,QAAQ,EAAE;YACR,iDAAiD;YACjD,sCAAsC;SACvC;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,aAAa;QAClB,QAAQ,EAAE;YACR,sDAAsD;SACvD;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,cAAc;QACnB,QAAQ,EAAE;YACR,kEAAkE;YAClE,mDAAmD;SACpD;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,MAAM;QACX,QAAQ,EAAE;YACR,wDAAwD;YACxD,eAAe;YACf,0BAA0B;SAC3B;QACD,MAAM,EAAE,GAAG;KACZ;CACF,CAAC;AAEF;;;;;GAKG;AACH,SAAgB,YAAY,CAAC,IAAY;IACvC,MAAM,UAAU,GAAsB,EAAE,CAAC;IACzC,MAAM,KAAK,GAAG,IAAA,gBAAQ,EAAC,IAAI,CAAC,CAAC;IAC7B,MAAM,OAAO,GAAG,IAAA,oBAAY,EAAC,IAAI,CAAC,CAAC;IAEnC,KAAK,MAAM,EAAE,GAAG,EAAE,QAAQ,EAAE,MAAM,EAAE,IAAI,eAAe,EAAE,CAAC;QACxD,IAAI,UAAU,GAAG,CAAC,CAAC;QACnB,MAAM,OAAO,GAAa,EAAE,CAAC;QAE7B,KAAK,MAAM,OAAO,IAAI,QAAQ,EAAE,CAAC;YAC/B,IAAI,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;gBACvB,UAAU,EAAE,CAAC;gBACb,OAAO,CAAC,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,SAAS,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC;YAChD,CAAC;QACH,CAAC;QAED,IAAI,UAAU,GAAG,CAAC,EAAE,CAAC;YACnB,iEAAiE;YACjE,IAAI,UAAU,GAAG,CAAC,UAAU,GAAG,QAAQ,CAAC,MAAM,CAAC,GAAG,MAAM,CAAC;YAEzD,+BAA+B;YAC/B,IAAI,GAAG,KAAK,MAAM,IAAI,OAAO,IAAI,CAAC,EAAE,CAAC;gBACnC,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,UAAU,GAAG,GAAG,CAAC,CAAC;YAC7C,CAAC;YACD,IAAI,GAAG,KAAK,MAAM,IAAI,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;gBAC3C,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,UAAU,GAAG,GAAG,CAAC,CAAC;YAC7C,CAAC;YAED,yDAAyD;YACzD,IAAI,KAAK,CAAC,MAAM,GAAG,EAAE,EAAE,CAAC;gBACtB,UAAU,IAAI,GAAG,CAAC;YACpB,CAAC;iBAAM,IAAI,KAAK,CAAC,MAAM,GAAG,GAAG,EAAE,CAAC;gBAC9B,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,UAAU,GAAG,GAAG,CAAC,CAAC;YAC7C,CAAC;YAED,UAAU,CAAC,IAAI,CAAC;gBACd,GAAG;gBACH,UAAU,EAAE,IAAI,CAAC,KAAK,CAAC,UAAU,GAAG,GAAG,CAAC,GAAG,GAAG;gBAC9C,OAAO;aACR,CAAC,CAAC;QACL,CAAC;IACH,CAAC;IAED,gCAAgC;IAChC,UAAU,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,UAAU,GAAG,CAAC,CAAC,UAAU,CAAC,CAAC;IAEvD,mCAAmC;IACnC,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAC5B,UAAU,CAAC,IAAI,CAAC;YACd,GAAG,EAAE,SAAS;YACd,UAAU,EAAE,GAAG;YACf,OAAO,EAAE,CAAC,qBAAqB,CAAC;SACjC,CAAC,CAAC;IACL,CAAC;IAED,OAAO,UAAU,CAAC;AACpB,CAAC;AAED;;GAEG;AACH,SAAgB,gBAAgB,CAAC,UAA6B;IAC5D,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,IAAI,CAAC;IAEzC,MAAM,GAAG,GAAG,UAAU,CAAC,CAAC,CAAC,CAAC;IAC1B,0CAA0C;IAC1C,IAAI,GAAG,CAAC,UAAU,IAAI,GAAG,EAAE,CAAC;QAC1B,OAAO,GAAG,CAAC,GAAG,CAAC;IACjB,CAAC;IAED,OAAO,IAAI,CAAC;AACd,CAAC","sourcesContent":["/**\n * Intent Detection Module\n * \n * Detects the primary intent/purpose of LLM output.\n * \n * @module engines/classification/intent\n * @author Haiec\n * @license MIT\n */\n\nimport { IntentTag, IntentCandidate } from './types';\nimport { countBullets, tokenize } from './utils';\n\n/**\n * Intent detection patterns.\n */\nconst INTENT_PATTERNS: Array<{\n  tag: IntentTag;\n  patterns: RegExp[];\n  weight: number;\n}> = [\n  {\n    tag: 'summary',\n    patterns: [\n      /\\b(in summary|to summarize|overall|in conclusion|key points?|main points?)\\b/i,\n      /\\b(tldr|tl;dr|brief overview)\\b/i\n    ],\n    weight: 1.0\n  },\n  {\n    tag: 'explanation',\n    patterns: [\n      /\\b(because|therefore|this means|in other words|for example|such as)\\b/i,\n      /\\b(the reason|explains?|due to|as a result)\\b/i,\n      /\\b(works by|functions by|operates by)\\b/i\n    ],\n    weight: 0.8\n  },\n  {\n    tag: 'code',\n    patterns: [\n      /```[\\s\\S]*```/,\n      /\\b(function|const|let|var|class|import|export|return|if|else|for|while)\\b/,\n      /[{}\\[\\]();]=>/,\n      /\\b(def|async|await|try|catch)\\b/\n    ],\n    weight: 1.0\n  },\n  {\n    tag: 'list',\n    patterns: [\n      /^[-*•]\\s+/m,\n      /^\\d+[.)]\\s+/m,\n      /\\b(here are|the following|steps?:|items?:)\\b/i\n    ],\n    weight: 0.9\n  },\n  {\n    tag: 'question',\n    patterns: [\n      /\\?$/m,\n      /\\b(what|why|how|when|where|who|which|would you|could you|can you)\\b/i\n    ],\n    weight: 0.7\n  },\n  {\n    tag: 'instruction',\n    patterns: [\n      /\\b(step \\d|first,?|then,?|next,?|finally,?|make sure|ensure|remember to)\\b/i,\n      /\\b(you should|you need to|you must|please|do not|don't)\\b/i\n    ],\n    weight: 0.8\n  },\n  {\n    tag: 'creative',\n    patterns: [\n      /\\b(once upon|imagine|picture this|in a world)\\b/i,\n      /\\b(poem|story|tale|narrative|fiction)\\b/i\n    ],\n    weight: 0.9\n  },\n  {\n    tag: 'analysis',\n    patterns: [\n      /\\b(analysis|analyzing|examine|examining|evaluate|evaluating)\\b/i,\n      /\\b(pros and cons|advantages|disadvantages|strengths|weaknesses)\\b/i,\n      /\\b(factors|considerations|implications)\\b/i\n    ],\n    weight: 0.8\n  },\n  {\n    tag: 'comparison',\n    patterns: [\n      /\\b(compared to|versus|vs\\.?|differ|difference|similar|unlike|whereas)\\b/i,\n      /\\b(on the other hand|in contrast|alternatively)\\b/i\n    ],\n    weight: 0.9\n  },\n  {\n    tag: 'definition',\n    patterns: [\n      /\\b(is defined as|refers to|means|is a|are a)\\b/i,\n      /\\b(definition|meaning|concept of)\\b/i\n    ],\n    weight: 0.7\n  },\n  {\n    tag: 'translation',\n    patterns: [\n      /\\b(translates? to|in [a-z]+ language|translation)\\b/i\n    ],\n    weight: 1.0\n  },\n  {\n    tag: 'conversation',\n    patterns: [\n      /\\b(hi|hello|hey|thanks|thank you|you're welcome|sure|okay|ok)\\b/i,\n      /\\b(I think|I believe|in my opinion|personally)\\b/i\n    ],\n    weight: 0.5\n  },\n  {\n    tag: 'data',\n    patterns: [\n      /\\b(data|dataset|statistics|numbers|figures|metrics)\\b/i,\n      /\\d+%|\\d+\\.\\d+/,\n      /\\b(table|chart|graph)\\b/i\n    ],\n    weight: 0.7\n  }\n];\n\n/**\n * Detects intent candidates from text.\n * \n * @param text - The text to analyze\n * @returns Array of intent candidates sorted by confidence\n */\nexport function detectIntent(text: string): IntentCandidate[] {\n  const candidates: IntentCandidate[] = [];\n  const words = tokenize(text);\n  const bullets = countBullets(text);\n  \n  for (const { tag, patterns, weight } of INTENT_PATTERNS) {\n    let matchCount = 0;\n    const signals: string[] = [];\n    \n    for (const pattern of patterns) {\n      if (pattern.test(text)) {\n        matchCount++;\n        signals.push(pattern.source.substring(0, 30));\n      }\n    }\n    \n    if (matchCount > 0) {\n      // Calculate confidence based on matches and text characteristics\n      let confidence = (matchCount / patterns.length) * weight;\n      \n      // Boost for structural matches\n      if (tag === 'list' && bullets >= 3) {\n        confidence = Math.min(1, confidence + 0.3);\n      }\n      if (tag === 'code' && text.includes('```')) {\n        confidence = Math.min(1, confidence + 0.4);\n      }\n      \n      // Normalize by text length (longer text = more reliable)\n      if (words.length < 20) {\n        confidence *= 0.7;\n      } else if (words.length > 100) {\n        confidence = Math.min(1, confidence * 1.1);\n      }\n      \n      candidates.push({\n        tag,\n        confidence: Math.round(confidence * 100) / 100,\n        signals\n      });\n    }\n  }\n  \n  // Sort by confidence descending\n  candidates.sort((a, b) => b.confidence - a.confidence);\n  \n  // If no candidates, return unknown\n  if (candidates.length === 0) {\n    candidates.push({\n      tag: 'unknown',\n      confidence: 0.5,\n      signals: ['no_patterns_matched']\n    });\n  }\n  \n  return candidates;\n}\n\n/**\n * Gets the primary intent from candidates.\n */\nexport function getPrimaryIntent(candidates: IntentCandidate[]): IntentTag | null {\n  if (candidates.length === 0) return null;\n  \n  const top = candidates[0];\n  // Only return if confidence is reasonable\n  if (top.confidence >= 0.3) {\n    return top.tag;\n  }\n  \n  return null;\n}\n"]}