llmverify
Version:
AI Output Verification Toolkit — Local-first LLM safety, hallucination detection, PII redaction, prompt injection defense, and runtime monitoring. Zero telemetry. OWASP LLM Top 10 aligned.
197 lines • 17.5 kB
JavaScript
;
/**
* Intent Detection Module
*
* Detects the primary intent/purpose of LLM output.
*
* @module engines/classification/intent
* @author Haiec
* @license MIT
*/
Object.defineProperty(exports, "__esModule", { value: true });
exports.detectIntent = detectIntent;
exports.getPrimaryIntent = getPrimaryIntent;
const utils_1 = require("./utils");
/**
* Intent detection patterns.
*/
const INTENT_PATTERNS = [
{
tag: 'summary',
patterns: [
/\b(in summary|to summarize|overall|in conclusion|key points?|main points?)\b/i,
/\b(tldr|tl;dr|brief overview)\b/i
],
weight: 1.0
},
{
tag: 'explanation',
patterns: [
/\b(because|therefore|this means|in other words|for example|such as)\b/i,
/\b(the reason|explains?|due to|as a result)\b/i,
/\b(works by|functions by|operates by)\b/i
],
weight: 0.8
},
{
tag: 'code',
patterns: [
/```[\s\S]*```/,
/\b(function|const|let|var|class|import|export|return|if|else|for|while)\b/,
/[{}\[\]();]=>/,
/\b(def|async|await|try|catch)\b/
],
weight: 1.0
},
{
tag: 'list',
patterns: [
/^[-*•]\s+/m,
/^\d+[.)]\s+/m,
/\b(here are|the following|steps?:|items?:)\b/i
],
weight: 0.9
},
{
tag: 'question',
patterns: [
/\?$/m,
/\b(what|why|how|when|where|who|which|would you|could you|can you)\b/i
],
weight: 0.7
},
{
tag: 'instruction',
patterns: [
/\b(step \d|first,?|then,?|next,?|finally,?|make sure|ensure|remember to)\b/i,
/\b(you should|you need to|you must|please|do not|don't)\b/i
],
weight: 0.8
},
{
tag: 'creative',
patterns: [
/\b(once upon|imagine|picture this|in a world)\b/i,
/\b(poem|story|tale|narrative|fiction)\b/i
],
weight: 0.9
},
{
tag: 'analysis',
patterns: [
/\b(analysis|analyzing|examine|examining|evaluate|evaluating)\b/i,
/\b(pros and cons|advantages|disadvantages|strengths|weaknesses)\b/i,
/\b(factors|considerations|implications)\b/i
],
weight: 0.8
},
{
tag: 'comparison',
patterns: [
/\b(compared to|versus|vs\.?|differ|difference|similar|unlike|whereas)\b/i,
/\b(on the other hand|in contrast|alternatively)\b/i
],
weight: 0.9
},
{
tag: 'definition',
patterns: [
/\b(is defined as|refers to|means|is a|are a)\b/i,
/\b(definition|meaning|concept of)\b/i
],
weight: 0.7
},
{
tag: 'translation',
patterns: [
/\b(translates? to|in [a-z]+ language|translation)\b/i
],
weight: 1.0
},
{
tag: 'conversation',
patterns: [
/\b(hi|hello|hey|thanks|thank you|you're welcome|sure|okay|ok)\b/i,
/\b(I think|I believe|in my opinion|personally)\b/i
],
weight: 0.5
},
{
tag: 'data',
patterns: [
/\b(data|dataset|statistics|numbers|figures|metrics)\b/i,
/\d+%|\d+\.\d+/,
/\b(table|chart|graph)\b/i
],
weight: 0.7
}
];
/**
* Detects intent candidates from text.
*
* @param text - The text to analyze
* @returns Array of intent candidates sorted by confidence
*/
function detectIntent(text) {
const candidates = [];
const words = (0, utils_1.tokenize)(text);
const bullets = (0, utils_1.countBullets)(text);
for (const { tag, patterns, weight } of INTENT_PATTERNS) {
let matchCount = 0;
const signals = [];
for (const pattern of patterns) {
if (pattern.test(text)) {
matchCount++;
signals.push(pattern.source.substring(0, 30));
}
}
if (matchCount > 0) {
// Calculate confidence based on matches and text characteristics
let confidence = (matchCount / patterns.length) * weight;
// Boost for structural matches
if (tag === 'list' && bullets >= 3) {
confidence = Math.min(1, confidence + 0.3);
}
if (tag === 'code' && text.includes('```')) {
confidence = Math.min(1, confidence + 0.4);
}
// Normalize by text length (longer text = more reliable)
if (words.length < 20) {
confidence *= 0.7;
}
else if (words.length > 100) {
confidence = Math.min(1, confidence * 1.1);
}
candidates.push({
tag,
confidence: Math.round(confidence * 100) / 100,
signals
});
}
}
// Sort by confidence descending
candidates.sort((a, b) => b.confidence - a.confidence);
// If no candidates, return unknown
if (candidates.length === 0) {
candidates.push({
tag: 'unknown',
confidence: 0.5,
signals: ['no_patterns_matched']
});
}
return candidates;
}
/**
* Gets the primary intent from candidates.
*/
function getPrimaryIntent(candidates) {
if (candidates.length === 0)
return null;
const top = candidates[0];
// Only return if confidence is reasonable
if (top.confidence >= 0.3) {
return top.tag;
}
return null;
}
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"intent.js","sourceRoot":"","sources":["../../../src/engines/classification/intent.ts"],"names":[],"mappings":";AAAA;;;;;;;;GAQG;;AAkIH,oCAwDC;AAKD,4CAUC;AAtMD,mCAAiD;AAEjD;;GAEG;AACH,MAAM,eAAe,GAIhB;IACH;QACE,GAAG,EAAE,SAAS;QACd,QAAQ,EAAE;YACR,+EAA+E;YAC/E,kCAAkC;SACnC;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,aAAa;QAClB,QAAQ,EAAE;YACR,wEAAwE;YACxE,gDAAgD;YAChD,0CAA0C;SAC3C;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,MAAM;QACX,QAAQ,EAAE;YACR,eAAe;YACf,2EAA2E;YAC3E,eAAe;YACf,iCAAiC;SAClC;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,MAAM;QACX,QAAQ,EAAE;YACR,YAAY;YACZ,cAAc;YACd,+CAA+C;SAChD;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,UAAU;QACf,QAAQ,EAAE;YACR,MAAM;YACN,sEAAsE;SACvE;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,aAAa;QAClB,QAAQ,EAAE;YACR,6EAA6E;YAC7E,4DAA4D;SAC7D;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,UAAU;QACf,QAAQ,EAAE;YACR,kDAAkD;YAClD,0CAA0C;SAC3C;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,UAAU;QACf,QAAQ,EAAE;YACR,iEAAiE;YACjE,oEAAoE;YACpE,4CAA4C;SAC7C;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,YAAY;QACjB,QAAQ,EAAE;YACR,0EAA0E;YAC1E,oDAAoD;SACrD;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,YAAY;QACjB,QAAQ,EAAE;YACR,iDAAiD;YACjD,sCAAsC;SACvC;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,aAAa;QAClB,QAAQ,EAAE;YACR,sDAAsD;SACvD;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,cAAc;QACnB,QAAQ,EAAE;YACR,kEAAkE;YAClE,mDAAmD;SACpD;QACD,MAAM,EAAE,GAAG;KACZ;IACD;QACE,GAAG,EAAE,MAAM;QACX,QAAQ,EAAE;YACR,wDAAwD;YACxD,eAAe;YACf,0BAA0B;SAC3B;QACD,MAAM,EAAE,GAAG;KACZ;CACF,CAAC;AAEF;;;;;GAKG;AACH,SAAgB,YAAY,CAAC,IAAY;IACvC,MAAM,UAAU,GAAsB,EAAE,CAAC;IACzC,MAAM,KAAK,GAAG,IAAA,gBAAQ,EAAC,IAAI,CAAC,CAAC;IAC7B,MAAM,OAAO,GAAG,IAAA,oBAAY,EAAC,IAAI,CAAC,CAAC;IAEnC,KAAK,MAAM,EAAE,GAAG,EAAE,QAAQ,EAAE,MAAM,EAAE,IAAI,eAAe,EAAE,CAAC;QACxD,IAAI,UAAU,GAAG,CAAC,CAAC;QACnB,MAAM,OAAO,GAAa,EAAE,CAAC;QAE7B,KAAK,MAAM,OAAO,IAAI,QAAQ,EAAE,CAAC;YAC/B,IAAI,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC;gBACvB,UAAU,EAAE,CAAC;gBACb,OAAO,CAAC,IAAI,CAAC,OAAO,CAAC,MAAM,CAAC,SAAS,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC;YAChD,CAAC;QACH,CAAC;QAED,IAAI,UAAU,GAAG,CAAC,EAAE,CAAC;YACnB,iEAAiE;YACjE,IAAI,UAAU,GAAG,CAAC,UAAU,GAAG,QAAQ,CAAC,MAAM,CAAC,GAAG,MAAM,CAAC;YAEzD,+BAA+B;YAC/B,IAAI,GAAG,KAAK,MAAM,IAAI,OAAO,IAAI,CAAC,EAAE,CAAC;gBACnC,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,UAAU,GAAG,GAAG,CAAC,CAAC;YAC7C,CAAC;YACD,IAAI,GAAG,KAAK,MAAM,IAAI,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;gBAC3C,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,UAAU,GAAG,GAAG,CAAC,CAAC;YAC7C,CAAC;YAED,yDAAyD;YACzD,IAAI,KAAK,CAAC,MAAM,GAAG,EAAE,EAAE,CAAC;gBACtB,UAAU,IAAI,GAAG,CAAC;YACpB,CAAC;iBAAM,IAAI,KAAK,CAAC,MAAM,GAAG,GAAG,EAAE,CAAC;gBAC9B,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,EAAE,UAAU,GAAG,GAAG,CAAC,CAAC;YAC7C,CAAC;YAED,UAAU,CAAC,IAAI,CAAC;gBACd,GAAG;gBACH,UAAU,EAAE,IAAI,CAAC,KAAK,CAAC,UAAU,GAAG,GAAG,CAAC,GAAG,GAAG;gBAC9C,OAAO;aACR,CAAC,CAAC;QACL,CAAC;IACH,CAAC;IAED,gCAAgC;IAChC,UAAU,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,UAAU,GAAG,CAAC,CAAC,UAAU,CAAC,CAAC;IAEvD,mCAAmC;IACnC,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAC5B,UAAU,CAAC,IAAI,CAAC;YACd,GAAG,EAAE,SAAS;YACd,UAAU,EAAE,GAAG;YACf,OAAO,EAAE,CAAC,qBAAqB,CAAC;SACjC,CAAC,CAAC;IACL,CAAC;IAED,OAAO,UAAU,CAAC;AACpB,CAAC;AAED;;GAEG;AACH,SAAgB,gBAAgB,CAAC,UAA6B;IAC5D,IAAI,UAAU,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,IAAI,CAAC;IAEzC,MAAM,GAAG,GAAG,UAAU,CAAC,CAAC,CAAC,CAAC;IAC1B,0CAA0C;IAC1C,IAAI,GAAG,CAAC,UAAU,IAAI,GAAG,EAAE,CAAC;QAC1B,OAAO,GAAG,CAAC,GAAG,CAAC;IACjB,CAAC;IAED,OAAO,IAAI,CAAC;AACd,CAAC","sourcesContent":["/**\n * Intent Detection Module\n * \n * Detects the primary intent/purpose of LLM output.\n * \n * @module engines/classification/intent\n * @author Haiec\n * @license MIT\n */\n\nimport { IntentTag, IntentCandidate } from './types';\nimport { countBullets, tokenize } from './utils';\n\n/**\n * Intent detection patterns.\n */\nconst INTENT_PATTERNS: Array<{\n  tag: IntentTag;\n  patterns: RegExp[];\n  weight: number;\n}> = [\n  {\n    tag: 'summary',\n    patterns: [\n      /\\b(in summary|to summarize|overall|in conclusion|key points?|main points?)\\b/i,\n      /\\b(tldr|tl;dr|brief overview)\\b/i\n    ],\n    weight: 1.0\n  },\n  {\n    tag: 'explanation',\n    patterns: [\n      /\\b(because|therefore|this means|in other words|for example|such as)\\b/i,\n      /\\b(the reason|explains?|due to|as a result)\\b/i,\n      /\\b(works by|functions by|operates by)\\b/i\n    ],\n    weight: 0.8\n  },\n  {\n    tag: 'code',\n    patterns: [\n      /```[\\s\\S]*```/,\n      /\\b(function|const|let|var|class|import|export|return|if|else|for|while)\\b/,\n      /[{}\\[\\]();]=>/,\n      /\\b(def|async|await|try|catch)\\b/\n    ],\n    weight: 1.0\n  },\n  {\n    tag: 'list',\n    patterns: [\n      /^[-*•]\\s+/m,\n      /^\\d+[.)]\\s+/m,\n      /\\b(here are|the following|steps?:|items?:)\\b/i\n    ],\n    weight: 0.9\n  },\n  {\n    tag: 'question',\n    patterns: [\n      /\\?$/m,\n      /\\b(what|why|how|when|where|who|which|would you|could you|can you)\\b/i\n    ],\n    weight: 0.7\n  },\n  {\n    tag: 'instruction',\n    patterns: [\n      /\\b(step \\d|first,?|then,?|next,?|finally,?|make sure|ensure|remember to)\\b/i,\n      /\\b(you should|you need to|you must|please|do not|don't)\\b/i\n    ],\n    weight: 0.8\n  },\n  {\n    tag: 'creative',\n    patterns: [\n      /\\b(once upon|imagine|picture this|in a world)\\b/i,\n      /\\b(poem|story|tale|narrative|fiction)\\b/i\n    ],\n    weight: 0.9\n  },\n  {\n    tag: 'analysis',\n    patterns: [\n      /\\b(analysis|analyzing|examine|examining|evaluate|evaluating)\\b/i,\n      /\\b(pros and cons|advantages|disadvantages|strengths|weaknesses)\\b/i,\n      /\\b(factors|considerations|implications)\\b/i\n    ],\n    weight: 0.8\n  },\n  {\n    tag: 'comparison',\n    patterns: [\n      /\\b(compared to|versus|vs\\.?|differ|difference|similar|unlike|whereas)\\b/i,\n      /\\b(on the other hand|in contrast|alternatively)\\b/i\n    ],\n    weight: 0.9\n  },\n  {\n    tag: 'definition',\n    patterns: [\n      /\\b(is defined as|refers to|means|is a|are a)\\b/i,\n      /\\b(definition|meaning|concept of)\\b/i\n    ],\n    weight: 0.7\n  },\n  {\n    tag: 'translation',\n    patterns: [\n      /\\b(translates? to|in [a-z]+ language|translation)\\b/i\n    ],\n    weight: 1.0\n  },\n  {\n    tag: 'conversation',\n    patterns: [\n      /\\b(hi|hello|hey|thanks|thank you|you're welcome|sure|okay|ok)\\b/i,\n      /\\b(I think|I believe|in my opinion|personally)\\b/i\n    ],\n    weight: 0.5\n  },\n  {\n    tag: 'data',\n    patterns: [\n      /\\b(data|dataset|statistics|numbers|figures|metrics)\\b/i,\n      /\\d+%|\\d+\\.\\d+/,\n      /\\b(table|chart|graph)\\b/i\n    ],\n    weight: 0.7\n  }\n];\n\n/**\n * Detects intent candidates from text.\n * \n * @param text - The text to analyze\n * @returns Array of intent candidates sorted by confidence\n */\nexport function detectIntent(text: string): IntentCandidate[] {\n  const candidates: IntentCandidate[] = [];\n  const words = tokenize(text);\n  const bullets = countBullets(text);\n  \n  for (const { tag, patterns, weight } of INTENT_PATTERNS) {\n    let matchCount = 0;\n    const signals: string[] = [];\n    \n    for (const pattern of patterns) {\n      if (pattern.test(text)) {\n        matchCount++;\n        signals.push(pattern.source.substring(0, 30));\n      }\n    }\n    \n    if (matchCount > 0) {\n      // Calculate confidence based on matches and text characteristics\n      let confidence = (matchCount / patterns.length) * weight;\n      \n      // Boost for structural matches\n      if (tag === 'list' && bullets >= 3) {\n        confidence = Math.min(1, confidence + 0.3);\n      }\n      if (tag === 'code' && text.includes('```')) {\n        confidence = Math.min(1, confidence + 0.4);\n      }\n      \n      // Normalize by text length (longer text = more reliable)\n      if (words.length < 20) {\n        confidence *= 0.7;\n      } else if (words.length > 100) {\n        confidence = Math.min(1, confidence * 1.1);\n      }\n      \n      candidates.push({\n        tag,\n        confidence: Math.round(confidence * 100) / 100,\n        signals\n      });\n    }\n  }\n  \n  // Sort by confidence descending\n  candidates.sort((a, b) => b.confidence - a.confidence);\n  \n  // If no candidates, return unknown\n  if (candidates.length === 0) {\n    candidates.push({\n      tag: 'unknown',\n      confidence: 0.5,\n      signals: ['no_patterns_matched']\n    });\n  }\n  \n  return candidates;\n}\n\n/**\n * Gets the primary intent from candidates.\n */\nexport function getPrimaryIntent(candidates: IntentCandidate[]): IntentTag | null {\n  if (candidates.length === 0) return null;\n  \n  const top = candidates[0];\n  // Only return if confidence is reasonable\n  if (top.confidence >= 0.3) {\n    return top.tag;\n  }\n  \n  return null;\n}\n"]}