UNPKG

llmverify

Version:

AI Output Verification Toolkit — Local-first LLM safety, hallucination detection, PII redaction, prompt injection defense, and runtime monitoring. Zero telemetry. OWASP LLM Top 10 aligned.

107 lines 12.2 kB
"use strict"; /** * Text Similarity Utilities * * Simple similarity measures for consistency checking. * * @module utils/similarity * @author Haiec * @license MIT */ Object.defineProperty(exports, "__esModule", { value: true }); exports.jaccardSimilarity = jaccardSimilarity; exports.cosineSimilarity = cosineSimilarity; exports.levenshteinDistance = levenshteinDistance; exports.levenshteinSimilarity = levenshteinSimilarity; exports.combinedSimilarity = combinedSimilarity; /** * Calculate Jaccard similarity between two texts */ function jaccardSimilarity(text1, text2) { const words1 = new Set(text1.toLowerCase().split(/\s+/)); const words2 = new Set(text2.toLowerCase().split(/\s+/)); const intersection = new Set([...words1].filter(x => words2.has(x))); const union = new Set([...words1, ...words2]); if (union.size === 0) return 1; return intersection.size / union.size; } /** * Calculate cosine similarity using word frequency vectors */ function cosineSimilarity(text1, text2) { const freq1 = getWordFrequency(text1); const freq2 = getWordFrequency(text2); const allWords = new Set([...Object.keys(freq1), ...Object.keys(freq2)]); let dotProduct = 0; let norm1 = 0; let norm2 = 0; for (const word of allWords) { const v1 = freq1[word] || 0; const v2 = freq2[word] || 0; dotProduct += v1 * v2; norm1 += v1 * v1; norm2 += v2 * v2; } if (norm1 === 0 || norm2 === 0) return 0; return dotProduct / (Math.sqrt(norm1) * Math.sqrt(norm2)); } /** * Get word frequency map */ function getWordFrequency(text) { const words = text.toLowerCase().split(/\s+/); const freq = {}; for (const word of words) { if (word.length > 0) { freq[word] = (freq[word] || 0) + 1; } } return freq; } /** * Calculate Levenshtein distance between two strings */ function levenshteinDistance(str1, str2) { const m = str1.length; const n = str2.length; const dp = Array(m + 1) .fill(null) .map(() => Array(n + 1).fill(0)); for (let i = 0; i <= m; i++) dp[i][0] = i; for (let j = 0; j <= n; j++) dp[0][j] = j; for (let i = 1; i <= m; i++) { for (let j = 1; j <= n; j++) { if (str1[i - 1] === str2[j - 1]) { dp[i][j] = dp[i - 1][j - 1]; } else { dp[i][j] = 1 + Math.min(dp[i - 1][j], dp[i][j - 1], dp[i - 1][j - 1]); } } } return dp[m][n]; } /** * Calculate normalized Levenshtein similarity (0-1) */ function levenshteinSimilarity(str1, str2) { const maxLen = Math.max(str1.length, str2.length); if (maxLen === 0) return 1; const distance = levenshteinDistance(str1, str2); return 1 - distance / maxLen; } /** * Combined similarity score using multiple methods */ function combinedSimilarity(text1, text2) { const jaccard = jaccardSimilarity(text1, text2); const cosine = cosineSimilarity(text1, text2); // Weighted average return jaccard * 0.4 + cosine * 0.6; } //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"similarity.js","sourceRoot":"","sources":["../../src/utils/similarity.ts"],"names":[],"mappings":";AAAA;;;;;;;;GAQG;;AAKH,8CAUC;AAKD,4CAsBC;AAqBD,kDA0BC;AAKD,sDAMC;AAKD,gDAMC;AA7GD;;GAEG;AACH,SAAgB,iBAAiB,CAAC,KAAa,EAAE,KAAa;IAC5D,MAAM,MAAM,GAAG,IAAI,GAAG,CAAC,KAAK,CAAC,WAAW,EAAE,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,CAAC;IACzD,MAAM,MAAM,GAAG,IAAI,GAAG,CAAC,KAAK,CAAC,WAAW,EAAE,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,CAAC;IAEzD,MAAM,YAAY,GAAG,IAAI,GAAG,CAAC,CAAC,GAAG,MAAM,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;IACrE,MAAM,KAAK,GAAG,IAAI,GAAG,CAAC,CAAC,GAAG,MAAM,EAAE,GAAG,MAAM,CAAC,CAAC,CAAC;IAE9C,IAAI,KAAK,CAAC,IAAI,KAAK,CAAC;QAAE,OAAO,CAAC,CAAC;IAE/B,OAAO,YAAY,CAAC,IAAI,GAAG,KAAK,CAAC,IAAI,CAAC;AACxC,CAAC;AAED;;GAEG;AACH,SAAgB,gBAAgB,CAAC,KAAa,EAAE,KAAa;IAC3D,MAAM,KAAK,GAAG,gBAAgB,CAAC,KAAK,CAAC,CAAC;IACtC,MAAM,KAAK,GAAG,gBAAgB,CAAC,KAAK,CAAC,CAAC;IAEtC,MAAM,QAAQ,GAAG,IAAI,GAAG,CAAC,CAAC,GAAG,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,EAAE,GAAG,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;IAEzE,IAAI,UAAU,GAAG,CAAC,CAAC;IACnB,IAAI,KAAK,GAAG,CAAC,CAAC;IACd,IAAI,KAAK,GAAG,CAAC,CAAC;IAEd,KAAK,MAAM,IAAI,IAAI,QAAQ,EAAE,CAAC;QAC5B,MAAM,EAAE,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAC5B,MAAM,EAAE,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAE5B,UAAU,IAAI,EAAE,GAAG,EAAE,CAAC;QACtB,KAAK,IAAI,EAAE,GAAG,EAAE,CAAC;QACjB,KAAK,IAAI,EAAE,GAAG,EAAE,CAAC;IACnB,CAAC;IAED,IAAI,KAAK,KAAK,CAAC,IAAI,KAAK,KAAK,CAAC;QAAE,OAAO,CAAC,CAAC;IAEzC,OAAO,UAAU,GAAG,CAAC,IAAI,CAAC,IAAI,CAAC,KAAK,CAAC,GAAG,IAAI,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC,CAAC;AAC5D,CAAC;AAED;;GAEG;AACH,SAAS,gBAAgB,CAAC,IAAY;IACpC,MAAM,KAAK,GAAG,IAAI,CAAC,WAAW,EAAE,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC;IAC9C,MAAM,IAAI,GAA2B,EAAE,CAAC;IAExC,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,IAAI,IAAI,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YACpB,IAAI,CAAC,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC,GAAG,CAAC,CAAC;QACrC,CAAC;IACH,CAAC;IAED,OAAO,IAAI,CAAC;AACd,CAAC;AAED;;GAEG;AACH,SAAgB,mBAAmB,CAAC,IAAY,EAAE,IAAY;IAC5D,MAAM,CAAC,GAAG,IAAI,CAAC,MAAM,CAAC;IACtB,MAAM,CAAC,GAAG,IAAI,CAAC,MAAM,CAAC;IAEtB,MAAM,EAAE,GAAe,KAAK,CAAC,CAAC,GAAG,CAAC,CAAC;SAChC,IAAI,CAAC,IAAI,CAAC;SACV,GAAG,CAAC,GAAG,EAAE,CAAC,KAAK,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,CAAC;IAEnC,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE;QAAE,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;IAC1C,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE;QAAE,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;IAE1C,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;QAC5B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;YAC5B,IAAI,IAAI,CAAC,CAAC,GAAG,CAAC,CAAC,KAAK,IAAI,CAAC,CAAC,GAAG,CAAC,CAAC,EAAE,CAAC;gBAChC,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;YAC9B,CAAC;iBAAM,CAAC;gBACN,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,GAAG,IAAI,CAAC,GAAG,CACrB,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,EACZ,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,EACZ,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CACjB,CAAC;YACJ,CAAC;QACH,CAAC;IACH,CAAC;IAED,OAAO,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;AAClB,CAAC;AAED;;GAEG;AACH,SAAgB,qBAAqB,CAAC,IAAY,EAAE,IAAY;IAC9D,MAAM,MAAM,GAAG,IAAI,CAAC,GAAG,CAAC,IAAI,CAAC,MAAM,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;IAClD,IAAI,MAAM,KAAK,CAAC;QAAE,OAAO,CAAC,CAAC;IAE3B,MAAM,QAAQ,GAAG,mBAAmB,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC;IACjD,OAAO,CAAC,GAAG,QAAQ,GAAG,MAAM,CAAC;AAC/B,CAAC;AAED;;GAEG;AACH,SAAgB,kBAAkB,CAAC,KAAa,EAAE,KAAa;IAC7D,MAAM,OAAO,GAAG,iBAAiB,CAAC,KAAK,EAAE,KAAK,CAAC,CAAC;IAChD,MAAM,MAAM,GAAG,gBAAgB,CAAC,KAAK,EAAE,KAAK,CAAC,CAAC;IAE9C,mBAAmB;IACnB,OAAO,OAAO,GAAG,GAAG,GAAG,MAAM,GAAG,GAAG,CAAC;AACtC,CAAC","sourcesContent":["/**\n * Text Similarity Utilities\n * \n * Simple similarity measures for consistency checking.\n * \n * @module utils/similarity\n * @author Haiec\n * @license MIT\n */\n\n/**\n * Calculate Jaccard similarity between two texts\n */\nexport function jaccardSimilarity(text1: string, text2: string): number {\n  const words1 = new Set(text1.toLowerCase().split(/\\s+/));\n  const words2 = new Set(text2.toLowerCase().split(/\\s+/));\n  \n  const intersection = new Set([...words1].filter(x => words2.has(x)));\n  const union = new Set([...words1, ...words2]);\n  \n  if (union.size === 0) return 1;\n  \n  return intersection.size / union.size;\n}\n\n/**\n * Calculate cosine similarity using word frequency vectors\n */\nexport function cosineSimilarity(text1: string, text2: string): number {\n  const freq1 = getWordFrequency(text1);\n  const freq2 = getWordFrequency(text2);\n  \n  const allWords = new Set([...Object.keys(freq1), ...Object.keys(freq2)]);\n  \n  let dotProduct = 0;\n  let norm1 = 0;\n  let norm2 = 0;\n  \n  for (const word of allWords) {\n    const v1 = freq1[word] || 0;\n    const v2 = freq2[word] || 0;\n    \n    dotProduct += v1 * v2;\n    norm1 += v1 * v1;\n    norm2 += v2 * v2;\n  }\n  \n  if (norm1 === 0 || norm2 === 0) return 0;\n  \n  return dotProduct / (Math.sqrt(norm1) * Math.sqrt(norm2));\n}\n\n/**\n * Get word frequency map\n */\nfunction getWordFrequency(text: string): Record<string, number> {\n  const words = text.toLowerCase().split(/\\s+/);\n  const freq: Record<string, number> = {};\n  \n  for (const word of words) {\n    if (word.length > 0) {\n      freq[word] = (freq[word] || 0) + 1;\n    }\n  }\n  \n  return freq;\n}\n\n/**\n * Calculate Levenshtein distance between two strings\n */\nexport function levenshteinDistance(str1: string, str2: string): number {\n  const m = str1.length;\n  const n = str2.length;\n  \n  const dp: number[][] = Array(m + 1)\n    .fill(null)\n    .map(() => Array(n + 1).fill(0));\n  \n  for (let i = 0; i <= m; i++) dp[i][0] = i;\n  for (let j = 0; j <= n; j++) dp[0][j] = j;\n  \n  for (let i = 1; i <= m; i++) {\n    for (let j = 1; j <= n; j++) {\n      if (str1[i - 1] === str2[j - 1]) {\n        dp[i][j] = dp[i - 1][j - 1];\n      } else {\n        dp[i][j] = 1 + Math.min(\n          dp[i - 1][j],\n          dp[i][j - 1],\n          dp[i - 1][j - 1]\n        );\n      }\n    }\n  }\n  \n  return dp[m][n];\n}\n\n/**\n * Calculate normalized Levenshtein similarity (0-1)\n */\nexport function levenshteinSimilarity(str1: string, str2: string): number {\n  const maxLen = Math.max(str1.length, str2.length);\n  if (maxLen === 0) return 1;\n  \n  const distance = levenshteinDistance(str1, str2);\n  return 1 - distance / maxLen;\n}\n\n/**\n * Combined similarity score using multiple methods\n */\nexport function combinedSimilarity(text1: string, text2: string): number {\n  const jaccard = jaccardSimilarity(text1, text2);\n  const cosine = cosineSimilarity(text1, text2);\n  \n  // Weighted average\n  return jaccard * 0.4 + cosine * 0.6;\n}\n"]}