llmverify
Version:
AI Output Verification Toolkit — Local-first LLM safety, hallucination detection, PII redaction, prompt injection defense, and runtime monitoring. Zero telemetry. OWASP LLM Top 10 aligned.
189 lines • 23.2 kB
JavaScript
;
/**
* Instruction-Following Evaluation Module
*
* Evaluates whether LLM output follows specified instruction rules.
*
* @module engines/classification/instruction-eval
* @author Haiec
* @license MIT
*/
Object.defineProperty(exports, "__esModule", { value: true });
exports.evaluateInstructionRules = evaluateInstructionRules;
const utils_1 = require("./utils");
/**
* Evaluates a format rule.
*/
function evaluateFormatRule(rule, text, isJson, bullets, sentences) {
const expect = rule.params.expect;
switch (expect) {
case 'json':
return {
id: rule.id,
passed: isJson,
reason: isJson ? undefined : 'Expected JSON output but none found'
};
case 'list':
return {
id: rule.id,
passed: bullets >= 1,
reason: bullets >= 1 ? undefined : 'Expected list format but no list items found'
};
case 'paragraph':
const isParagraph = bullets === 0 && sentences >= 2;
return {
id: rule.id,
passed: isParagraph,
reason: isParagraph ? undefined : 'Expected paragraph format'
};
case 'code':
const hasCode = /```[\s\S]*```/.test(text) || /^\s{4,}|\t/m.test(text);
return {
id: rule.id,
passed: hasCode,
reason: hasCode ? undefined : 'Expected code block but none found'
};
default:
return { id: rule.id, passed: true };
}
}
/**
* Evaluates a length rule.
*/
function evaluateLengthRule(rule, words, bullets) {
const { minWords, maxWords, minBullets, maxBullets } = rule.params;
const failures = [];
if (minWords !== undefined && words < minWords) {
failures.push(`Expected at least ${minWords} words, got ${words}`);
}
if (maxWords !== undefined && words > maxWords) {
failures.push(`Expected at most ${maxWords} words, got ${words}`);
}
if (minBullets !== undefined && bullets < minBullets) {
failures.push(`Expected at least ${minBullets} list items, got ${bullets}`);
}
if (maxBullets !== undefined && bullets > maxBullets) {
failures.push(`Expected at most ${maxBullets} list items, got ${bullets}`);
}
return {
id: rule.id,
passed: failures.length === 0,
reason: failures.length > 0 ? failures[0] : undefined
};
}
/**
* Evaluates an include rule.
*/
function evaluateIncludeRule(rule, text) {
const terms = rule.params.terms || [];
const lower = text.toLowerCase();
const missing = terms.filter(t => !lower.includes(t.toLowerCase()));
return {
id: rule.id,
passed: missing.length === 0,
reason: missing.length > 0 ? `Missing required terms: ${missing.join(', ')}` : undefined
};
}
/**
* Evaluates an exclude rule.
*/
function evaluateExcludeRule(rule, text) {
const terms = rule.params.terms || [];
const lower = text.toLowerCase();
const found = terms.filter(t => lower.includes(t.toLowerCase()));
return {
id: rule.id,
passed: found.length === 0,
reason: found.length > 0 ? `Found forbidden terms: ${found.join(', ')}` : undefined
};
}
/**
* Evaluates a schema rule.
*/
function evaluateSchemaRule(rule, normalizedJson) {
if (!normalizedJson || typeof normalizedJson !== 'object' || Array.isArray(normalizedJson)) {
return {
id: rule.id,
passed: false,
reason: 'Expected JSON object for schema validation'
};
}
const requiredKeys = rule.params.requiredKeys || [];
const obj = normalizedJson;
const missing = requiredKeys.filter(k => !(k in obj));
return {
id: rule.id,
passed: missing.length === 0,
reason: missing.length > 0 ? `Missing required keys: ${missing.join(', ')}` : undefined
};
}
/**
* Evaluates a coverage rule.
*/
function evaluateCoverageRule(rule, text) {
const entities = rule.params.entities || [];
const lower = text.toLowerCase();
const missing = entities.filter(e => !lower.includes(e.toLowerCase()));
return {
id: rule.id,
passed: missing.length === 0,
reason: missing.length > 0 ? `Missing coverage of: ${missing.join(', ')}` : undefined
};
}
/**
* Evaluates all instruction rules against output.
*
* @param text - The output text
* @param normalizedJson - Parsed JSON if available
* @param rules - Instruction rules to evaluate
* @param isJson - Whether output is valid JSON
* @returns Evaluation result with compliance ratio
*/
function evaluateInstructionRules(text, normalizedJson, rules, isJson) {
if (!rules || rules.length === 0) {
return {
ruleResults: [],
complianceRatio: 1,
instructionFollowed: true
};
}
const words = (0, utils_1.tokenize)(text).length;
const bullets = (0, utils_1.countBullets)(text);
const sentences = text.split(/[.!?]+/).filter(s => s.trim().length > 0).length;
const ruleResults = [];
for (const rule of rules) {
let result;
switch (rule.type) {
case 'format':
result = evaluateFormatRule(rule, text, isJson, bullets, sentences);
break;
case 'length':
result = evaluateLengthRule(rule, words, bullets);
break;
case 'include':
result = evaluateIncludeRule(rule, text);
break;
case 'exclude':
result = evaluateExcludeRule(rule, text);
break;
case 'schema':
result = evaluateSchemaRule(rule, normalizedJson);
break;
case 'coverage':
result = evaluateCoverageRule(rule, text);
break;
default:
result = { id: rule.id, passed: true };
}
ruleResults.push(result);
}
const passedCount = ruleResults.filter(r => r.passed).length;
const complianceRatio = rules.length > 0 ? passedCount / rules.length : 1;
const instructionFollowed = complianceRatio >= 0.8;
return {
ruleResults,
complianceRatio,
instructionFollowed
};
}
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"instruction-eval.js","sourceRoot":"","sources":["../../../src/engines/classification/instruction-eval.ts"],"names":[],"mappings":";AAAA;;;;;;;;GAQG;;AAsLH,4DA0DC;AA7OD,mCAAiD;AAWjD;;GAEG;AACH,SAAS,kBAAkB,CACzB,IAAqB,EACrB,IAAY,EACZ,MAAe,EACf,OAAe,EACf,SAAiB;IAEjB,MAAM,MAAM,GAAG,IAAI,CAAC,MAAM,CAAC,MAAM,CAAC;IAElC,QAAQ,MAAM,EAAE,CAAC;QACf,KAAK,MAAM;YACT,OAAO;gBACL,EAAE,EAAE,IAAI,CAAC,EAAE;gBACX,MAAM,EAAE,MAAM;gBACd,MAAM,EAAE,MAAM,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC,qCAAqC;aACnE,CAAC;QAEJ,KAAK,MAAM;YACT,OAAO;gBACL,EAAE,EAAE,IAAI,CAAC,EAAE;gBACX,MAAM,EAAE,OAAO,IAAI,CAAC;gBACpB,MAAM,EAAE,OAAO,IAAI,CAAC,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC,8CAA8C;aAClF,CAAC;QAEJ,KAAK,WAAW;YACd,MAAM,WAAW,GAAG,OAAO,KAAK,CAAC,IAAI,SAAS,IAAI,CAAC,CAAC;YACpD,OAAO;gBACL,EAAE,EAAE,IAAI,CAAC,EAAE;gBACX,MAAM,EAAE,WAAW;gBACnB,MAAM,EAAE,WAAW,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC,2BAA2B;aAC9D,CAAC;QAEJ,KAAK,MAAM;YACT,MAAM,OAAO,GAAG,eAAe,CAAC,IAAI,CAAC,IAAI,CAAC,IAAI,aAAa,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;YACvE,OAAO;gBACL,EAAE,EAAE,IAAI,CAAC,EAAE;gBACX,MAAM,EAAE,OAAO;gBACf,MAAM,EAAE,OAAO,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC,oCAAoC;aACnE,CAAC;QAEJ;YACE,OAAO,EAAE,EAAE,EAAE,IAAI,CAAC,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,CAAC;IACzC,CAAC;AACH,CAAC;AAED;;GAEG;AACH,SAAS,kBAAkB,CACzB,IAAqB,EACrB,KAAa,EACb,OAAe;IAEf,MAAM,EAAE,QAAQ,EAAE,QAAQ,EAAE,UAAU,EAAE,UAAU,EAAE,GAAG,IAAI,CAAC,MAAM,CAAC;IACnE,MAAM,QAAQ,GAAa,EAAE,CAAC;IAE9B,IAAI,QAAQ,KAAK,SAAS,IAAI,KAAK,GAAG,QAAQ,EAAE,CAAC;QAC/C,QAAQ,CAAC,IAAI,CAAC,qBAAqB,QAAQ,eAAe,KAAK,EAAE,CAAC,CAAC;IACrE,CAAC;IACD,IAAI,QAAQ,KAAK,SAAS,IAAI,KAAK,GAAG,QAAQ,EAAE,CAAC;QAC/C,QAAQ,CAAC,IAAI,CAAC,oBAAoB,QAAQ,eAAe,KAAK,EAAE,CAAC,CAAC;IACpE,CAAC;IACD,IAAI,UAAU,KAAK,SAAS,IAAI,OAAO,GAAG,UAAU,EAAE,CAAC;QACrD,QAAQ,CAAC,IAAI,CAAC,qBAAqB,UAAU,oBAAoB,OAAO,EAAE,CAAC,CAAC;IAC9E,CAAC;IACD,IAAI,UAAU,KAAK,SAAS,IAAI,OAAO,GAAG,UAAU,EAAE,CAAC;QACrD,QAAQ,CAAC,IAAI,CAAC,oBAAoB,UAAU,oBAAoB,OAAO,EAAE,CAAC,CAAC;IAC7E,CAAC;IAED,OAAO;QACL,EAAE,EAAE,IAAI,CAAC,EAAE;QACX,MAAM,EAAE,QAAQ,CAAC,MAAM,KAAK,CAAC;QAC7B,MAAM,EAAE,QAAQ,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,QAAQ,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,SAAS;KACtD,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,mBAAmB,CAC1B,IAAqB,EACrB,IAAY;IAEZ,MAAM,KAAK,GAAG,IAAI,CAAC,MAAM,CAAC,KAAK,IAAI,EAAE,CAAC;IACtC,MAAM,KAAK,GAAG,IAAI,CAAC,WAAW,EAAE,CAAC;IACjC,MAAM,OAAO,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC;IAEpE,OAAO;QACL,EAAE,EAAE,IAAI,CAAC,EAAE;QACX,MAAM,EAAE,OAAO,CAAC,MAAM,KAAK,CAAC;QAC5B,MAAM,EAAE,OAAO,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,2BAA2B,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC,CAAC,SAAS;KACzF,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,mBAAmB,CAC1B,IAAqB,EACrB,IAAY;IAEZ,MAAM,KAAK,GAAG,IAAI,CAAC,MAAM,CAAC,KAAK,IAAI,EAAE,CAAC;IACtC,MAAM,KAAK,GAAG,IAAI,CAAC,WAAW,EAAE,CAAC;IACjC,MAAM,KAAK,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC;IAEjE,OAAO;QACL,EAAE,EAAE,IAAI,CAAC,EAAE;QACX,MAAM,EAAE,KAAK,CAAC,MAAM,KAAK,CAAC;QAC1B,MAAM,EAAE,KAAK,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,0BAA0B,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC,CAAC,SAAS;KACpF,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,kBAAkB,CACzB,IAAqB,EACrB,cAAuB;IAEvB,IAAI,CAAC,cAAc,IAAI,OAAO,cAAc,KAAK,QAAQ,IAAI,KAAK,CAAC,OAAO,CAAC,cAAc,CAAC,EAAE,CAAC;QAC3F,OAAO;YACL,EAAE,EAAE,IAAI,CAAC,EAAE;YACX,MAAM,EAAE,KAAK;YACb,MAAM,EAAE,4CAA4C;SACrD,CAAC;IACJ,CAAC;IAED,MAAM,YAAY,GAAG,IAAI,CAAC,MAAM,CAAC,YAAY,IAAI,EAAE,CAAC;IACpD,MAAM,GAAG,GAAG,cAAyC,CAAC;IACtD,MAAM,OAAO,GAAG,YAAY,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC;IAEtD,OAAO;QACL,EAAE,EAAE,IAAI,CAAC,EAAE;QACX,MAAM,EAAE,OAAO,CAAC,MAAM,KAAK,CAAC;QAC5B,MAAM,EAAE,OAAO,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,0BAA0B,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC,CAAC,SAAS;KACxF,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,oBAAoB,CAC3B,IAAqB,EACrB,IAAY;IAEZ,MAAM,QAAQ,GAAG,IAAI,CAAC,MAAM,CAAC,QAAQ,IAAI,EAAE,CAAC;IAC5C,MAAM,KAAK,GAAG,IAAI,CAAC,WAAW,EAAE,CAAC;IACjC,MAAM,OAAO,GAAG,QAAQ,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC;IAEvE,OAAO;QACL,EAAE,EAAE,IAAI,CAAC,EAAE;QACX,MAAM,EAAE,OAAO,CAAC,MAAM,KAAK,CAAC;QAC5B,MAAM,EAAE,OAAO,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,wBAAwB,OAAO,CAAC,IAAI,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC,CAAC,SAAS;KACtF,CAAC;AACJ,CAAC;AAED;;;;;;;;GAQG;AACH,SAAgB,wBAAwB,CACtC,IAAY,EACZ,cAAmC,EACnC,KAAwB,EACxB,MAAe;IAEf,IAAI,CAAC,KAAK,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QACjC,OAAO;YACL,WAAW,EAAE,EAAE;YACf,eAAe,EAAE,CAAC;YAClB,mBAAmB,EAAE,IAAI;SAC1B,CAAC;IACJ,CAAC;IAED,MAAM,KAAK,GAAG,IAAA,gBAAQ,EAAC,IAAI,CAAC,CAAC,MAAM,CAAC;IACpC,MAAM,OAAO,GAAG,IAAA,oBAAY,EAAC,IAAI,CAAC,CAAC;IACnC,MAAM,SAAS,GAAG,IAAI,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,MAAM,CAAC;IAE/E,MAAM,WAAW,GAAiB,EAAE,CAAC;IAErC,KAAK,MAAM,IAAI,IAAI,KAAK,EAAE,CAAC;QACzB,IAAI,MAAkB,CAAC;QAEvB,QAAQ,IAAI,CAAC,IAAI,EAAE,CAAC;YAClB,KAAK,QAAQ;gBACX,MAAM,GAAG,kBAAkB,CAAC,IAAI,EAAE,IAAI,EAAE,MAAM,EAAE,OAAO,EAAE,SAAS,CAAC,CAAC;gBACpE,MAAM;YACR,KAAK,QAAQ;gBACX,MAAM,GAAG,kBAAkB,CAAC,IAAI,EAAE,KAAK,EAAE,OAAO,CAAC,CAAC;gBAClD,MAAM;YACR,KAAK,SAAS;gBACZ,MAAM,GAAG,mBAAmB,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC;gBACzC,MAAM;YACR,KAAK,SAAS;gBACZ,MAAM,GAAG,mBAAmB,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC;gBACzC,MAAM;YACR,KAAK,QAAQ;gBACX,MAAM,GAAG,kBAAkB,CAAC,IAAI,EAAE,cAAc,CAAC,CAAC;gBAClD,MAAM;YACR,KAAK,UAAU;gBACb,MAAM,GAAG,oBAAoB,CAAC,IAAI,EAAE,IAAI,CAAC,CAAC;gBAC1C,MAAM;YACR;gBACE,MAAM,GAAG,EAAE,EAAE,EAAE,IAAI,CAAC,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,CAAC;QAC3C,CAAC;QAED,WAAW,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;IAC3B,CAAC;IAED,MAAM,WAAW,GAAG,WAAW,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,MAAM,CAAC;IAC7D,MAAM,eAAe,GAAG,KAAK,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,WAAW,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC;IAC1E,MAAM,mBAAmB,GAAG,eAAe,IAAI,GAAG,CAAC;IAEnD,OAAO;QACL,WAAW;QACX,eAAe;QACf,mBAAmB;KACpB,CAAC;AACJ,CAAC","sourcesContent":["/**\n * Instruction-Following Evaluation Module\n * \n * Evaluates whether LLM output follows specified instruction rules.\n * \n * @module engines/classification/instruction-eval\n * @author Haiec\n * @license MIT\n */\n\nimport { InstructionRule, RuleResult } from './types';\nimport { tokenize, countBullets } from './utils';\n\n/**\n * Result of instruction evaluation.\n */\nexport interface InstructionEvalResult {\n  ruleResults: RuleResult[];\n  complianceRatio: number;\n  instructionFollowed: boolean;\n}\n\n/**\n * Evaluates a format rule.\n */\nfunction evaluateFormatRule(\n  rule: InstructionRule,\n  text: string,\n  isJson: boolean,\n  bullets: number,\n  sentences: number\n): RuleResult {\n  const expect = rule.params.expect;\n  \n  switch (expect) {\n    case 'json':\n      return {\n        id: rule.id,\n        passed: isJson,\n        reason: isJson ? undefined : 'Expected JSON output but none found'\n      };\n    \n    case 'list':\n      return {\n        id: rule.id,\n        passed: bullets >= 1,\n        reason: bullets >= 1 ? undefined : 'Expected list format but no list items found'\n      };\n    \n    case 'paragraph':\n      const isParagraph = bullets === 0 && sentences >= 2;\n      return {\n        id: rule.id,\n        passed: isParagraph,\n        reason: isParagraph ? undefined : 'Expected paragraph format'\n      };\n    \n    case 'code':\n      const hasCode = /```[\\s\\S]*```/.test(text) || /^\\s{4,}|\\t/m.test(text);\n      return {\n        id: rule.id,\n        passed: hasCode,\n        reason: hasCode ? undefined : 'Expected code block but none found'\n      };\n    \n    default:\n      return { id: rule.id, passed: true };\n  }\n}\n\n/**\n * Evaluates a length rule.\n */\nfunction evaluateLengthRule(\n  rule: InstructionRule,\n  words: number,\n  bullets: number\n): RuleResult {\n  const { minWords, maxWords, minBullets, maxBullets } = rule.params;\n  const failures: string[] = [];\n  \n  if (minWords !== undefined && words < minWords) {\n    failures.push(`Expected at least ${minWords} words, got ${words}`);\n  }\n  if (maxWords !== undefined && words > maxWords) {\n    failures.push(`Expected at most ${maxWords} words, got ${words}`);\n  }\n  if (minBullets !== undefined && bullets < minBullets) {\n    failures.push(`Expected at least ${minBullets} list items, got ${bullets}`);\n  }\n  if (maxBullets !== undefined && bullets > maxBullets) {\n    failures.push(`Expected at most ${maxBullets} list items, got ${bullets}`);\n  }\n  \n  return {\n    id: rule.id,\n    passed: failures.length === 0,\n    reason: failures.length > 0 ? failures[0] : undefined\n  };\n}\n\n/**\n * Evaluates an include rule.\n */\nfunction evaluateIncludeRule(\n  rule: InstructionRule,\n  text: string\n): RuleResult {\n  const terms = rule.params.terms || [];\n  const lower = text.toLowerCase();\n  const missing = terms.filter(t => !lower.includes(t.toLowerCase()));\n  \n  return {\n    id: rule.id,\n    passed: missing.length === 0,\n    reason: missing.length > 0 ? `Missing required terms: ${missing.join(', ')}` : undefined\n  };\n}\n\n/**\n * Evaluates an exclude rule.\n */\nfunction evaluateExcludeRule(\n  rule: InstructionRule,\n  text: string\n): RuleResult {\n  const terms = rule.params.terms || [];\n  const lower = text.toLowerCase();\n  const found = terms.filter(t => lower.includes(t.toLowerCase()));\n  \n  return {\n    id: rule.id,\n    passed: found.length === 0,\n    reason: found.length > 0 ? `Found forbidden terms: ${found.join(', ')}` : undefined\n  };\n}\n\n/**\n * Evaluates a schema rule.\n */\nfunction evaluateSchemaRule(\n  rule: InstructionRule,\n  normalizedJson: unknown\n): RuleResult {\n  if (!normalizedJson || typeof normalizedJson !== 'object' || Array.isArray(normalizedJson)) {\n    return {\n      id: rule.id,\n      passed: false,\n      reason: 'Expected JSON object for schema validation'\n    };\n  }\n  \n  const requiredKeys = rule.params.requiredKeys || [];\n  const obj = normalizedJson as Record<string, unknown>;\n  const missing = requiredKeys.filter(k => !(k in obj));\n  \n  return {\n    id: rule.id,\n    passed: missing.length === 0,\n    reason: missing.length > 0 ? `Missing required keys: ${missing.join(', ')}` : undefined\n  };\n}\n\n/**\n * Evaluates a coverage rule.\n */\nfunction evaluateCoverageRule(\n  rule: InstructionRule,\n  text: string\n): RuleResult {\n  const entities = rule.params.entities || [];\n  const lower = text.toLowerCase();\n  const missing = entities.filter(e => !lower.includes(e.toLowerCase()));\n  \n  return {\n    id: rule.id,\n    passed: missing.length === 0,\n    reason: missing.length > 0 ? `Missing coverage of: ${missing.join(', ')}` : undefined\n  };\n}\n\n/**\n * Evaluates all instruction rules against output.\n * \n * @param text - The output text\n * @param normalizedJson - Parsed JSON if available\n * @param rules - Instruction rules to evaluate\n * @param isJson - Whether output is valid JSON\n * @returns Evaluation result with compliance ratio\n */\nexport function evaluateInstructionRules(\n  text: string,\n  normalizedJson: unknown | undefined,\n  rules: InstructionRule[],\n  isJson: boolean\n): InstructionEvalResult {\n  if (!rules || rules.length === 0) {\n    return {\n      ruleResults: [],\n      complianceRatio: 1,\n      instructionFollowed: true\n    };\n  }\n  \n  const words = tokenize(text).length;\n  const bullets = countBullets(text);\n  const sentences = text.split(/[.!?]+/).filter(s => s.trim().length > 0).length;\n  \n  const ruleResults: RuleResult[] = [];\n  \n  for (const rule of rules) {\n    let result: RuleResult;\n    \n    switch (rule.type) {\n      case 'format':\n        result = evaluateFormatRule(rule, text, isJson, bullets, sentences);\n        break;\n      case 'length':\n        result = evaluateLengthRule(rule, words, bullets);\n        break;\n      case 'include':\n        result = evaluateIncludeRule(rule, text);\n        break;\n      case 'exclude':\n        result = evaluateExcludeRule(rule, text);\n        break;\n      case 'schema':\n        result = evaluateSchemaRule(rule, normalizedJson);\n        break;\n      case 'coverage':\n        result = evaluateCoverageRule(rule, text);\n        break;\n      default:\n        result = { id: rule.id, passed: true };\n    }\n    \n    ruleResults.push(result);\n  }\n  \n  const passedCount = ruleResults.filter(r => r.passed).length;\n  const complianceRatio = rules.length > 0 ? passedCount / rules.length : 1;\n  const instructionFollowed = complianceRatio >= 0.8;\n  \n  return {\n    ruleResults,\n    complianceRatio,\n    instructionFollowed\n  };\n}\n"]}