feat(humanizer): scenario read-test corpus + runner (SC-4) [skip-docs]

Step 9 of v5.1.0 humanizer Wave 4. Adds tests/scenario-read-test.mjs runner, tests/scenario-read-test.test.mjs wrapper, and 5 scenario fixtures in tests/scenarios/ that feed deterministic raw findings through humanizeFinding and assert the humanized title/description/recommendation match brief-owner-approved regex patterns encoding the ground-truth what/why/whatNext answers.

Corpus selection (per brief criteria):
- 01-tok-cascade.json - TOK/CPS category (token efficiency)
- 02-cps-volatile.json - TOK/CPS category (cache prefix stability)
- 03-cnf-conflict.json - CNF category (conflicts)
- 04-gap-no-claude-md.json - GAP category (feature gap)
- 05-set-invalid-json.json - SET category, AND its v5.0.0 title + description carry tier1 'invalid' (the brief criterion 'one finding whose v5.0.0 description uses a forbidden word').

Runner mechanics:
- Loads scenarios matching ^\d{2}-[a-z0-9-]+\.json$ in sorted order.
- Calls humanizeFinding(scannerInput) and matches each humanized field against its declared pattern (case-insensitive regex).
- Verifies humanizer-added structural fields (userImpactCategory, userActionLanguage, relevanceContext) are non-empty strings.
- Per session decision (1a), acceptance is deterministic regex matching without a runtime human approval gate.

Wrapper adds 3 tests: scenario-match (binds runner to node --test), category-coverage (TOK/CPS, CNF, GAP, SET all present), and tier1-presence (at least one v5.0.0 title or description contains a tier1 forbidden word).

Tests: 736 to 739 (+3 SC-4 tests). Full suite passes.

Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
2026-05-01 18:16:23 +02:00 · 2026-05-01 18:16:23 +02:00 · 8b146bf489
commit 8b146bf489
parent c5c937e94e
7 changed files with 373 additions and 0 deletions
--- a/plugins/config-audit/tests/scenarios/01-tok-cascade.json
+++ b/plugins/config-audit/tests/scenarios/01-tok-cascade.json
@ -0,0 +1,29 @@
+{
+  "_meta": {
+    "comment": "Scenario 01: TOK CLAUDE.md cascade exceeds 10k tokens. Covers the TOK/CPS (token-efficiency) category. v5.0.0 title, description, and recommendation all contain tier3 'CLAUDE.md' — humanizer rewrites to non-jargon prose."
+  },
+  "findingId": "CA-TOK-001",
+  "scannerInput": {
+    "id": "CA-TOK-001",
+    "scanner": "TOK",
+    "severity": "high",
+    "title": "CLAUDE.md cascade exceeds 10k tokens per turn",
+    "description": "Total CLAUDE.md cascade is 12450 tokens across 4 files.",
+    "file": ".claude/CLAUDE.md",
+    "line": null,
+    "evidence": "tokens=12450; files=4",
+    "recommendation": "Reduce CLAUDE.md cascade size. Move content into modular skill files or trim verbose sections.",
+    "category": null,
+    "autoFixable": false
+  },
+  "expectedHumanized": {
+    "titlePattern": "instruction files take a lot of space on every turn",
+    "descriptionPattern": "10,000 tokens|every turn carries that weight",
+    "recommendationPattern": "Trim or split the largest files"
+  },
+  "groundTruth": {
+    "what": "The instruction files Claude reads on every turn are large enough that they slow each response.",
+    "why": "The combined size has gone above 10,000 tokens. That weight loads on every turn and leaves less room for the conversation itself.",
+    "whatNext": "Trim or split the largest files. The details show which file contributes most."
+  }
+}
--- a/plugins/config-audit/tests/scenarios/02-cps-volatile.json
+++ b/plugins/config-audit/tests/scenarios/02-cps-volatile.json
@ -0,0 +1,29 @@
+{
+  "_meta": {
+    "comment": "Scenario 02: CPS volatile content inside cached prefix. Covers the CPS half of the TOK/CPS category. Tests that the humanizer explains cache-prefix-stability in user-facing language."
+  },
+  "findingId": "CA-CPS-001",
+  "scannerInput": {
+    "id": "CA-CPS-001",
+    "scanner": "CPS",
+    "severity": "medium",
+    "title": "Volatile content inside cached prefix breaks reuse",
+    "description": "Volatile pattern matched at .claude/CLAUDE.md:42 (timestamp). Lines 31-150 form the cache prefix.",
+    "file": ".claude/CLAUDE.md",
+    "line": 42,
+    "evidence": "Pattern: timestamp; window: 31-150",
+    "recommendation": "Move volatile content (timestamps, session state) below line 150 or to a separate file.",
+    "category": null,
+    "autoFixable": false
+  },
+  "expectedHumanized": {
+    "titlePattern": "Content that changes between turns sits in the part Claude tries to reuse",
+    "descriptionPattern": "fresh read every time|slows responses",
+    "recommendationPattern": "Move the changing content|150 lines"
+  },
+  "groundTruth": {
+    "what": "Content that changes between turns is inside the part of the file Claude tries to reuse.",
+    "why": "Claude saves time by reusing the start of your instructions across turns. When that area changes, every turn re-reads the whole start, which slows responses.",
+    "whatNext": "Move the changing content (timestamps, session notes) below the first 150 lines, or out of the file entirely."
+  }
+}
--- a/plugins/config-audit/tests/scenarios/03-cnf-conflict.json
+++ b/plugins/config-audit/tests/scenarios/03-cnf-conflict.json
@ -0,0 +1,29 @@
+{
+  "_meta": {
+    "comment": "Scenario 03: CNF allow/deny conflict. Covers the conflicts category. v5.0.0 title contains tier3 'allow/deny' — humanizer rewrites with non-jargon language."
+  },
+  "findingId": "CA-CNF-001",
+  "scannerInput": {
+    "id": "CA-CNF-001",
+    "scanner": "CNF",
+    "severity": "high",
+    "title": "Permission allow/deny conflict",
+    "description": "Tool 'Bash(git:*)' appears in both allow and deny lists at .claude/settings.json.",
+    "file": ".claude/settings.json",
+    "line": null,
+    "evidence": "tool=Bash(git:*); allow=true; deny=true",
+    "recommendation": "Remove the tool from either the allow or deny list to make the intent unambiguous.",
+    "category": null,
+    "autoFixable": false
+  },
+  "expectedHumanized": {
+    "titlePattern": "let-in and shut-out by your permissions",
+    "descriptionPattern": "deny.*priority over an .*allow|looks like the tool is approved",
+    "recommendationPattern": "Remove either the .*allow.* or the .*deny"
+  },
+  "groundTruth": {
+    "what": "A tool you have configured is both let-in and shut-out by your permission rules.",
+    "why": "A `deny` entry takes priority over an `allow`, so the `allow` does nothing — but the configuration looks like the tool is approved, which can mislead readers of the file.",
+    "whatNext": "Remove either the `allow` or the `deny` entry so the intent is unambiguous."
+  }
+}
--- a/plugins/config-audit/tests/scenarios/04-gap-no-claude-md.json
+++ b/plugins/config-audit/tests/scenarios/04-gap-no-claude-md.json
@ -0,0 +1,29 @@
+{
+  "_meta": {
+    "comment": "Scenario 04: GAP no CLAUDE.md file. Covers the feature-gap category. v5.0.0 title and recommendation contain tier3 'CLAUDE.md' — humanizer wraps the term in backticks."
+  },
+  "findingId": "CA-GAP-001",
+  "scannerInput": {
+    "id": "CA-GAP-001",
+    "scanner": "GAP",
+    "severity": "medium",
+    "title": "No CLAUDE.md file",
+    "description": "No project instructions file detected.",
+    "file": null,
+    "line": null,
+    "evidence": null,
+    "recommendation": "Create a CLAUDE.md file with project-specific guidance.",
+    "category": "t1",
+    "autoFixable": false
+  },
+  "expectedHumanized": {
+    "titlePattern": "haven'?t added project instructions for Claude",
+    "descriptionPattern": "highest-impact thing you can add|tells Claude how you work",
+    "recommendationPattern": "Create .*CLAUDE\\.md.*one-paragraph overview"
+  },
+  "groundTruth": {
+    "what": "Your project doesn't have a top-level instructions file for Claude yet.",
+    "why": "A `CLAUDE.md` at the project root is the single highest-impact addition; it tells Claude how you work in this codebase so every session starts informed.",
+    "whatNext": "Create `CLAUDE.md` with a one-paragraph overview, common commands, and any conventions Claude should know."
+  }
+}
--- a/plugins/config-audit/tests/scenarios/05-set-invalid-json.json
+++ b/plugins/config-audit/tests/scenarios/05-set-invalid-json.json
@ -0,0 +1,29 @@
+{
+  "_meta": {
+    "comment": "Scenario 05: SET invalid JSON in settings file. Covers the settings category AND the brief criterion 'one finding whose v5.0.0 description contains a tier1 forbidden word' — both the v5.0.0 title and description carry tier1 'invalid'. Humanizer rewrites to plain language."
+  },
+  "findingId": "CA-SET-001",
+  "scannerInput": {
+    "id": "CA-SET-001",
+    "scanner": "SET",
+    "severity": "critical",
+    "title": "Invalid JSON in settings file",
+    "description": ".claude/settings.json contains invalid JSON and will be ignored by Claude Code.",
+    "file": ".claude/settings.json",
+    "line": null,
+    "evidence": "Unexpected token } in JSON at position 187",
+    "recommendation": "Fix JSON syntax errors. Use a JSON validator.",
+    "category": null,
+    "autoFixable": false
+  },
+  "expectedHumanized": {
+    "titlePattern": "settings file isn'?t readable as JSON",
+    "descriptionPattern": "Claude Code can'?t parse the file|settings are skipped",
+    "recommendationPattern": "Open the file and fix the JSON syntax"
+  },
+  "groundTruth": {
+    "what": "Your settings file can't be read as JSON, so none of the settings inside take effect.",
+    "why": "Claude Code parses the settings file once at startup. When that parse fails, all settings inside are skipped silently, and you get the defaults.",
+    "whatNext": "Open the file and fix the JSON syntax shown in the details (often a missing comma, an extra trailing comma, or an unterminated quote)."
+  }
+}