Step 11 of v3.4.1 plan.

Adds the lifecycle subsection to Handover 7, documenting:
- Producer/consumer division of labour ("arbeidsdeling"): executor + helper write; ultracontinue reads; pre-compact-flush refreshes only
- Stale-file principle: status==='completed' state files SHOULD be removed via /ultracontinue-local --cleanup --confirm (operator-invoked, no auto-cleanup, no force flag)
- Frontmatter contract for NEXT-SESSION-PROMPT.local.md: producers MUST write produced_by + produced_at (ISO-8601); files without frontmatter are tolerated (warning, not error) for backwards compatibility
- Idempotency: --cleanup --confirm is safe to re-run; partial state is reported but never auto-recovered

Adds 3 doc-consistency pins:
- next-session-prompt-validator CLI shim
- Handover 7 § Lifecycle subsection present
- Handover 7 § Lifecycle names --cleanup + produced_by contract

358 -> 361 tests, all green.

Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
268 lines
10 KiB
JavaScript
268 lines
10 KiB
JavaScript
// tests/lib/doc-consistency.test.mjs
|
|
// Pin invariants between prose (CLAUDE.md, README.md) and source files
|
|
// (agents/*.md, commands/*.md, templates/, settings.json).
|
|
//
|
|
// When this test fails, fix the source-of-truth — do NOT rewrite the test to
|
|
// hide drift. Borrowed pattern from llm-security commit 97c5c9d.
|
|
|
|
import { test } from 'node:test';
|
|
import { strict as assert } from 'node:assert';
|
|
import { readFileSync, readdirSync } from 'node:fs';
|
|
import { join, dirname } from 'node:path';
|
|
import { fileURLToPath } from 'node:url';
|
|
import { parseDocument } from '../../lib/util/frontmatter.mjs';
|
|
|
|
// Absolute filesystem path of this module, derived from its file:// URL.
const thisFilePath = fileURLToPath(import.meta.url);
// Directory that contains this test file.
const HERE = dirname(thisFilePath);
// Two directory levels above HERE; every path handed to read()/listMd() is
// resolved against it.
const ROOT = join(HERE, '..', '..');
|
|
|
|
/**
 * Read a file as UTF-8 text.
 *
 * @param {string} rel - Path relative to ROOT.
 * @returns {string} The decoded file contents.
 */
function read(rel) {
  const absolutePath = join(ROOT, rel);
  return readFileSync(absolutePath, 'utf-8');
}
|
|
/**
 * List the entries of a directory whose names end in ".md".
 *
 * @param {string} rel - Directory path relative to ROOT.
 * @returns {string[]} Bare entry names (no directory prefix), in the order
 *   readdirSync returned them.
 */
function listMd(rel) {
  const entries = readdirSync(join(ROOT, rel));
  return entries.filter((entryName) => entryName.endsWith('.md'));
}
|
|
|
|
// Pins the number of data rows in the CLAUDE.md "## Agents" table to the
// number of *.md files in agents/. Header and delimiter rows are not counted.
test('CLAUDE.md agents table row count == agents/*.md file count', () => {
  const md = read('CLAUDE.md');
  const agentFiles = listMd('agents');
  // Text after the first "## Agents" marker, cut off at the next H2 heading.
  const agentTable = md.split('## Agents')[1] || '';
  const tableSection = agentTable.split('\n## ')[0];
  // GFM delimiter rows may carry alignment colons (|:---|, |---:|, |:-:|).
  // Without ":" in the class such a row would be miscounted as an agent row.
  const isDelimiterRow = (l) => /^\|[\s:-]+\|/.test(l);
  const isHeaderRow = (l) => /^\|\s*Agent\s*\|/.test(l);
  const dataRows = tableSection
    .split('\n')
    .filter(l => l.startsWith('|') && !isDelimiterRow(l) && !isHeaderRow(l));
  assert.equal(
    dataRows.length,
    agentFiles.length,
    `Drift: ${agentFiles.length} agent files vs ${dataRows.length} CLAUDE.md table rows. ` +
      `Sync agents/ ↔ CLAUDE.md.`,
  );
});
|
|
|
|
// Every commands/<name>.md file must be referenced as "/<name>" in CLAUDE.md.
// This is a plain substring check over the whole document, not only the table.
test('CLAUDE.md commands table mentions every commands/*.md file', () => {
  const claudeDoc = read('CLAUDE.md');
  listMd('commands').forEach((fileName) => {
    const slashCommand = `/${fileName.replace(/\.md$/, '')}`;
    const isMentioned = claudeDoc.includes(slashCommand);
    assert.ok(
      isMentioned,
      `commands/${fileName} not mentioned in CLAUDE.md (looked for ${slashCommand})`,
    );
  });
});
|
|
|
|
// When a command file declares frontmatter.name, it must equal the filename
// without ".md". Files that parseDocument reports as not valid, or that carry
// no name field, are skipped rather than failed.
test('every command frontmatter name matches its filename', () => {
  for (const fileName of listMd('commands')) {
    const doc = parseDocument(read(`commands/${fileName}`));
    if (!doc.valid) continue;

    const frontmatter = doc.parsed.frontmatter;
    if (!frontmatter || frontmatter.name === undefined) continue;

    const expected = fileName.replace(/\.md$/, '');
    assert.equal(
      frontmatter.name,
      expected,
      `commands/${fileName} frontmatter.name="${frontmatter.name}" should be "${expected}"`,
    );
  }
});
|
|
|
|
// The plan template must declare plan_version 1.7, optionally quoted.
test('templates/plan-template.md declares plan_version: 1.7', () => {
  const planVersionPattern = /plan_version:\s*['"]?1\.7['"]?/;
  const template = read('templates/plan-template.md');
  assert.match(template, planVersionPattern);
});
|
|
|
|
// The template must declare some plan_version, and the execute command must
// contain at least one plan-schema marker. The extracted version value is
// only checked for presence; it is not compared against the command text.
test('commands/ultraexecute-local.md still parses v1.7 plan schema', () => {
  const executeCmd = read('commands/ultraexecute-local.md');
  const template = read('templates/plan-template.md');

  const declaredVersion = template.match(/plan_version:\s*['"]?([\d.]+)['"]?/)?.[1];
  assert.ok(declaredVersion, 'templates/plan-template.md missing plan_version');

  const schemaMarkers = ['plan_version', 'Step N:', '### Step '];
  const referencesSchema = schemaMarkers.some((marker) => executeCmd.includes(marker));
  assert.ok(
    referencesSchema,
    'commands/ultraexecute-local.md should reference v1.7 plan-schema parsing',
  );
});
|
|
|
|
// settings.json may only contain the top-level keys listed in allowedScopes.
test('settings.json has only known top-level scopes after Spor 0 cleanup', () => {
  const settings = JSON.parse(read('settings.json'));
  const allowedScopes = ['ultraplan', 'ultraresearch'];
  Object.keys(settings).forEach((scope) => {
    const isKnown = allowedScopes.includes(scope);
    assert.ok(isKnown, `Unknown top-level scope in settings.json: ${scope}`);
  });
});
|
|
|
|
// The ultraplan.exploration and ultraplan.agentTeam keys must be absent
// (undefined) from settings.json; a missing ultraplan scope also passes.
test('settings.json no longer carries vestigial exploration block', () => {
  const settings = JSON.parse(read('settings.json'));
  const removedBlocks = [
    ['exploration', 'exploration block was vestigial — should be deleted in v3.1.0 Spor 0'],
    ['agentTeam', 'agentTeam block was vestigial — should be deleted in v3.1.0 Spor 0'],
  ];
  for (const [key, message] of removedBlocks) {
    assert.equal(settings.ultraplan?.[key], undefined, message);
  }
});
|
|
|
|
// CLAUDE.md must contain each of the five pipeline command names verbatim.
test('CLAUDE.md mentions all five pipeline commands', () => {
  const pipelineCommands = [
    '/ultrabrief-local',
    '/ultraresearch-local',
    '/ultraplan-local',
    '/ultraexecute-local',
    '/ultrareview-local',
  ];
  const claudeDoc = read('CLAUDE.md');
  pipelineCommands.forEach((command) => {
    assert.ok(claudeDoc.includes(command), `CLAUDE.md missing reference to ${command}`);
  });
});
|
|
|
|
// The handover contracts document must contain a "## Handover 6" heading.
test('HANDOVER-CONTRACTS.md contains Handover 6 section', () => {
  const contracts = read('docs/HANDOVER-CONTRACTS.md');
  const hasHandover6 = contracts.includes('## Handover 6');
  assert.ok(
    hasHandover6,
    'docs/HANDOVER-CONTRACTS.md should document Handover 6 (review → plan)',
  );
});
|
|
|
|
// The handover contracts document must contain a "## Handover 7" heading and
// the artifact filename. Both are substring checks over the whole document;
// the filename is not required to sit inside the Handover 7 section.
test('HANDOVER-CONTRACTS.md contains Handover 7 section (session-state)', () => {
  const contracts = read('docs/HANDOVER-CONTRACTS.md');

  const hasHeading = contracts.includes('## Handover 7');
  assert.ok(
    hasHeading,
    'docs/HANDOVER-CONTRACTS.md should document Handover 7 (.session-state.local.json) ' +
      'consumed by /ultracontinue',
  );

  const namesArtifact = contracts.includes('.session-state.local.json');
  assert.ok(namesArtifact, 'Handover 7 section should name the artifact path');
});
|
|
|
|
// The validator source must contain the "import.meta.url === " comparison
// that marks the CLI entry-point guard.
test('review-validator has CLI shim', () => {
  const shimMarker = 'import.meta.url === ';
  const source = read('lib/validators/review-validator.mjs');
  const hasShim = source.includes(shimMarker);
  assert.ok(
    hasShim,
    'lib/validators/review-validator.mjs should expose the standard CLI shim ' +
      '(if (import.meta.url === `file://${process.argv[1]}`)) so commands can call it from Bash',
  );
});
|
|
|
|
// The validator source must contain the "import.meta.url === " comparison
// that marks the CLI entry-point guard.
test('session-state-validator has CLI shim', () => {
  const shimMarker = 'import.meta.url === ';
  const source = read('lib/validators/session-state-validator.mjs');
  const hasShim = source.includes(shimMarker);
  assert.ok(
    hasShim,
    'lib/validators/session-state-validator.mjs should expose the standard CLI shim ' +
      '(if (import.meta.url === `file://${process.argv[1]}`)) so /ultracontinue can call it from Bash',
  );
});
|
|
|
|
// The validator source must contain the "import.meta.url === " comparison
// that marks the CLI entry-point guard.
test('next-session-prompt-validator has CLI shim', () => {
  const shimMarker = 'import.meta.url === ';
  const source = read('lib/validators/next-session-prompt-validator.mjs');
  const hasShim = source.includes(shimMarker);
  assert.ok(
    hasShim,
    'lib/validators/next-session-prompt-validator.mjs should expose the standard CLI shim ' +
      '(if (import.meta.url === `file://${process.argv[1]}`)) so /ultracontinue Phase 1.5 can call it from Bash',
  );
});
|
|
|
|
// The Handover 7 section, bounded by the "## Handover 7" and
// "## Stability summary" headings, must contain the word "Lifecycle".
test('HANDOVER-CONTRACTS.md Handover 7 documents § Lifecycle subsection', () => {
  const contracts = read('docs/HANDOVER-CONTRACTS.md');

  const sectionStart = contracts.indexOf('## Handover 7');
  assert.ok(sectionStart >= 0, 'Handover 7 heading missing');

  // Search for the closing heading only from the section start onwards.
  const sectionEnd = contracts.indexOf('## Stability summary', sectionStart);
  assert.ok(sectionEnd > sectionStart, 'Stability summary heading missing — could not bound Handover 7');

  const handover7 = contracts.slice(sectionStart, sectionEnd);
  const hasLifecycle = handover7.includes('Lifecycle');
  assert.ok(
    hasLifecycle,
    'Handover 7 section should include a § Lifecycle subsection (SC-5 stale-file principle)',
  );
});
|
|
|
|
// The Handover 7 section, bounded by the "## Handover 7" and
// "## Stability summary" headings, must mention both "--cleanup" and
// "produced_by".
test('HANDOVER-CONTRACTS.md Handover 7 § Lifecycle names --cleanup and produced_by contract', () => {
  const text = read('docs/HANDOVER-CONTRACTS.md');
  const h7Start = text.indexOf('## Handover 7');
  // Fail loudly when a bounding heading is missing: a -1 index would make
  // slice() return a span unrelated to Handover 7, so the needle checks
  // below could pass or fail for the wrong reason.
  assert.ok(h7Start >= 0, 'Handover 7 heading missing');
  const h7End = text.indexOf('## Stability summary', h7Start);
  assert.ok(h7End > h7Start, 'Stability summary heading missing — could not bound Handover 7');
  const h7 = text.slice(h7Start, h7End);
  assert.ok(
    h7.includes('--cleanup'),
    'Handover 7 § Lifecycle should mention --cleanup as the operator-invoked stale-file remover',
  );
  assert.ok(
    h7.includes('produced_by'),
    'Handover 7 § Lifecycle should document the produced_by frontmatter contract for NEXT-SESSION-PROMPT.local.md',
  );
});
|
|
|
|
// CLAUDE.md must reference the ultracontinue-local command.
test('CLAUDE.md mentions /ultracontinue-local command', () => {
  const claudeDoc = read('CLAUDE.md');
  // The slash-less form is a substring of the slashed form, so the second
  // check alone decides the outcome.
  const hasSlashForm = claudeDoc.includes('/ultracontinue-local');
  const hasBareForm = claudeDoc.includes('ultracontinue-local');
  assert.ok(
    hasSlashForm || hasBareForm,
    'CLAUDE.md should document /ultracontinue-local in the Commands table ' +
      '(added in v3.3.0 alongside the new command file)',
  );
});
|
|
|
|
// RULE_CATALOGUE exported by the rule-catalogue module must have length 12.
test('rule-catalogue has exactly 12 entries', async () => {
  const expectedSize = 12;
  const { RULE_CATALOGUE } = await import('../../lib/review/rule-catalogue.mjs');
  assert.strictEqual(
    RULE_CATALOGUE.length,
    expectedSize,
    'lib/review/rule-catalogue.mjs RULE_CATALOGUE size invariant: must be 12 (v1.0 baseline)',
  );
});
|
|
|
|
// The headless launch template must contain every marker string listed in
// requiredNeedles; the first missing marker fails the test.
test('headless-launch-template.md mirrors Phase 2.6 hardenings', () => {
  const requiredNeedles = [
    'GIT_OPTIONAL_LOCKS',
    '--max-turns',
    '--max-budget-usd',
    '--append-system-prompt-file',
    'SHARED_CONTEXT_FILE',
    'SAFETY_PREAMBLE',
    'git push origin',
    'GH #36071',
    'push-before-cleanup',
  ];
  const template = read('templates/headless-launch-template.md');
  requiredNeedles.forEach((needle) => {
    const isPresent = template.includes(needle);
    assert.ok(
      isPresent,
      `templates/headless-launch-template.md should include "${needle}" (Step 10 mirrors Phase 2.6)`,
    );
  });
});
|
|
|
|
// Both the ultraplan command and the planning-orchestrator agent must carry
// the single-message dispatch wording and reference the dedup helper script.
// These are substring checks over each whole file, evaluated in listed order.
test('Phase 9 prose mandates parallel single-message dispatch + inline dedup', () => {
  const commandDoc = read('commands/ultraplan-local.md');
  const orchestratorDoc = read('agents/planning-orchestrator.md');

  const expectations = [
    // Single-message reinforcement appears in both (command + orchestrator)
    [
      commandDoc,
      'single assistant message turn',
      'commands/ultraplan-local.md Phase 9 should reinforce single-message parallel dispatch',
    ],
    [
      orchestratorDoc,
      'single assistant message turn',
      'agents/planning-orchestrator.md Phase 6 should mirror the single-message parallel-dispatch contract',
    ],
    // Dedup CLI shim is wired in both
    [
      commandDoc,
      'plan-review-dedup.mjs',
      'commands/ultraplan-local.md Phase 9 should call lib/review/plan-review-dedup.mjs after both reviewers complete',
    ],
    [
      orchestratorDoc,
      'plan-review-dedup.mjs',
      'agents/planning-orchestrator.md Phase 6 should reference the dedup helper',
    ],
  ];

  for (const [haystack, needle, message] of expectations) {
    assert.ok(haystack.includes(needle), message);
  }
});
|
|
|
|
// The Phase 8 section of the ultraplan command, bounded by the "## Phase 8"
// and "## Phase 9" headings, must name both heading regexes and the strict
// validator invocation.
test('commands/ultraplan-local.md Phase 8 seals Opus-4.7 schema-drift defense', () => {
  const commandDoc = read('commands/ultraplan-local.md');

  // Carve out the Phase 8 section.
  const sectionStart = commandDoc.indexOf('## Phase 8');
  assert.ok(sectionStart >= 0, 'Phase 8 heading missing');
  const sectionEnd = commandDoc.indexOf('## Phase 9', sectionStart);
  assert.ok(sectionEnd > sectionStart, 'Phase 9 heading missing — could not bound Phase 8');
  const phase8Text = commandDoc.slice(sectionStart, sectionEnd);

  // Regex source-of-truth references, then the validator self-check.
  const requiredLiterals = [
    [
      'STEP_HEADING_REGEX',
      'Phase 8 should inline STEP_HEADING_REGEX so format contract survives without orchestrator-doc loading',
    ],
    [
      'FORBIDDEN_HEADING_REGEX',
      'Phase 8 should inline FORBIDDEN_HEADING_REGEX (Step 7 — schema-drift seal)',
    ],
    [
      'plan-validator.mjs --strict',
      'Phase 8 should mandate post-write `plan-validator.mjs --strict` self-check',
    ],
  ];
  for (const [literal, message] of requiredLiterals) {
    assert.ok(phase8Text.includes(literal), message);
  }

  // Forbidden-headings list.
  // NOTE(review): this only requires one "FORBIDDEN" occurrence, which the
  // FORBIDDEN_HEADING_REGEX check above already guarantees — confirm whether
  // a second occurrence (the human-readable list) was meant to be required.
  const mentionsForbidden = /FORBIDDEN/.test(phase8Text);
  assert.ok(mentionsForbidden, 'Phase 8 should explicitly enumerate FORBIDDEN headings');
});
|