ktg-plugin-marketplace/plugins/llm-security/tests/scanners/unicode.test.mjs

108 lines
4.2 KiB
JavaScript

// unicode.test.mjs — Integration tests for the unicode-scanner
// Tests against the evil-project-health fixture which contains:
// - Zero-width characters in SKILL.fixture.md
// - Unicode Tag block codepoints (steganographic hidden message) in SKILL.fixture.md
// - BIDI override characters in SKILL.fixture.md
import { describe, it, beforeEach } from 'node:test';
import assert from 'node:assert/strict';
import { resolve } from 'node:path';
import { fileURLToPath } from 'node:url';
import { resetCounter } from '../../scanners/lib/output.mjs';
import { discoverFiles } from '../../scanners/lib/file-discovery.mjs';
import { scan } from '../../scanners/unicode-scanner.mjs';
const __dirname = fileURLToPath(new URL('.', import.meta.url));
const FIXTURE = resolve(__dirname, '../../examples/malicious-skill-demo/evil-project-health');
describe('unicode-scanner integration', () => {
let discovery;
beforeEach(async () => {
resetCounter();
discovery = await discoverFiles(FIXTURE);
});
it('returns status ok', async () => {
const result = await scan(FIXTURE, discovery);
assert.equal(result.status, 'ok', `Expected status 'ok', got '${result.status}'`);
});
it('scans at least one file', async () => {
const result = await scan(FIXTURE, discovery);
assert.ok(result.files_scanned >= 1, `Expected files_scanned >= 1, got ${result.files_scanned}`);
});
it('detects zero-width characters (CRITICAL or HIGH)', async () => {
const result = await scan(FIXTURE, discovery);
const zeroWidthFindings = result.findings.filter(f =>
(f.severity === 'critical' || f.severity === 'high') &&
(
f.title.toLowerCase().includes('zero-width') ||
f.title.toLowerCase().includes('zero width') ||
(f.evidence && f.evidence.toLowerCase().includes('u+200'))
)
);
assert.ok(
zeroWidthFindings.length >= 1,
`Expected at least 1 zero-width finding, got ${zeroWidthFindings.length}. ` +
`All findings: ${result.findings.map(f => f.title).join('; ')}`
);
});
it('detects Unicode Tag block codepoints (CRITICAL) — steganographic hidden message', async () => {
const result = await scan(FIXTURE, discovery);
const tagFindings = result.findings.filter(f =>
f.severity === 'critical' &&
f.title.toLowerCase().includes('unicode tag')
);
assert.ok(
tagFindings.length >= 1,
`Expected at least 1 Unicode Tag finding (CRITICAL), got ${tagFindings.length}. ` +
`All findings: ${result.findings.map(f => f.title).join('; ')}`
);
});
it('reports at least 3 total findings across all categories', async () => {
const result = await scan(FIXTURE, discovery);
assert.ok(
result.findings.length >= 3,
`Expected >= 3 total unicode findings, got ${result.findings.length}`
);
});
it('assigns correct scanner prefix UNI to all findings', async () => {
const result = await scan(FIXTURE, discovery);
const wrongPrefix = result.findings.filter(f => !f.id.startsWith('DS-UNI-'));
assert.equal(
wrongPrefix.length, 0,
`All findings should have DS-UNI- prefix. Wrong: ${wrongPrefix.map(f => f.id).join(', ')}`
);
});
it('finding IDs are sequential starting from DS-UNI-001', async () => {
const result = await scan(FIXTURE, discovery);
if (result.findings.length === 0) return;
assert.equal(result.findings[0].id, 'DS-UNI-001');
});
it('all findings have required fields', async () => {
const result = await scan(FIXTURE, discovery);
for (const f of result.findings) {
assert.ok(f.id, `Finding missing id`);
assert.ok(f.scanner, `Finding ${f.id} missing scanner`);
assert.ok(f.severity, `Finding ${f.id} missing severity`);
assert.ok(f.title, `Finding ${f.id} missing title`);
assert.ok(f.owasp, `Finding ${f.id} missing owasp`);
}
});
it('counts object reflects actual findings array', async () => {
const result = await scan(FIXTURE, discovery);
const countTotal = Object.values(result.counts).reduce((s, n) => s + n, 0);
assert.equal(
countTotal, result.findings.length,
`counts total (${countTotal}) should equal findings.length (${result.findings.length})`
);
});
});