mirror of
https://github.com/affaan-m/everything-claude-code.git
synced 2026-03-30 13:43:26 +08:00
fix(harness-audit): make scoring deterministic with scripted rubric (#524)
This commit is contained in:
86
tests/scripts/harness-audit.test.js
Normal file
86
tests/scripts/harness-audit.test.js
Normal file
@@ -0,0 +1,86 @@
|
||||
/**
|
||||
* Tests for scripts/harness-audit.js
|
||||
*/
|
||||
|
||||
const assert = require('assert');
|
||||
const path = require('path');
|
||||
const { execFileSync } = require('child_process');
|
||||
|
||||
// Absolute path to the audit script under test, resolved relative to this file.
const SCRIPT = path.join(__dirname, '..', '..', 'scripts', 'harness-audit.js');
|
||||
|
||||
/**
 * Runs the audit script in a child process and returns what it printed.
 *
 * The child is launched with process.execPath so it uses the same Node.js
 * binary that is executing this test file, rather than whatever `node`
 * happens to resolve to on PATH (which may be absent or a different version).
 *
 * @param {string[]} [args=[]] - CLI arguments appended after the script path.
 * @returns {string} The child's stdout, decoded as UTF-8.
 * @throws {Error} Propagated from execFileSync when the child exits with a
 *   non-zero status or does not finish within the 10 second timeout.
 */
function run(args = []) {
  return execFileSync(process.execPath, [SCRIPT, ...args], {
    // Working directory is two levels above this test file.
    cwd: path.join(__dirname, '..', '..'),
    encoding: 'utf8',
    // Pipe all three streams instead of inheriting the parent's.
    stdio: ['pipe', 'pipe', 'pipe'],
    timeout: 10000,
  });
}
|
||||
|
||||
/**
 * Executes one test case synchronously and prints a pass/fail line for it.
 *
 * @param {string} name - Label printed next to the check mark or cross.
 * @param {Function} fn - Test body; any value it throws counts as a failure.
 * @returns {boolean} true when fn returned normally, false when it threw.
 */
function test(name, fn) {
  try {
    fn();
    console.log(` \u2713 ${name}`);
    return true;
  } catch (error) {
    // A test body can throw null, undefined, or a bare string. Reading
    // `.message` unguarded would either throw from inside this handler
    // (aborting the whole run) or print "undefined", so fall back to the
    // stringified thrown value when no message is available.
    const message = error != null && error.message !== undefined
      ? error.message
      : String(error);
    console.log(` \u2717 ${name}`);
    console.log(` Error: ${message}`);
    return false;
  }
}
|
||||
|
||||
/**
 * Runs every harness-audit test case in order, prints a summary line, and
 * terminates the process.
 *
 * The process exits with status 1 when at least one case failed and with
 * status 0 otherwise.
 */
function runTests() {
  console.log('\n=== Testing harness-audit.js ===\n');

  // Category names the JSON report must expose.
  const expectedCategories = [
    'Tool Coverage',
    'Context Efficiency',
    'Quality Gates',
    'Memory Persistence',
    'Eval Coverage',
    'Security Guardrails',
    'Cost Efficiency',
  ];

  // Each entry is [label, body]; cases run in the order listed.
  const cases = [
    ['json output is deterministic between runs', () => {
      const first = run(['repo', '--format', 'json']);
      const second = run(['repo', '--format', 'json']);

      assert.strictEqual(first, second);
    }],

    ['report includes bounded scores and fixed categories', () => {
      const parsed = JSON.parse(run(['repo', '--format', 'json']));

      assert.strictEqual(parsed.deterministic, true);
      assert.strictEqual(parsed.rubric_version, '2026-03-16');
      assert.ok(parsed.overall_score >= 0);
      assert.ok(parsed.max_score > 0);
      assert.ok(parsed.overall_score <= parsed.max_score);

      const categoryNames = Object.keys(parsed.categories);
      for (const category of expectedCategories) {
        // Name the category so a failure says which one is absent.
        assert.ok(categoryNames.includes(category), `missing category: ${category}`);
      }
    }],

    ['scope filtering changes max score and check list', () => {
      const full = JSON.parse(run(['repo', '--format', 'json']));
      const scoped = JSON.parse(run(['hooks', '--format', 'json']));

      assert.strictEqual(scoped.scope, 'hooks');
      assert.ok(scoped.max_score < full.max_score);
      assert.ok(scoped.checks.length < full.checks.length);
      // Any path containing 'scripts/hooks' also contains 'hooks', so a
      // single substring test covers both.
      assert.ok(scoped.checks.every(check => check.path.includes('hooks')));
    }],

    ['text format includes summary header', () => {
      const output = run(['repo']);

      assert.ok(output.includes('Harness Audit (repo):'));
      assert.ok(output.includes('Top 3 Actions:') || output.includes('Checks:'));
    }],
  ];

  let passed = 0;
  let failed = 0;

  for (const [name, fn] of cases) {
    if (test(name, fn)) {
      passed++;
    } else {
      failed++;
    }
  }

  console.log(`\nResults: Passed: ${passed}, Failed: ${failed}`);
  process.exit(failed > 0 ? 1 : 0);
}
|
||||
|
||||
runTests();
|
||||
Reference in New Issue
Block a user