feat: export continuity hard-gate and watchdog workstream
This commit is contained in:
421
scripts/test_approved_plan_continuity_gate.mjs
Normal file
421
scripts/test_approved_plan_continuity_gate.mjs
Normal file
@@ -0,0 +1,421 @@
|
||||
#!/usr/bin/env node
|
||||
import { mkdirSync, mkdtempSync, rmSync, writeFileSync } from 'node:fs';
|
||||
import os from 'node:os';
|
||||
import path from 'node:path';
|
||||
import { spawnSync } from 'node:child_process';
|
||||
import { fileURLToPath } from 'node:url';
|
||||
|
||||
const __filename = fileURLToPath(import.meta.url);
|
||||
const __dirname = path.dirname(__filename);
|
||||
const gateScript = path.join(__dirname, 'approved_plan_continuity_gate.mjs');
|
||||
|
||||
/**
 * Create a throw-away directory under the OS temp dir and populate it.
 *
 * Each key of `files` is a path relative to the fixture root; missing parent
 * directories are created. String values are written verbatim; any other
 * value is written as pretty-printed JSON (2-space indent) followed by a
 * newline.
 *
 * If populating the directory throws (e.g. a value JSON.stringify rejects, or
 * a filesystem error), the directory is removed before the error is rethrown,
 * because the caller never receives a handle it could use to clean up.
 *
 * @param {Record<string, unknown>} [files] - relative path -> file content.
 * @returns {{ root: string, path: (...segments: string[]) => string, cleanup: () => void }}
 *   `root` is the fixture directory, `path()` joins segments onto it, and
 *   `cleanup()` recursively removes it (no error if it is already gone).
 * @throws Whatever the underlying fs / JSON call throws.
 */
function createFixture(files = {}) {
  const root = mkdtempSync(path.join(os.tmpdir(), 'approved-plan-continuity-'));
  const removeRoot = () => rmSync(root, { recursive: true, force: true });

  try {
    for (const [relativePath, content] of Object.entries(files)) {
      const filePath = path.join(root, relativePath);
      const body = typeof content === 'string' ? content : `${JSON.stringify(content, null, 2)}\n`;
      mkdirSync(path.dirname(filePath), { recursive: true });
      writeFileSync(filePath, body);
    }
  } catch (error) {
    // Do not leak the temp directory when the fixture is only half-built.
    removeRoot();
    throw error;
  }

  return {
    root,
    path(...segments) {
      return path.join(root, ...segments);
    },
    cleanup() {
      removeRoot();
    },
  };
}
|
||||
|
||||
/**
 * Run the gate script synchronously in a child Node process.
 *
 * The child is started with the same Node binary as the current process
 * (`process.execPath`) and receives `gateScript` followed by `args`.
 *
 * @param {object} [options]
 * @param {string[]} [options.args] - extra CLI arguments placed after the script path.
 * @param {string|null} [options.stdin] - data passed as the child's `input`; null sends nothing.
 * @returns {{
 *   status: number|null,
 *   stdout: string,
 *   stderr: string,
 *   json: unknown,
 *   signal: string|null,
 *   error: Error|null,
 * }}
 *   `json` is stdout parsed as JSON, or null when stdout is empty/whitespace
 *   or not valid JSON. `signal` and `error` are forwarded from spawnSync so a
 *   failed spawn or a signal-terminated child can be diagnosed instead of
 *   surfacing only as `status: null`.
 */
function runGate({ args = [], stdin = null } = {}) {
  const child = spawnSync(process.execPath, [gateScript, ...args], {
    input: stdin,
    encoding: 'utf8',
  });

  let json = null;
  const hasOutput = Boolean(child.stdout && child.stdout.trim());
  if (hasOutput) {
    try {
      json = JSON.parse(child.stdout);
    } catch {
      // Non-JSON stdout is a legitimate outcome here; callers inspect the
      // raw `stdout` field when `json` is null.
      json = null;
    }
  }

  return {
    status: child.status,
    stdout: child.stdout,
    stderr: child.stderr,
    json,
    signal: child.signal,
    // spawnSync only sets `error` when the child failed or timed out.
    error: child.error || null,
  };
}
|
||||
|
||||
/**
 * Write `input` to `input.json` in a fresh fixture, run the gate on it with
 * `--compact --input <path>`, and return the parsed JSON envelope.
 *
 * The fixture is always removed, whether or not the run succeeds.
 *
 * @param {object} input - payload serialized to the fixture's input.json.
 * @returns {object} the JSON value the gate printed on stdout.
 * @throws {Error} when the exit status is neither 0 nor null, or when stdout
 *   did not parse to a non-null JSON object/array.
 */
function runGateOnInput(input) {
  const fixture = createFixture({ 'input.json': input });

  try {
    const result = runGate({
      args: ['--compact', '--input', fixture.path('input.json')],
    });

    // NOTE(review): a null status (child ended by a signal, per the Node
    // docs) is tolerated here exactly as in the original checks — confirm
    // that is intended.
    if (result.status !== 0 && result.status !== null) {
      throw new Error(`expected controlled execution, got status=${result.status}\n${result.stderr || result.stdout}`);
    }

    if (!result.json || typeof result.json !== 'object') {
      throw new Error(`expected JSON output\nstdout=${result.stdout}`);
    }

    return result.json;
  } finally {
    fixture.cleanup();
  }
}

/**
 * Assert the envelope reports a continuity failure.
 *
 * @param {object} json - parsed gate output.
 * @param {string} [qualifier] - text inserted into the error messages after
 *   the expectation (include its leading space).
 * @throws {Error} when `ok` is not exactly false or `verdict` is not
 *   'continuity_failure'.
 */
function expectContinuityFailure(json, qualifier = '') {
  if (json.ok !== false) {
    throw new Error(`expected continuity failure ok=false${qualifier}, got ${JSON.stringify(json)}`);
  }

  if (json.verdict !== 'continuity_failure') {
    throw new Error(`expected verdict=continuity_failure${qualifier}, got ${JSON.stringify(json.verdict)}`);
  }
}

/**
 * Assert the envelope reports a continuity pass.
 *
 * @param {object} json - parsed gate output.
 * @param {string} condition - completes "ok=true when ..." in the error message.
 * @throws {Error} when `ok` is not exactly true.
 */
function expectContinuityPass(json, condition) {
  if (json.ok !== true) {
    throw new Error(`expected continuity pass ok=true when ${condition}, got ${JSON.stringify(json)}`);
  }
}

// Each entry is { name, run }; run() throws an Error to signal failure.
const tests = [
  {
    name: 'skeleton: gate script responds with placeholder envelope when given fixture input',
    run() {
      const json = runGateOnInput({
        planId: 'plan-skeleton',
        currentTask: 'task-5',
      });

      if (json.gate !== 'approved_plan_continuity') {
        throw new Error(`expected gate=approved_plan_continuity, got ${JSON.stringify(json.gate)}`);
      }
    },
  },
  {
    name: 'continuity: fails when task is complete, next action is known, no dispatch receipt exists, and closure is not in an allowed terminal state',
    run() {
      const json = runGateOnInput({
        planId: 'plan-missing-dispatch',
        currentTask: 'task-6',
        taskState: 'complete',
        nextDerivedAction: {
          type: 'message_subagent',
          task: 'continue with task-7',
        },
        replyClosureState: 'completed',
        dispatchReceipt: null,
      });

      expectContinuityFailure(json);
    },
  },
  {
    name: 'continuity: fails when planner returns derivedAction without any bound dispatch receipt',
    run() {
      const json = runGateOnInput({
        planId: 'plan-derived-action-without-bound-dispatch',
        currentTask: 'task-6b',
        taskState: 'complete',
        derivedAction: {
          type: 'message_subagent',
          task: 'continue with task-7b',
        },
        replyClosureState: 'completed',
        dispatchReceipt: null,
      });

      expectContinuityFailure(json, ' for derivedAction without dispatch receipt');
    },
  },

  {
    name: 'continuity: passes when task is complete, next action is known, and a dispatch receipt already exists',
    run() {
      const json = runGateOnInput({
        planId: 'plan-existing-dispatch',
        currentTask: 'task-6',
        taskState: 'complete',
        nextDerivedAction: {
          type: 'message_subagent',
          task: 'continue with task-7',
        },
        replyClosureState: 'completed',
        dispatchReceipt: {
          planId: 'plan-existing-dispatch',
          currentTask: 'task-6',
          nextDerivedAction: {
            type: 'message_subagent',
            task: 'continue with task-7',
          },
          dispatchedAt: '2026-04-24T11:55:00+08:00',
        },
      });

      expectContinuityPass(json, 'dispatch receipt exists');
    },
  },

  {
    name: 'continuity: passes when planner returns derivedAction and a bound dispatch receipt already exists',
    run() {
      const json = runGateOnInput({
        planId: 'plan-derived-action-with-bound-dispatch',
        currentTask: 'task-6c',
        taskState: 'complete',
        derivedAction: {
          type: 'message_subagent',
          task: 'continue with task-7c',
        },
        replyClosureState: 'completed',
        dispatchReceipt: {
          planId: 'plan-derived-action-with-bound-dispatch',
          currentTask: 'task-6c',
          derivedAction: {
            type: 'message_subagent',
            task: 'continue with task-7c',
          },
          dispatchedAt: '2026-04-24T12:05:00+08:00',
        },
      });

      expectContinuityPass(json, 'derivedAction has bound dispatch receipt');
    },
  },

  {
    name: 'continuity: passes when task is complete, next action is known, no dispatch receipt exists, and closure is waiting_user',
    run() {
      const json = runGateOnInput({
        planId: 'plan-waiting-user-closure',
        currentTask: 'task-8',
        taskState: 'complete',
        nextDerivedAction: {
          type: 'message_subagent',
          task: 'continue with task-9',
        },
        replyClosureState: 'waiting_user',
        dispatchReceipt: null,
      });

      expectContinuityPass(json, 'closure is waiting_user');
    },
  },

  {
    name: 'continuity: passes when task is complete, next action is known, no dispatch receipt exists, and closure is pending_verification',
    run() {
      const json = runGateOnInput({
        planId: 'plan-pending-verification-closure',
        currentTask: 'task-8b',
        taskState: 'complete',
        nextDerivedAction: {
          type: 'message_subagent',
          task: 'continue with task-9',
        },
        replyClosureState: 'pending_verification',
        dispatchReceipt: null,
      });

      expectContinuityPass(json, 'closure is pending_verification');
    },
  },

  {
    name: 'continuity: passes when task is complete, next action is known, no dispatch receipt exists, and closure is blocked',
    run() {
      const json = runGateOnInput({
        planId: 'plan-blocked-closure',
        currentTask: 'task-9',
        taskState: 'complete',
        nextDerivedAction: {
          type: 'message_subagent',
          task: 'continue with task-10',
        },
        replyClosureState: 'blocked',
        dispatchReceipt: null,
      });

      expectContinuityPass(json, 'closure is blocked');
    },
  },
];
|
||||
|
||||
// Run every test in declaration order; a throwing run() is recorded as a
// failure with its message instead of aborting the remaining tests.
const results = tests.map((test) => {
  try {
    test.run();
    return { test: test.name, ok: true };
  } catch (error) {
    return {
      test: test.name,
      ok: false,
      error: error instanceof Error ? error.message : String(error),
    };
  }
});

const failedCount = results.filter((entry) => !entry.ok).length;

const summary = {
  total: tests.length,
  passed: results.length - failedCount,
  failed: failedCount,
};

// Emit the machine-readable report as pretty-printed JSON on stdout.
process.stdout.write(`${JSON.stringify({ summary, results }, null, 2)}\n`);

// Set the exit code rather than calling process.exit(): exit() can terminate
// the process before a pending asynchronous stdout write has been flushed,
// which would truncate the report above.
if (failedCount > 0) process.exitCode = 1;
|
||||
Reference in New Issue
Block a user