322 lines
10 KiB
TypeScript
322 lines
10 KiB
TypeScript
/**
|
|
* Integration tests: debug prompt log wiring in executePiece().
|
|
*/
|
|
|
|
import { describe, it, expect, beforeEach, vi } from 'vitest';
|
|
import type { PieceConfig } from '../core/models/index.js';
|
|
|
|
const { mockIsDebugEnabled, mockWritePromptLog, MockPieceEngine } = vi.hoisted(() => {
|
|
// eslint-disable-next-line @typescript-eslint/no-require-imports
|
|
const { EventEmitter: EE } = require('node:events') as typeof import('node:events');
|
|
|
|
const mockIsDebugEnabled = vi.fn().mockReturnValue(true);
|
|
const mockWritePromptLog = vi.fn();
|
|
|
|
class MockPieceEngine extends EE {
|
|
private config: PieceConfig;
|
|
private task: string;
|
|
|
|
constructor(config: PieceConfig, _cwd: string, task: string, _options: unknown) {
|
|
super();
|
|
if (task === 'constructor-throw-task') {
|
|
throw new Error('mock constructor failure');
|
|
}
|
|
this.config = config;
|
|
this.task = task;
|
|
}
|
|
|
|
abort(): void {}
|
|
|
|
async run(): Promise<{ status: string; iteration: number }> {
|
|
const step = this.config.movements[0]!;
|
|
const timestamp = new Date('2026-02-07T00:00:00.000Z');
|
|
const shouldAbort = this.task === 'abort-task';
|
|
|
|
const shouldRepeatMovement = this.task === 'repeat-movement-task';
|
|
this.emit('movement:start', step, 1, 'movement instruction');
|
|
this.emit('phase:start', step, 1, 'execute', 'phase prompt');
|
|
this.emit('phase:complete', step, 1, 'execute', 'phase response', 'done');
|
|
this.emit(
|
|
'movement:complete',
|
|
step,
|
|
{
|
|
persona: step.personaDisplayName,
|
|
status: 'done',
|
|
content: 'movement response',
|
|
timestamp,
|
|
},
|
|
'movement instruction'
|
|
);
|
|
if (shouldRepeatMovement) {
|
|
this.emit('movement:start', step, 2, 'movement instruction repeat');
|
|
this.emit(
|
|
'movement:complete',
|
|
step,
|
|
{
|
|
persona: step.personaDisplayName,
|
|
status: 'done',
|
|
content: 'movement response repeat',
|
|
timestamp,
|
|
},
|
|
'movement instruction repeat'
|
|
);
|
|
}
|
|
if (shouldAbort) {
|
|
this.emit('piece:abort', { status: 'aborted', iteration: 1 }, 'user_interrupted');
|
|
return { status: 'aborted', iteration: shouldRepeatMovement ? 2 : 1 };
|
|
}
|
|
this.emit('piece:complete', { status: 'completed', iteration: 1 });
|
|
return { status: 'completed', iteration: shouldRepeatMovement ? 2 : 1 };
|
|
}
|
|
}
|
|
|
|
return { mockIsDebugEnabled, mockWritePromptLog, MockPieceEngine };
|
|
});
|
|
|
|
vi.mock('../core/piece/index.js', () => ({
|
|
PieceEngine: MockPieceEngine,
|
|
}));
|
|
|
|
vi.mock('../infra/claude/query-manager.js', () => ({
|
|
interruptAllQueries: vi.fn(),
|
|
}));
|
|
|
|
vi.mock('../agents/ai-judge.js', () => ({
|
|
callAiJudge: vi.fn(),
|
|
}));
|
|
|
|
vi.mock('../infra/config/index.js', () => ({
|
|
loadPersonaSessions: vi.fn().mockReturnValue({}),
|
|
updatePersonaSession: vi.fn(),
|
|
loadWorktreeSessions: vi.fn().mockReturnValue({}),
|
|
updateWorktreeSession: vi.fn(),
|
|
resolvePieceConfigValues: vi.fn().mockReturnValue({
|
|
notificationSound: true,
|
|
notificationSoundEvents: {},
|
|
provider: 'claude',
|
|
runtime: undefined,
|
|
preventSleep: false,
|
|
model: undefined,
|
|
observability: undefined,
|
|
}),
|
|
saveSessionState: vi.fn(),
|
|
ensureDir: vi.fn(),
|
|
writeFileAtomic: vi.fn(),
|
|
}));
|
|
|
|
vi.mock('../shared/context.js', () => ({
|
|
isQuietMode: vi.fn().mockReturnValue(true),
|
|
}));
|
|
|
|
vi.mock('../shared/ui/index.js', () => ({
|
|
header: vi.fn(),
|
|
info: vi.fn(),
|
|
warn: vi.fn(),
|
|
error: vi.fn(),
|
|
success: vi.fn(),
|
|
status: vi.fn(),
|
|
blankLine: vi.fn(),
|
|
StreamDisplay: vi.fn().mockImplementation(() => ({
|
|
createHandler: vi.fn().mockReturnValue(vi.fn()),
|
|
flush: vi.fn(),
|
|
})),
|
|
}));
|
|
|
|
vi.mock('../infra/fs/index.js', () => ({
|
|
generateSessionId: vi.fn().mockReturnValue('test-session-id'),
|
|
createSessionLog: vi.fn().mockReturnValue({
|
|
startTime: new Date().toISOString(),
|
|
iterations: 0,
|
|
}),
|
|
finalizeSessionLog: vi.fn().mockImplementation((log, status) => ({
|
|
...log,
|
|
status,
|
|
endTime: new Date().toISOString(),
|
|
})),
|
|
initNdjsonLog: vi.fn().mockReturnValue('/tmp/test-log.jsonl'),
|
|
appendNdjsonLine: vi.fn(),
|
|
}));
|
|
|
|
vi.mock('../shared/utils/index.js', () => ({
|
|
createLogger: vi.fn().mockReturnValue({
|
|
debug: vi.fn(),
|
|
info: vi.fn(),
|
|
warn: vi.fn(),
|
|
error: vi.fn(),
|
|
}),
|
|
notifySuccess: vi.fn(),
|
|
notifyError: vi.fn(),
|
|
preventSleep: vi.fn(),
|
|
isDebugEnabled: mockIsDebugEnabled,
|
|
writePromptLog: mockWritePromptLog,
|
|
generateReportDir: vi.fn().mockReturnValue('test-report-dir'),
|
|
isValidReportDirName: vi.fn().mockImplementation((value: string) => /^[a-z0-9]+(?:-[a-z0-9]+)*$/.test(value)),
|
|
}));
|
|
|
|
vi.mock('../shared/prompt/index.js', () => ({
|
|
selectOption: vi.fn(),
|
|
promptInput: vi.fn(),
|
|
}));
|
|
|
|
vi.mock('../shared/i18n/index.js', () => ({
|
|
getLabel: vi.fn().mockImplementation((key: string) => key),
|
|
}));
|
|
|
|
vi.mock('../shared/exitCodes.js', () => ({
|
|
EXIT_SIGINT: 130,
|
|
}));
|
|
|
|
import { executePiece } from '../features/tasks/execute/pieceExecution.js';
|
|
import { ensureDir, writeFileAtomic } from '../infra/config/index.js';
|
|
|
|
describe('executePiece debug prompts logging', () => {
|
|
beforeEach(() => {
|
|
vi.clearAllMocks();
|
|
});
|
|
|
|
function makeConfig(): PieceConfig {
|
|
return {
|
|
name: 'test-piece',
|
|
maxMovements: 5,
|
|
initialMovement: 'implement',
|
|
movements: [
|
|
{
|
|
name: 'implement',
|
|
persona: '../agents/coder.md',
|
|
personaDisplayName: 'coder',
|
|
instructionTemplate: 'Implement task',
|
|
passPreviousResponse: true,
|
|
rules: [{ condition: 'done', next: 'COMPLETE' }],
|
|
},
|
|
],
|
|
};
|
|
}
|
|
|
|
it('should write prompt log record when debug is enabled', async () => {
|
|
mockIsDebugEnabled.mockReturnValue(true);
|
|
|
|
await executePiece(makeConfig(), 'task', '/tmp/project', {
|
|
projectCwd: '/tmp/project',
|
|
});
|
|
|
|
expect(mockWritePromptLog).toHaveBeenCalledTimes(1);
|
|
const record = mockWritePromptLog.mock.calls[0]?.[0] as {
|
|
movement: string;
|
|
phase: number;
|
|
iteration: number;
|
|
prompt: string;
|
|
response: string;
|
|
timestamp: string;
|
|
};
|
|
expect(record.movement).toBe('implement');
|
|
expect(record.phase).toBe(1);
|
|
expect(record.iteration).toBe(1);
|
|
expect(record.prompt).toBe('phase prompt');
|
|
expect(record.response).toBe('phase response');
|
|
expect(record.timestamp).toMatch(/^\d{4}-\d{2}-\d{2}T/);
|
|
});
|
|
|
|
it('should not write prompt log record when debug is disabled', async () => {
|
|
mockIsDebugEnabled.mockReturnValue(false);
|
|
|
|
await executePiece(makeConfig(), 'task', '/tmp/project', {
|
|
projectCwd: '/tmp/project',
|
|
});
|
|
|
|
expect(mockWritePromptLog).not.toHaveBeenCalled();
|
|
});
|
|
|
|
it('should update movement prefix context on each movement:start event', async () => {
|
|
const stdoutSpy = vi.spyOn(process.stdout, 'write').mockImplementation(() => true);
|
|
|
|
try {
|
|
await executePiece(makeConfig(), 'repeat-movement-task', '/tmp/project', {
|
|
projectCwd: '/tmp/project',
|
|
taskPrefix: 'override-persona-provider',
|
|
taskColorIndex: 0,
|
|
});
|
|
|
|
const output = stdoutSpy.mock.calls.map((call) => String(call[0])).join('');
|
|
const normalizedOutput = output.replace(/\x1b\[[0-9;]*m/g, '');
|
|
expect(normalizedOutput).toContain('[over][implement](1/5)(1) [INFO] [1/5] implement (coder)');
|
|
expect(normalizedOutput).toContain('[over][implement](2/5)(2) [INFO] [2/5] implement (coder)');
|
|
} finally {
|
|
stdoutSpy.mockRestore();
|
|
}
|
|
});
|
|
|
|
it('should fail fast when taskPrefix is provided without taskColorIndex', async () => {
|
|
await expect(
|
|
executePiece(makeConfig(), 'task', '/tmp/project', {
|
|
projectCwd: '/tmp/project',
|
|
taskPrefix: 'override-persona-provider',
|
|
})
|
|
).rejects.toThrow('taskPrefix and taskColorIndex must be provided together');
|
|
});
|
|
|
|
it('should fail fast for invalid reportDirName before run directory writes', async () => {
|
|
await expect(
|
|
executePiece(makeConfig(), 'task', '/tmp/project', {
|
|
projectCwd: '/tmp/project',
|
|
reportDirName: '..',
|
|
})
|
|
).rejects.toThrow('Invalid reportDirName: ..');
|
|
|
|
expect(vi.mocked(ensureDir)).not.toHaveBeenCalled();
|
|
expect(vi.mocked(writeFileAtomic)).not.toHaveBeenCalled();
|
|
});
|
|
|
|
it('should update meta status from running to completed', async () => {
|
|
await executePiece(makeConfig(), 'task', '/tmp/project', {
|
|
projectCwd: '/tmp/project',
|
|
reportDirName: 'test-report-dir',
|
|
});
|
|
|
|
const calls = vi.mocked(writeFileAtomic).mock.calls;
|
|
expect(calls).toHaveLength(2);
|
|
|
|
const firstMeta = JSON.parse(String(calls[0]![1])) as { status: string; endTime?: string };
|
|
const secondMeta = JSON.parse(String(calls[1]![1])) as { status: string; endTime?: string };
|
|
expect(firstMeta.status).toBe('running');
|
|
expect(firstMeta.endTime).toBeUndefined();
|
|
expect(secondMeta.status).toBe('completed');
|
|
expect(secondMeta.endTime).toMatch(/^\d{4}-\d{2}-\d{2}T/);
|
|
});
|
|
|
|
it('should update meta status from running to aborted', async () => {
|
|
await executePiece(makeConfig(), 'abort-task', '/tmp/project', {
|
|
projectCwd: '/tmp/project',
|
|
reportDirName: 'test-report-dir',
|
|
});
|
|
|
|
const calls = vi.mocked(writeFileAtomic).mock.calls;
|
|
expect(calls).toHaveLength(2);
|
|
|
|
const firstMeta = JSON.parse(String(calls[0]![1])) as { status: string; endTime?: string };
|
|
const secondMeta = JSON.parse(String(calls[1]![1])) as { status: string; endTime?: string };
|
|
expect(firstMeta.status).toBe('running');
|
|
expect(firstMeta.endTime).toBeUndefined();
|
|
expect(secondMeta.status).toBe('aborted');
|
|
expect(secondMeta.endTime).toMatch(/^\d{4}-\d{2}-\d{2}T/);
|
|
});
|
|
|
|
it('should finalize meta as aborted when PieceEngine constructor throws', async () => {
|
|
await expect(
|
|
executePiece(makeConfig(), 'constructor-throw-task', '/tmp/project', {
|
|
projectCwd: '/tmp/project',
|
|
reportDirName: 'test-report-dir',
|
|
})
|
|
).rejects.toThrow('mock constructor failure');
|
|
|
|
const calls = vi.mocked(writeFileAtomic).mock.calls;
|
|
expect(calls).toHaveLength(2);
|
|
|
|
const firstMeta = JSON.parse(String(calls[0]![1])) as { status: string; endTime?: string };
|
|
const secondMeta = JSON.parse(String(calls[1]![1])) as { status: string; endTime?: string };
|
|
expect(firstMeta.status).toBe('running');
|
|
expect(firstMeta.endTime).toBeUndefined();
|
|
expect(secondMeta.status).toBe('aborted');
|
|
expect(secondMeta.endTime).toMatch(/^\d{4}-\d{2}-\d{2}T/);
|
|
});
|
|
});
|