add it

2026-02-01 23:36:33 +09:00 · 2026-02-01 23:36:33 +09:00 · 942f983ea5
commit 942f983ea5
parent d6ac71f0e6
7 changed files with 2817 additions and 0 deletions
--- a/src/tests/it-error-recovery.test.ts
+++ b/src/tests/it-error-recovery.test.ts
@ -0,0 +1,365 @@
 /**
 * Error recovery integration tests.
 *
 * Tests agent error, blocked responses, max iteration limits,
 * loop detection, scenario queue exhaustion, and step execution exceptions.
 *
 * Mocked: UI, session, phase-runner, notifications, config, callAiJudge
 * Not mocked: WorkflowEngine, runAgent, detectMatchedRule, rule-evaluator
 */
 import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest';
 import { mkdtempSync, mkdirSync, writeFileSync, rmSync } from 'node:fs';
 import { join } from 'node:path';
 import { tmpdir } from 'node:os';
 import { setMockScenario, resetScenario } from '../mock/scenario.js';
 import type { WorkflowConfig, WorkflowStep, WorkflowRule } from '../models/types.js';
 // --- Mocks ---
 vi.mock('../claude/client.js', async (importOriginal) => {
  const original = await importOriginal<typeof import('../claude/client.js')>();
  return {
    ...original,
    callAiJudge: vi.fn().mockResolvedValue(-1),
  };
 });
 vi.mock('../workflow/phase-runner.js', () => ({
  needsStatusJudgmentPhase: vi.fn().mockReturnValue(false),
  runReportPhase: vi.fn().mockResolvedValue(undefined),
  runStatusJudgmentPhase: vi.fn().mockResolvedValue(''),
 }));
 vi.mock('../utils/session.js', () => ({
  generateReportDir: vi.fn().mockReturnValue('test-report-dir'),
  generateSessionId: vi.fn().mockReturnValue('test-session-id'),
 }));
 vi.mock('../config/globalConfig.js', () => ({
  loadGlobalConfig: vi.fn().mockReturnValue({}),
  getLanguage: vi.fn().mockReturnValue('en'),
  getDisabledBuiltins: vi.fn().mockReturnValue([]),
 }));
 vi.mock('../config/projectConfig.js', () => ({
  loadProjectConfig: vi.fn().mockReturnValue({}),
 }));
 // --- Imports (after mocks) ---
 import { WorkflowEngine } from '../workflow/engine.js';
 // --- Test helpers ---
 function makeRule(condition: string, next: string): WorkflowRule {
  return { condition, next };
 }
 function makeStep(name: string, agentPath: string, rules: WorkflowRule[]): WorkflowStep {
  return {
    name,
    agent: `./agents/${name}.md`,
    agentDisplayName: name,
    agentPath,
    instructionTemplate: '{task}',
    passPreviousResponse: true,
    rules,
  };
 }
 function createTestEnv(): { dir: string; agentPaths: Record<string, string> } {
  const dir = mkdtempSync(join(tmpdir(), 'takt-it-err-'));
  mkdirSync(join(dir, '.takt', 'reports', 'test-report-dir'), { recursive: true });
  const agentsDir = join(dir, 'agents');
  mkdirSync(agentsDir, { recursive: true });
  // Agent file names match step names used in makeStep()
  const agents = ['plan', 'implement', 'review', 'supervisor'];
  const agentPaths: Record<string, string> = {};
  for (const agent of agents) {
    const path = join(agentsDir, `${agent}.md`);
    writeFileSync(path, `You are a ${agent} agent.`);
    agentPaths[agent] = path;
  }
  return { dir, agentPaths };
 }
 function buildWorkflow(agentPaths: Record<string, string>, maxIterations: number): WorkflowConfig {
  return {
    name: 'it-error',
    description: 'IT error recovery workflow',
    maxIterations,
    initialStep: 'plan',
    steps: [
      makeStep('plan', agentPaths.plan, [
        makeRule('Requirements are clear', 'implement'),
        makeRule('Requirements unclear', 'ABORT'),
      ]),
      makeStep('implement', agentPaths.implement, [
        makeRule('Implementation complete', 'review'),
        makeRule('Cannot proceed', 'plan'),
      ]),
      makeStep('review', agentPaths.review, [
        makeRule('All checks passed', 'COMPLETE'),
        makeRule('Issues found', 'implement'),
      ]),
    ],
  };
 }
 describe('Error Recovery IT: agent blocked response', () => {
  let testDir: string;
  let agentPaths: Record<string, string>;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPaths = env.agentPaths;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should handle blocked agent response gracefully', async () => {
    setMockScenario([
      { agent: 'plan', status: 'blocked', content: 'Error: Agent is blocked.' },
    ]);
    const config = buildWorkflow(agentPaths, 10);
    const engine = new WorkflowEngine(config, testDir, 'Test task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    // Blocked agent should result in workflow abort
    expect(state.status).toBe('aborted');
  });
  it('should handle empty content from agent', async () => {
    setMockScenario([
      { agent: 'plan', status: 'done', content: '' },
    ]);
    const config = buildWorkflow(agentPaths, 10);
    const engine = new WorkflowEngine(config, testDir, 'Test task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    // Empty content means no tag match; should eventually abort
    expect(['aborted', 'completed']).toContain(state.status);
  });
 });
 describe('Error Recovery IT: max iterations reached', () => {
  let testDir: string;
  let agentPaths: Record<string, string>;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPaths = env.agentPaths;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should abort when max iterations reached (tight limit)', async () => {
    // Only 2 iterations allowed, but workflow needs 3 steps
    setMockScenario([
      { agent: 'plan', status: 'done', content: '[PLAN:1]\n\nClear.' },
      { agent: 'implement', status: 'done', content: '[IMPLEMENT:1]\n\nDone.' },
      { agent: 'review', status: 'done', content: '[REVIEW:1]\n\nPassed.' },
    ]);
    const config = buildWorkflow(agentPaths, 2);
    const engine = new WorkflowEngine(config, testDir, 'Task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    expect(state.status).toBe('aborted');
    expect(state.iteration).toBeLessThanOrEqual(2);
  });
  it('should abort when infinite plan → implement loop hits max', async () => {
    // plan → implement → plan → implement ...
    const loopScenario = Array.from({ length: 10 }, (_, i) => ({
      status: 'done' as const,
      content: i % 2 === 0 ? '[PLAN:1]\n\nClear.' : '[IMPLEMENT:2]\n\nCannot proceed.',
    }));
    setMockScenario(loopScenario);
    const config = buildWorkflow(agentPaths, 4);
    const engine = new WorkflowEngine(config, testDir, 'Looping task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    expect(state.status).toBe('aborted');
    expect(state.iteration).toBeLessThanOrEqual(4);
  });
 });
 describe('Error Recovery IT: scenario queue exhaustion', () => {
  let testDir: string;
  let agentPaths: Record<string, string>;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPaths = env.agentPaths;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should handle scenario queue exhaustion mid-workflow', async () => {
    // Only 1 entry, but workflow needs 3 steps
    setMockScenario([
      { agent: 'plan', status: 'done', content: '[PLAN:1]\n\nClear.' },
    ]);
    const config = buildWorkflow(agentPaths, 10);
    const engine = new WorkflowEngine(config, testDir, 'Task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    // Should not throw; mock client falls back to generic response when queue is empty
    const state = await engine.run();
    // Even with queue exhaustion, engine should reach some terminal state
    expect(['completed', 'aborted']).toContain(state.status);
  });
 });
 describe('Error Recovery IT: step events on error paths', () => {
  let testDir: string;
  let agentPaths: Record<string, string>;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPaths = env.agentPaths;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should emit workflow:abort event with reason on max iterations', async () => {
    const loopScenario = Array.from({ length: 6 }, (_, i) => ({
      status: 'done' as const,
      content: i % 2 === 0 ? '[PLAN:1]\n\nClear.' : '[IMPLEMENT:2]\n\nCannot proceed.',
    }));
    setMockScenario(loopScenario);
    const config = buildWorkflow(agentPaths, 3);
    const engine = new WorkflowEngine(config, testDir, 'Task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    let abortReason: string | undefined;
    engine.on('workflow:abort', (_state, reason) => {
      abortReason = reason;
    });
    await engine.run();
    expect(abortReason).toBeDefined();
  });
  it('should emit step:start and step:complete for each executed step before abort', async () => {
    setMockScenario([
      { agent: 'plan', status: 'done', content: '[PLAN:2]\n\nRequirements unclear.' },
    ]);
    const config = buildWorkflow(agentPaths, 10);
    const engine = new WorkflowEngine(config, testDir, 'Task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const startedSteps: string[] = [];
    const completedSteps: string[] = [];
    engine.on('step:start', (step) => {
      startedSteps.push(step.name);
    });
    engine.on('step:complete', (step) => {
      completedSteps.push(step.name);
    });
    await engine.run();
    expect(startedSteps).toEqual(['plan']);
    expect(completedSteps).toEqual(['plan']);
  });
 });
 describe('Error Recovery IT: programmatic abort', () => {
  let testDir: string;
  let agentPaths: Record<string, string>;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPaths = env.agentPaths;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should support engine.abort() to cancel running workflow', async () => {
    // Provide enough scenarios for 3 steps
    setMockScenario([
      { agent: 'plan', status: 'done', content: '[PLAN:1]\n\nClear.' },
      { agent: 'implement', status: 'done', content: '[IMPLEMENT:1]\n\nDone.' },
      { agent: 'review', status: 'done', content: '[REVIEW:1]\n\nPassed.' },
    ]);
    const config = buildWorkflow(agentPaths, 10);
    const engine = new WorkflowEngine(config, testDir, 'Task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    // Abort after the first step completes
    engine.on('step:complete', () => {
      engine.abort();
    });
    const state = await engine.run();
    expect(state.status).toBe('aborted');
    // Should have aborted after 1 step
    expect(state.iteration).toBeLessThanOrEqual(2);
  });
 });
--- a/src/tests/it-instruction-builder.test.ts
+++ b/src/tests/it-instruction-builder.test.ts
@ -0,0 +1,361 @@
 /**
 * Instruction builder integration tests.
 *
 * Tests template variable expansion and auto-injection in buildInstruction().
 * Uses real workflow step configs (not mocked) against the buildInstruction function.
 *
 * Not mocked: buildInstruction, buildReportInstruction, buildStatusJudgmentInstruction
 */
 import { describe, it, expect, vi } from 'vitest';
 import type { WorkflowStep, WorkflowRule, AgentResponse } from '../models/types.js';
 vi.mock('../config/globalConfig.js', () => ({
  loadGlobalConfig: vi.fn().mockReturnValue({}),
  getLanguage: vi.fn().mockReturnValue('en'),
 }));
 import {
  buildInstruction,
  buildReportInstruction,
  buildStatusJudgmentInstruction,
 } from '../workflow/instruction-builder.js';
 import type { InstructionContext } from '../workflow/instruction-builder.js';
 // --- Test helpers ---
 function makeRule(condition: string, next: string, extra?: Partial<WorkflowRule>): WorkflowRule {
  return { condition, next, ...extra };
 }
 function makeStep(overrides: Partial<WorkflowStep> = {}): WorkflowStep {
  return {
    name: 'test-step',
    agent: 'test-agent',
    agentDisplayName: 'test-step',
    instructionTemplate: 'Do the work.',
    passPreviousResponse: false,
    rules: [
      makeRule('Done', 'COMPLETE'),
      makeRule('Not done', 'ABORT'),
    ],
    ...overrides,
  };
 }
 function makeContext(overrides: Partial<InstructionContext> = {}): InstructionContext {
  return {
    task: 'Test task description',
    iteration: 3,
    maxIterations: 30,
    stepIteration: 2,
    cwd: '/tmp/test-project',
    projectCwd: '/tmp/test-project',
    userInputs: [],
    language: 'en',
    ...overrides,
  };
 }
 describe('Instruction Builder IT: task auto-injection', () => {
  it('should auto-inject task as "User Request" section when template has no {task}', () => {
    const step = makeStep({ instructionTemplate: 'Do the work.' });
    const ctx = makeContext({ task: 'Build the login page' });
    const result = buildInstruction(step, ctx);
    expect(result).toContain('## User Request');
    expect(result).toContain('Build the login page');
  });
  it('should NOT auto-inject task section when template contains {task}', () => {
    const step = makeStep({ instructionTemplate: 'Here is the task: {task}' });
    const ctx = makeContext({ task: 'Build the login page' });
    const result = buildInstruction(step, ctx);
    // Should not have separate User Request section
    const userRequestCount = (result.match(/## User Request/g) || []).length;
    expect(userRequestCount).toBe(0);
    // But task should still appear inline
    expect(result).toContain('Build the login page');
  });
 });
 describe('Instruction Builder IT: previous_response auto-injection', () => {
  it('should auto-inject previous response when passPreviousResponse is true', () => {
    const step = makeStep({
      passPreviousResponse: true,
      instructionTemplate: 'Continue the work.',
    });
    const previousOutput: AgentResponse = {
      agent: 'previous-agent',
      status: 'done',
      content: 'Previous agent completed step A.',
      timestamp: new Date(),
    };
    const ctx = makeContext({ previousOutput });
    const result = buildInstruction(step, ctx);
    expect(result).toContain('## Previous Response');
    expect(result).toContain('Previous agent completed step A.');
  });
  it('should NOT inject previous response when passPreviousResponse is false', () => {
    const step = makeStep({
      passPreviousResponse: false,
      instructionTemplate: 'Do fresh work.',
    });
    const previousOutput: AgentResponse = {
      agent: 'previous-agent',
      status: 'done',
      content: 'Previous output.',
      timestamp: new Date(),
    };
    const ctx = makeContext({ previousOutput });
    const result = buildInstruction(step, ctx);
    expect(result).not.toContain('## Previous Response');
    expect(result).not.toContain('Previous output.');
  });
  it('should NOT auto-inject when template contains {previous_response}', () => {
    const step = makeStep({
      passPreviousResponse: true,
      instructionTemplate: '## Context\n{previous_response}\n\nDo work.',
    });
    const previousOutput: AgentResponse = {
      agent: 'prev', status: 'done', content: 'Prior work done.', timestamp: new Date(),
    };
    const ctx = makeContext({ previousOutput });
    const result = buildInstruction(step, ctx);
    // Should not have separate Previous Response section
    const prevCount = (result.match(/## Previous Response/g) || []).length;
    expect(prevCount).toBe(0);
    // But content should be inline
    expect(result).toContain('Prior work done.');
  });
 });
 describe('Instruction Builder IT: user_inputs auto-injection', () => {
  it('should auto-inject user inputs section', () => {
    const step = makeStep();
    const ctx = makeContext({ userInputs: ['Fix the typo', 'Use TypeScript'] });
    const result = buildInstruction(step, ctx);
    expect(result).toContain('## Additional User Inputs');
    expect(result).toContain('Fix the typo');
    expect(result).toContain('Use TypeScript');
  });
  it('should NOT auto-inject when template contains {user_inputs}', () => {
    const step = makeStep({ instructionTemplate: 'Inputs: {user_inputs}' });
    const ctx = makeContext({ userInputs: ['Input A'] });
    const result = buildInstruction(step, ctx);
    const count = (result.match(/## Additional User Inputs/g) || []).length;
    expect(count).toBe(0);
    expect(result).toContain('Input A');
  });
 });
 describe('Instruction Builder IT: iteration variables', () => {
  it('should replace {iteration}, {max_iterations}, {step_iteration} in template', () => {
    const step = makeStep({
      instructionTemplate: 'Iter: {iteration}/{max_iterations}, step iter: {step_iteration}',
    });
    const ctx = makeContext({ iteration: 5, maxIterations: 30, stepIteration: 2 });
    const result = buildInstruction(step, ctx);
    expect(result).toContain('Iter: 5/30, step iter: 2');
  });
  it('should include iteration in Workflow Context section', () => {
    const step = makeStep();
    const ctx = makeContext({ iteration: 7, maxIterations: 20, stepIteration: 3 });
    const result = buildInstruction(step, ctx);
    expect(result).toContain('Iteration: 7/20');
    expect(result).toContain('Step Iteration: 3');
  });
 });
 describe('Instruction Builder IT: report_dir expansion', () => {
  it('should replace {report_dir} in template', () => {
    const step = makeStep({
      instructionTemplate: 'Read the plan from {report_dir}/00-plan.md',
    });
    const ctx = makeContext({ reportDir: '/tmp/test-project/.takt/reports/20250126-task' });
    const result = buildInstruction(step, ctx);
    expect(result).toContain('Read the plan from /tmp/test-project/.takt/reports/20250126-task/00-plan.md');
  });
  it('should replace {report:filename} with full path', () => {
    const step = makeStep({
      instructionTemplate: 'Read {report:00-plan.md} for the plan.',
    });
    const ctx = makeContext({ reportDir: '/tmp/reports' });
    const result = buildInstruction(step, ctx);
    expect(result).toContain('Read /tmp/reports/00-plan.md for the plan.');
  });
 });
 describe('Instruction Builder IT: status output rules injection', () => {
  it('should inject status rules for steps with tag-based rules', () => {
    const step = makeStep({
      name: 'plan',
      rules: [
        makeRule('Requirements clear', 'implement'),
        makeRule('Requirements unclear', 'ABORT'),
      ],
    });
    const ctx = makeContext();
    const result = buildInstruction(step, ctx);
    // Should contain status rules section with the tag format
    expect(result).toContain('[PLAN:');
    expect(result).toContain('Requirements clear');
    expect(result).toContain('Requirements unclear');
  });
  it('should NOT inject status rules for steps with only ai() conditions', () => {
    const step = makeStep({
      name: 'review',
      rules: [
        makeRule('ai("approved")', 'COMPLETE', { isAiCondition: true, aiConditionText: 'approved' }),
        makeRule('ai("rejected")', 'ABORT', { isAiCondition: true, aiConditionText: 'rejected' }),
      ],
    });
    const ctx = makeContext();
    const result = buildInstruction(step, ctx);
    // Should NOT contain tag-based status rules
    expect(result).not.toContain('[REVIEW:');
  });
 });
 describe('Instruction Builder IT: edit permission in execution context', () => {
  it('should include edit permission rules when edit is true', () => {
    const step = makeStep({ edit: true });
    const ctx = makeContext();
    const result = buildInstruction(step, ctx);
    // Should mention editing is allowed
    expect(result).toMatch(/edit|Edit|ファイル/i);
  });
  it('should indicate read-only when edit is false', () => {
    const step = makeStep({ edit: false });
    const ctx = makeContext();
    const result = buildInstruction(step, ctx);
    // Should contain the "Editing is DISABLED" execution rule
    expect(result).toContain('Editing is DISABLED');
    expect(result).not.toContain('Editing is ENABLED');
  });
 });
 describe('Instruction Builder IT: buildReportInstruction', () => {
  it('should build report instruction with report context', () => {
    const step = makeStep({
      name: 'plan',
      report: { name: '00-plan.md', format: '# Plan\n{step_iteration}' },
    });
    const result = buildReportInstruction(step, {
      cwd: '/tmp/test',
      reportDir: '/tmp/test/.takt/reports/test-dir',
      stepIteration: 1,
      language: 'en',
    });
    expect(result).toContain('00-plan.md');
    expect(result).toContain('/tmp/test/.takt/reports/test-dir');
    expect(result).toContain('report');
  });
  it('should throw for step without report config', () => {
    const step = makeStep({ report: undefined });
    expect(() =>
      buildReportInstruction(step, {
        cwd: '/tmp',
        reportDir: '/tmp/reports',
        stepIteration: 1,
      }),
    ).toThrow(/no report config/);
  });
 });
 describe('Instruction Builder IT: buildStatusJudgmentInstruction', () => {
  it('should build Phase 3 instruction with status rules', () => {
    const step = makeStep({
      name: 'plan',
      rules: [
        makeRule('Clear', 'implement'),
        makeRule('Unclear', 'ABORT'),
      ],
    });
    const result = buildStatusJudgmentInstruction(step, { language: 'en' });
    expect(result).toContain('[PLAN:');
    expect(result).toContain('Clear');
    expect(result).toContain('Unclear');
  });
  it('should throw for step without rules', () => {
    const step = makeStep({ rules: undefined });
    expect(() =>
      buildStatusJudgmentInstruction(step, { language: 'en' }),
    ).toThrow(/no rules/);
  });
 });
 describe('Instruction Builder IT: template injection prevention', () => {
  it('should escape curly braces in task content', () => {
    const step = makeStep();
    const ctx = makeContext({ task: 'Use {variable} in code' });
    const result = buildInstruction(step, ctx);
    // Braces should be escaped to prevent template re-injection
    expect(result).not.toContain('{variable}');
    expect(result).toContain('｛variable｝');
  });
  it('should escape curly braces in previous response content', () => {
    const step = makeStep({
      passPreviousResponse: true,
      instructionTemplate: 'Continue.',
    });
    const ctx = makeContext({
      previousOutput: {
        agent: 'prev', status: 'done',
        content: 'Use {template} syntax', timestamp: new Date(),
      },
    });
    const result = buildInstruction(step, ctx);
    expect(result).not.toContain('{template}');
    expect(result).toContain('｛template｝');
  });
 });
--- a/src/tests/it-pipeline-modes.test.ts
+++ b/src/tests/it-pipeline-modes.test.ts
@ -0,0 +1,546 @@
 /**
 * Pipeline execution mode integration tests.
 *
 * Tests various --pipeline mode option combinations including:
 * - --task, --issue, --skip-git, --auto-pr, --workflow (name/path), --provider, --model
 * - Exit codes for different failure scenarios
 *
 * Mocked: git (child_process), GitHub API, UI, notifications, session, phase-runner, config
 * Not mocked: executePipeline, executeTask, WorkflowEngine, runAgent, rule evaluation
 */
 import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest';
 import { mkdtempSync, mkdirSync, writeFileSync, rmSync } from 'node:fs';
 import { join } from 'node:path';
 import { tmpdir } from 'node:os';
 import { setMockScenario, resetScenario } from '../mock/scenario.js';
 // --- Mocks ---
 const {
  mockFetchIssue,
  mockFormatIssueAsTask,
  mockCheckGhCli,
  mockCreatePullRequest,
  mockPushBranch,
 } = vi.hoisted(() => ({
  mockFetchIssue: vi.fn(),
  mockFormatIssueAsTask: vi.fn(),
  mockCheckGhCli: vi.fn(),
  mockCreatePullRequest: vi.fn(),
  mockPushBranch: vi.fn(),
 }));
 vi.mock('../claude/client.js', async (importOriginal) => {
  const original = await importOriginal<typeof import('../claude/client.js')>();
  return {
    ...original,
    callAiJudge: vi.fn().mockResolvedValue(-1),
  };
 });
 vi.mock('node:child_process', () => ({
  execFileSync: vi.fn(),
 }));
 vi.mock('../github/issue.js', () => ({
  fetchIssue: mockFetchIssue,
  formatIssueAsTask: mockFormatIssueAsTask,
  checkGhCli: mockCheckGhCli,
 }));
 vi.mock('../github/pr.js', () => ({
  createPullRequest: mockCreatePullRequest,
  pushBranch: mockPushBranch,
  buildPrBody: vi.fn().mockReturnValue('PR body'),
 }));
 vi.mock('../task/git.js', () => ({
  stageAndCommit: vi.fn().mockReturnValue('abc1234'),
 }));
 vi.mock('../utils/ui.js', () => ({
  header: vi.fn(),
  info: vi.fn(),
  warn: vi.fn(),
  error: vi.fn(),
  success: vi.fn(),
  status: vi.fn(),
  blankLine: vi.fn(),
  StreamDisplay: vi.fn().mockImplementation(() => ({
    createHandler: () => vi.fn(),
    flush: vi.fn(),
  })),
 }));
 vi.mock('../utils/notification.js', () => ({
  notifySuccess: vi.fn(),
  notifyError: vi.fn(),
 }));
 vi.mock('../utils/session.js', () => ({
  generateSessionId: vi.fn().mockReturnValue('test-session-id'),
  createSessionLog: vi.fn().mockReturnValue({
    startTime: new Date().toISOString(),
    iterations: 0,
  }),
  finalizeSessionLog: vi.fn().mockImplementation((log, status) => ({ ...log, status })),
  updateLatestPointer: vi.fn(),
  initNdjsonLog: vi.fn().mockReturnValue('/tmp/test.ndjson'),
  appendNdjsonLine: vi.fn(),
  generateReportDir: vi.fn().mockReturnValue('test-report-dir'),
 }));
 vi.mock('../config/paths.js', async (importOriginal) => {
  const original = await importOriginal<typeof import('../config/paths.js')>();
  return {
    ...original,
    loadAgentSessions: vi.fn().mockReturnValue({}),
    updateAgentSession: vi.fn(),
    loadWorktreeSessions: vi.fn().mockReturnValue({}),
    updateWorktreeSession: vi.fn(),
    getCurrentWorkflow: vi.fn().mockReturnValue('default'),
    getProjectConfigDir: vi.fn().mockImplementation((cwd: string) => join(cwd, '.takt')),
  };
 });
 vi.mock('../config/globalConfig.js', async (importOriginal) => {
  const original = await importOriginal<typeof import('../config/globalConfig.js')>();
  return {
    ...original,
    loadGlobalConfig: vi.fn().mockReturnValue({}),
    getLanguage: vi.fn().mockReturnValue('en'),
    getDisabledBuiltins: vi.fn().mockReturnValue([]),
  };
 });
 vi.mock('../config/projectConfig.js', async (importOriginal) => {
  const original = await importOriginal<typeof import('../config/projectConfig.js')>();
  return {
    ...original,
    loadProjectConfig: vi.fn().mockReturnValue({}),
  };
 });
 vi.mock('../cli.js', () => ({
  isQuietMode: vi.fn().mockReturnValue(true),
 }));
 vi.mock('../prompt/index.js', () => ({
  selectOption: vi.fn().mockResolvedValue('stop'),
  promptInput: vi.fn().mockResolvedValue(null),
 }));
 vi.mock('../workflow/phase-runner.js', () => ({
  needsStatusJudgmentPhase: vi.fn().mockReturnValue(false),
  runReportPhase: vi.fn().mockResolvedValue(undefined),
  runStatusJudgmentPhase: vi.fn().mockResolvedValue(''),
 }));
 // --- Imports (after mocks) ---
 import { executePipeline } from '../commands/pipelineExecution.js';
 import {
  EXIT_ISSUE_FETCH_FAILED,
  EXIT_WORKFLOW_FAILED,
  EXIT_PR_CREATION_FAILED,
 } from '../exitCodes.js';
 // --- Test helpers ---
 function createTestWorkflowDir(): { dir: string; workflowPath: string } {
  const dir = mkdtempSync(join(tmpdir(), 'takt-it-pm-'));
  mkdirSync(join(dir, '.takt', 'reports', 'test-report-dir'), { recursive: true });
  const agentsDir = join(dir, 'agents');
  mkdirSync(agentsDir, { recursive: true });
  writeFileSync(join(agentsDir, 'planner.md'), 'You are a planner.');
  writeFileSync(join(agentsDir, 'coder.md'), 'You are a coder.');
  writeFileSync(join(agentsDir, 'reviewer.md'), 'You are a reviewer.');
  const workflowYaml = `
 name: it-pipeline
 description: Pipeline test workflow
 max_iterations: 10
 initial_step: plan
 steps:
  - name: plan
    agent: ./agents/planner.md
    rules:
      - condition: Requirements are clear
        next: implement
      - condition: Requirements unclear
        next: ABORT
    instruction: "{task}"
  - name: implement
    agent: ./agents/coder.md
    rules:
      - condition: Implementation complete
        next: review
      - condition: Cannot proceed
        next: plan
    instruction: "{task}"
  - name: review
    agent: ./agents/reviewer.md
    rules:
      - condition: All checks passed
        next: COMPLETE
      - condition: Issues found
        next: implement
    instruction: "{task}"
 `;
  const workflowPath = join(dir, 'workflow.yaml');
  writeFileSync(workflowPath, workflowYaml);
  return { dir, workflowPath };
 }
 function happyScenario(): void {
  setMockScenario([
    { agent: 'planner', status: 'done', content: '[PLAN:1]\n\nRequirements are clear.' },
    { agent: 'coder', status: 'done', content: '[IMPLEMENT:1]\n\nImplementation complete.' },
    { agent: 'reviewer', status: 'done', content: '[REVIEW:1]\n\nAll checks passed.' },
  ]);
 }
 describe('Pipeline Modes IT: --task + --workflow path', () => {
  let testDir: string;
  let workflowPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const setup = createTestWorkflowDir();
    testDir = setup.dir;
    workflowPath = setup.workflowPath;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should return exit code 0 on successful pipeline', async () => {
    happyScenario();
    const exitCode = await executePipeline({
      task: 'Add a feature',
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(0);
  });
  it('should return EXIT_WORKFLOW_FAILED (3) on ABORT', async () => {
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:2]\n\nRequirements unclear.' },
    ]);
    const exitCode = await executePipeline({
      task: 'Vague task',
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(EXIT_WORKFLOW_FAILED);
  });
 });
 describe('Pipeline Modes IT: --task + --workflow name (builtin)', () => {
  let testDir: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const setup = createTestWorkflowDir();
    testDir = setup.dir;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should load and execute builtin simple workflow by name', async () => {
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:1]\n\nRequirements are clear.' },
      { agent: 'coder', status: 'done', content: '[IMPLEMENT:1]\n\nImplementation complete.' },
      { agent: 'ai-antipattern-reviewer', status: 'done', content: '[AI_REVIEW:1]\n\nNo issues.' },
      { agent: 'architecture-reviewer', status: 'done', content: '[REVIEW:1]\n\nNo issues found.' },
      { agent: 'supervisor', status: 'done', content: '[SUPERVISE:1]\n\nAll checks passed.' },
    ]);
    const exitCode = await executePipeline({
      task: 'Add a feature',
      workflow: 'simple',
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(0);
  });
  it('should return EXIT_WORKFLOW_FAILED for non-existent workflow name', async () => {
    const exitCode = await executePipeline({
      task: 'Test task',
      workflow: 'non-existent-workflow-xyz',
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(EXIT_WORKFLOW_FAILED);
  });
 });
 describe('Pipeline Modes IT: --issue', () => {
  let testDir: string;
  let workflowPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const setup = createTestWorkflowDir();
    testDir = setup.dir;
    workflowPath = setup.workflowPath;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should fetch issue and execute workflow', async () => {
    mockCheckGhCli.mockReturnValue({ available: true });
    mockFetchIssue.mockReturnValue({
      number: 42,
      title: 'Fix the bug',
      body: 'Details here',
    });
    mockFormatIssueAsTask.mockReturnValue('Fix the bug\n\nDetails here');
    happyScenario();
    const exitCode = await executePipeline({
      issueNumber: 42,
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(0);
    expect(mockFetchIssue).toHaveBeenCalledWith(42);
  });
  it('should return EXIT_ISSUE_FETCH_FAILED when gh CLI unavailable', async () => {
    mockCheckGhCli.mockReturnValue({ available: false, error: 'gh not found' });
    const exitCode = await executePipeline({
      issueNumber: 42,
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(EXIT_ISSUE_FETCH_FAILED);
  });
  it('should return EXIT_ISSUE_FETCH_FAILED when issue fetch throws', async () => {
    mockCheckGhCli.mockReturnValue({ available: true });
    mockFetchIssue.mockImplementation(() => {
      throw new Error('Issue not found');
    });
    const exitCode = await executePipeline({
      issueNumber: 999,
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(EXIT_ISSUE_FETCH_FAILED);
  });
  it('should return EXIT_ISSUE_FETCH_FAILED when neither --issue nor --task specified', async () => {
    const exitCode = await executePipeline({
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(EXIT_ISSUE_FETCH_FAILED);
  });
 });
 describe('Pipeline Modes IT: --auto-pr', () => {
  let testDir: string;
  let workflowPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const setup = createTestWorkflowDir();
    testDir = setup.dir;
    workflowPath = setup.workflowPath;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should create PR on success when --auto-pr is set (without --skip-git)', async () => {
    happyScenario();
    mockCreatePullRequest.mockReturnValue({ success: true, url: 'https://github.com/test/pr/1' });
    const exitCode = await executePipeline({
      task: 'Add a feature',
      workflow: workflowPath,
      autoPr: true,
      skipGit: false,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(0);
    expect(mockCreatePullRequest).toHaveBeenCalled();
  });
  it('should return EXIT_PR_CREATION_FAILED when PR creation fails', async () => {
    happyScenario();
    mockCreatePullRequest.mockReturnValue({ success: false, error: 'Rate limited' });
    const exitCode = await executePipeline({
      task: 'Add a feature',
      workflow: workflowPath,
      autoPr: true,
      skipGit: false,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(EXIT_PR_CREATION_FAILED);
  });
  it('should skip PR creation when --auto-pr and --skip-git are both set', async () => {
    happyScenario();
    const exitCode = await executePipeline({
      task: 'Add a feature',
      workflow: workflowPath,
      autoPr: true,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(0);
    expect(mockCreatePullRequest).not.toHaveBeenCalled();
  });
 });
 describe('Pipeline Modes IT: --provider and --model overrides', () => {
  let testDir: string;
  let workflowPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const setup = createTestWorkflowDir();
    testDir = setup.dir;
    workflowPath = setup.workflowPath;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should pass provider override to workflow execution', async () => {
    happyScenario();
    const exitCode = await executePipeline({
      task: 'Test task',
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(0);
  });
  it('should pass model override to workflow execution', async () => {
    happyScenario();
    const exitCode = await executePipeline({
      task: 'Test task',
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
      model: 'opus',
    });
    expect(exitCode).toBe(0);
  });
 });
 describe('Pipeline Modes IT: review → fix loop', () => {
  let testDir: string;
  let workflowPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const setup = createTestWorkflowDir();
    testDir = setup.dir;
    workflowPath = setup.workflowPath;
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should handle review → implement → review loop', async () => {
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:1]\n\nClear.' },
      { agent: 'coder', status: 'done', content: '[IMPLEMENT:1]\n\nDone.' },
      // First review: issues found → back to implement
      { agent: 'reviewer', status: 'done', content: '[REVIEW:2]\n\nIssues found.' },
      // Fix
      { agent: 'coder', status: 'done', content: '[IMPLEMENT:1]\n\nFixed.' },
      // Second review: passed
      { agent: 'reviewer', status: 'done', content: '[REVIEW:1]\n\nAll checks passed.' },
    ]);
    const exitCode = await executePipeline({
      task: 'Task with fix loop',
      workflow: workflowPath,
      autoPr: false,
      skipGit: true,
      cwd: testDir,
      provider: 'mock',
    });
    expect(exitCode).toBe(0);
  });
 });
--- a/src/tests/it-rule-evaluation.test.ts
+++ b/src/tests/it-rule-evaluation.test.ts
@ -0,0 +1,418 @@
 /**
 * Rule evaluation integration tests.
 *
 * Tests the 5-stage rule evaluation cascade:
 * 1. Aggregate conditions (all/any)
 * 2. Phase 3 tag detection
 * 3. Phase 1 tag detection (fallback)
 * 4. AI judge for ai() conditions
 * 5. AI judge fallback for all conditions
 *
 * Also tests RuleMatchMethod tracking.
 *
 * Mocked: callAiJudge (controlled responses)
 * Not mocked: detectMatchedRule, evaluateAggregateConditions
 */
 import { describe, it, expect, beforeEach, vi } from 'vitest';
 import type { WorkflowStep, WorkflowState, WorkflowRule, AgentResponse } from '../models/types.js';
 // --- Mocks ---
 const mockCallAiJudge = vi.fn();
 vi.mock('../claude/client.js', async (importOriginal) => {
  const original = await importOriginal<typeof import('../claude/client.js')>();
  return {
    ...original,
    callAiJudge: (...args: unknown[]) => mockCallAiJudge(...args),
  };
 });
 vi.mock('../config/globalConfig.js', () => ({
  loadGlobalConfig: vi.fn().mockReturnValue({}),
  getLanguage: vi.fn().mockReturnValue('en'),
 }));
 vi.mock('../config/projectConfig.js', () => ({
  loadProjectConfig: vi.fn().mockReturnValue({}),
 }));
 // --- Imports (after mocks) ---
 import { detectMatchedRule, evaluateAggregateConditions } from '../workflow/rule-evaluator.js';
 import type { RuleMatch, RuleEvaluatorContext } from '../workflow/rule-evaluator.js';
 // --- Test helpers ---
 function makeRule(condition: string, next: string, extra?: Partial<WorkflowRule>): WorkflowRule {
  return { condition, next, ...extra };
 }
 function makeStep(name: string, rules: WorkflowRule[], parallel?: WorkflowStep[]): WorkflowStep {
  return {
    name,
    agent: 'test-agent',
    agentDisplayName: name,
    instructionTemplate: '{task}',
    passPreviousResponse: true,
    rules,
    parallel,
  };
 }
 function makeState(stepOutputs?: Map<string, AgentResponse>): WorkflowState {
  return {
    workflowName: 'it-test',
    currentStep: 'test',
    iteration: 1,
    status: 'running',
    stepOutputs: stepOutputs ?? new Map(),
    stepIterations: new Map(),
    agentSessions: new Map(),
    userInputs: [],
  };
 }
 function makeCtx(stepOutputs?: Map<string, AgentResponse>): RuleEvaluatorContext {
  return {
    state: makeState(stepOutputs),
    cwd: '/tmp/test',
  };
 }
 describe('Rule Evaluation IT: Phase 3 tag detection', () => {
  beforeEach(() => {
    vi.clearAllMocks();
    mockCallAiJudge.mockResolvedValue(-1);
  });
  it('should detect rule from Phase 3 tag content', async () => {
    const step = makeStep('plan', [
      makeRule('Clear', 'implement'),
      makeRule('Unclear', 'ABORT'),
    ]);
    const result = await detectMatchedRule(step, 'Agent output without tag.', '[PLAN:2]', makeCtx());
    expect(result).toEqual<RuleMatch>({ index: 1, method: 'phase3_tag' });
  });
  it('should prefer Phase 3 tag over Phase 1 tag', async () => {
    const step = makeStep('plan', [
      makeRule('Clear', 'implement'),
      makeRule('Unclear', 'ABORT'),
    ]);
    // Phase 1 has tag [PLAN:1], Phase 3 has tag [PLAN:2]
    const result = await detectMatchedRule(step, '[PLAN:1] Clear.', '[PLAN:2]', makeCtx());
    expect(result).toEqual<RuleMatch>({ index: 1, method: 'phase3_tag' });
  });
 });
 describe('Rule Evaluation IT: Phase 1 tag fallback', () => {
  beforeEach(() => {
    vi.clearAllMocks();
    mockCallAiJudge.mockResolvedValue(-1);
  });
  it('should fall back to Phase 1 tag when Phase 3 has no tag', async () => {
    const step = makeStep('plan', [
      makeRule('Clear', 'implement'),
      makeRule('Unclear', 'ABORT'),
    ]);
    const result = await detectMatchedRule(step, '[PLAN:1] Requirements are clear.', '', makeCtx());
    expect(result).toEqual<RuleMatch>({ index: 0, method: 'phase1_tag' });
  });
  it('should detect last tag when multiple tags in Phase 1', async () => {
    const step = makeStep('plan', [
      makeRule('Clear', 'implement'),
      makeRule('Unclear', 'ABORT'),
    ]);
    const result = await detectMatchedRule(step, 'Some [PLAN:1] text then [PLAN:2] final.', '', makeCtx());
    expect(result).toEqual<RuleMatch>({ index: 1, method: 'phase1_tag' });
  });
 });
 describe('Rule Evaluation IT: Aggregate conditions (all/any)', () => {
  beforeEach(() => {
    vi.clearAllMocks();
    mockCallAiJudge.mockResolvedValue(-1);
  });
  it('should match all("approved") when all sub-steps have "approved"', () => {
    const subStep1 = makeStep('arch-review', [
      makeRule('approved', ''),
      makeRule('needs_fix', ''),
    ]);
    const subStep2 = makeStep('security-review', [
      makeRule('approved', ''),
      makeRule('needs_fix', ''),
    ]);
    const parentStep = makeStep('reviewers', [
      makeRule('all("approved")', 'supervise', {
        isAggregateCondition: true,
        aggregateType: 'all',
        aggregateConditionText: 'approved',
      }),
      makeRule('any("needs_fix")', 'fix', {
        isAggregateCondition: true,
        aggregateType: 'any',
        aggregateConditionText: 'needs_fix',
      }),
    ], [subStep1, subStep2]);
    const outputs = new Map<string, AgentResponse>();
    outputs.set('arch-review', {
      agent: 'arch', status: 'done', content: 'approved',
      timestamp: new Date(), matchedRuleIndex: 0,
    });
    outputs.set('security-review', {
      agent: 'security', status: 'done', content: 'approved',
      timestamp: new Date(), matchedRuleIndex: 0,
    });
    const result = evaluateAggregateConditions(parentStep, makeState(outputs));
    expect(result).toBe(0); // all("approved") is rule index 0
  });
  it('should match any("needs_fix") when one sub-step has "needs_fix"', () => {
    const subStep1 = makeStep('arch-review', [
      makeRule('approved', ''),
      makeRule('needs_fix', ''),
    ]);
    const subStep2 = makeStep('security-review', [
      makeRule('approved', ''),
      makeRule('needs_fix', ''),
    ]);
    const parentStep = makeStep('reviewers', [
      makeRule('all("approved")', 'supervise', {
        isAggregateCondition: true,
        aggregateType: 'all',
        aggregateConditionText: 'approved',
      }),
      makeRule('any("needs_fix")', 'fix', {
        isAggregateCondition: true,
        aggregateType: 'any',
        aggregateConditionText: 'needs_fix',
      }),
    ], [subStep1, subStep2]);
    const outputs = new Map<string, AgentResponse>();
    outputs.set('arch-review', {
      agent: 'arch', status: 'done', content: 'approved',
      timestamp: new Date(), matchedRuleIndex: 0,
    });
    outputs.set('security-review', {
      agent: 'security', status: 'done', content: 'needs_fix',
      timestamp: new Date(), matchedRuleIndex: 1,
    });
    const result = evaluateAggregateConditions(parentStep, makeState(outputs));
    expect(result).toBe(1); // any("needs_fix") is rule index 1
  });
  it('should return -1 when no aggregate condition matches', () => {
    const subStep1 = makeStep('review-a', [
      makeRule('approved', ''),
      makeRule('needs_fix', ''),
    ]);
    const subStep2 = makeStep('review-b', [
      makeRule('approved', ''),
      makeRule('needs_fix', ''),
    ]);
    const parentStep = makeStep('reviews', [
      makeRule('all("approved")', 'done', {
        isAggregateCondition: true,
        aggregateType: 'all',
        aggregateConditionText: 'approved',
      }),
    ], [subStep1, subStep2]);
    const outputs = new Map<string, AgentResponse>();
    outputs.set('review-a', {
      agent: 'a', status: 'done', content: 'approved',
      timestamp: new Date(), matchedRuleIndex: 0,
    });
    outputs.set('review-b', {
      agent: 'b', status: 'done', content: 'needs_fix',
      timestamp: new Date(), matchedRuleIndex: 1,
    });
    const result = evaluateAggregateConditions(parentStep, makeState(outputs));
    expect(result).toBe(-1);
  });
  it('should return -1 for non-parallel step', () => {
    const step = makeStep('step', [
      makeRule('all("done")', 'COMPLETE', {
        isAggregateCondition: true,
        aggregateType: 'all',
        aggregateConditionText: 'done',
      }),
    ]);
    const result = evaluateAggregateConditions(step, makeState());
    expect(result).toBe(-1);
  });
 });
 describe('Rule Evaluation IT: ai() judge condition', () => {
  beforeEach(() => {
    vi.clearAllMocks();
  });
  it('should call AI judge for ai() conditions when no tag match', async () => {
    mockCallAiJudge.mockResolvedValue(0); // Judge says first ai() condition matches
    const step = makeStep('step', [
      makeRule('ai("The code is approved")', 'COMPLETE', {
        isAiCondition: true,
        aiConditionText: 'The code is approved',
      }),
      makeRule('ai("The code needs fixes")', 'fix', {
        isAiCondition: true,
        aiConditionText: 'The code needs fixes',
      }),
    ]);
    const result = await detectMatchedRule(step, 'Code looks great, no issues.', '', makeCtx());
    expect(result).toEqual<RuleMatch>({ index: 0, method: 'ai_judge' });
    expect(mockCallAiJudge).toHaveBeenCalled();
  });
  it('should skip AI judge if tag already matched', async () => {
    const step = makeStep('plan', [
      makeRule('ai("Clear")', 'implement', {
        isAiCondition: true,
        aiConditionText: 'Clear',
      }),
    ]);
    const result = await detectMatchedRule(step, '[PLAN:1] Clear.', '', makeCtx());
    expect(result).toEqual<RuleMatch>({ index: 0, method: 'phase1_tag' });
    expect(mockCallAiJudge).not.toHaveBeenCalled();
  });
 });
 describe('Rule Evaluation IT: AI judge fallback', () => {
  beforeEach(() => {
    vi.clearAllMocks();
  });
  it('should use AI judge fallback when no tag and no ai() conditions', async () => {
    // First call (ai() conditions): returns -1 (no ai() conditions exist)
    // Second call (all conditions fallback): returns 0
    mockCallAiJudge.mockResolvedValue(0);
    const step = makeStep('review', [
      makeRule('Approved', 'COMPLETE'),
      makeRule('Rejected', 'fix'),
    ]);
    // No tag in content, no ai() rules → goes to fallback
    const result = await detectMatchedRule(step, 'The code looks fine, approved.', '', makeCtx());
    expect(result).toEqual<RuleMatch>({ index: 0, method: 'ai_judge_fallback' });
  });
  it('should throw when no rule matches (AI judge returns -1 for all phases)', async () => {
    mockCallAiJudge.mockResolvedValue(-1);
    const step = makeStep('review', [
      makeRule('Approved', 'COMPLETE'),
      makeRule('Rejected', 'fix'),
    ]);
    await expect(
      detectMatchedRule(step, 'Totally unrelated content.', '', makeCtx()),
    ).rejects.toThrow(/no rule matched/);
  });
 });
 describe('Rule Evaluation IT: RuleMatchMethod tracking', () => {
  beforeEach(() => {
    vi.clearAllMocks();
    mockCallAiJudge.mockResolvedValue(-1);
  });
  it('should record method as "aggregate" for aggregate matches', () => {
    const subStep = makeStep('sub', [makeRule('ok', '')]);
    const parentStep = makeStep('parent', [
      makeRule('all("ok")', 'COMPLETE', {
        isAggregateCondition: true,
        aggregateType: 'all',
        aggregateConditionText: 'ok',
      }),
    ], [subStep]);
    const outputs = new Map<string, AgentResponse>();
    outputs.set('sub', {
      agent: 'sub', status: 'done', content: 'ok',
      timestamp: new Date(), matchedRuleIndex: 0,
    });
    const result = evaluateAggregateConditions(parentStep, makeState(outputs));
    expect(result).toBe(0);
    // Method verified via detectMatchedRule in engine integration
  });
  it('should record method as "phase3_tag" for Phase 3 matches', async () => {
    const step = makeStep('step', [
      makeRule('Done', 'COMPLETE'),
    ]);
    const result = await detectMatchedRule(step, 'content', '[STEP:1]', makeCtx());
    expect(result?.method).toBe('phase3_tag');
  });
  it('should record method as "phase1_tag" for Phase 1 fallback matches', async () => {
    const step = makeStep('step', [
      makeRule('Done', 'COMPLETE'),
    ]);
    const result = await detectMatchedRule(step, '[STEP:1] Done.', '', makeCtx());
    expect(result?.method).toBe('phase1_tag');
  });
 });
 describe('Rule Evaluation IT: steps without rules', () => {
  beforeEach(() => {
    vi.clearAllMocks();
  });
  it('should return undefined for step with no rules', async () => {
    const step: WorkflowStep = {
      name: 'step',
      agent: 'agent',
      agentDisplayName: 'step',
      instructionTemplate: '{task}',
      passPreviousResponse: true,
    };
    const result = await detectMatchedRule(step, 'content', '', makeCtx());
    expect(result).toBeUndefined();
  });
  it('should return undefined for step with empty rules array', async () => {
    const step = makeStep('step', []);
    const result = await detectMatchedRule(step, 'content', '', makeCtx());
    expect(result).toBeUndefined();
  });
 });
--- a/src/tests/it-three-phase-execution.test.ts
+++ b/src/tests/it-three-phase-execution.test.ts
@ -0,0 +1,392 @@
 /**
 * Three-phase execution integration tests.
 *
 * Tests Phase 1 (main) → Phase 2 (report) → Phase 3 (status judgment) lifecycle.
 * Verifies that the correct combination of phases fires based on step config.
 *
 * Mocked: UI, session, config, callAiJudge
 * Selectively mocked: phase-runner (to inspect call patterns)
 * Not mocked: WorkflowEngine, runAgent, detectMatchedRule, rule-evaluator
 */
 import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest';
 import { mkdtempSync, mkdirSync, writeFileSync, rmSync } from 'node:fs';
 import { join } from 'node:path';
 import { tmpdir } from 'node:os';
 import { setMockScenario, resetScenario } from '../mock/scenario.js';
 import type { WorkflowConfig, WorkflowStep, WorkflowRule } from '../models/types.js';
 // --- Mocks ---
 vi.mock('../claude/client.js', async (importOriginal) => {
  const original = await importOriginal<typeof import('../claude/client.js')>();
  return {
    ...original,
    callAiJudge: vi.fn().mockResolvedValue(-1),
  };
 });
 const mockNeedsStatusJudgmentPhase = vi.fn();
 const mockRunReportPhase = vi.fn();
 const mockRunStatusJudgmentPhase = vi.fn();
 vi.mock('../workflow/phase-runner.js', () => ({
  needsStatusJudgmentPhase: (...args: unknown[]) => mockNeedsStatusJudgmentPhase(...args),
  runReportPhase: (...args: unknown[]) => mockRunReportPhase(...args),
  runStatusJudgmentPhase: (...args: unknown[]) => mockRunStatusJudgmentPhase(...args),
 }));
 vi.mock('../utils/session.js', () => ({
  generateReportDir: vi.fn().mockReturnValue('test-report-dir'),
  generateSessionId: vi.fn().mockReturnValue('test-session-id'),
 }));
 vi.mock('../config/globalConfig.js', () => ({
  loadGlobalConfig: vi.fn().mockReturnValue({}),
  getLanguage: vi.fn().mockReturnValue('en'),
  getDisabledBuiltins: vi.fn().mockReturnValue([]),
 }));
 vi.mock('../config/projectConfig.js', () => ({
  loadProjectConfig: vi.fn().mockReturnValue({}),
 }));
 // --- Imports (after mocks) ---
 import { WorkflowEngine } from '../workflow/engine.js';
 // --- Test helpers ---
 function makeRule(condition: string, next: string): WorkflowRule {
  return { condition, next };
 }
 function createTestEnv(): { dir: string; agentPath: string } {
  const dir = mkdtempSync(join(tmpdir(), 'takt-it-3ph-'));
  mkdirSync(join(dir, '.takt', 'reports', 'test-report-dir'), { recursive: true });
  const agentsDir = join(dir, 'agents');
  mkdirSync(agentsDir, { recursive: true });
  const agentPath = join(agentsDir, 'agent.md');
  writeFileSync(agentPath, 'You are an agent.');
  return { dir, agentPath };
 }
 function makeStep(
  name: string,
  agentPath: string,
  rules: WorkflowRule[],
  options: { report?: string | { label: string; path: string }[]; edit?: boolean } = {},
 ): WorkflowStep {
  return {
    name,
    agent: './agents/agent.md',
    agentDisplayName: name,
    agentPath,
    instructionTemplate: '{task}',
    passPreviousResponse: true,
    rules,
    report: options.report,
    edit: options.edit,
  };
 }
 describe('Three-Phase Execution IT: phase1 only (no report, no tag rules)', () => {
  let testDir: string;
  let agentPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPath = env.agentPath;
    // No tag rules needed → Phase 3 not needed
    mockNeedsStatusJudgmentPhase.mockReturnValue(false);
    mockRunReportPhase.mockResolvedValue(undefined);
    mockRunStatusJudgmentPhase.mockResolvedValue('');
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should only run Phase 1 when step has no report and no tag rules', async () => {
    setMockScenario([
      { status: 'done', content: '[STEP:1]\n\nDone.' },
    ]);
    const config: WorkflowConfig = {
      name: 'it-phase1-only',
      description: 'Test',
      maxIterations: 5,
      initialStep: 'step',
      steps: [
        makeStep('step', agentPath, [
          makeRule('Done', 'COMPLETE'),
          makeRule('Not done', 'ABORT'),
        ]),
      ],
    };
    const engine = new WorkflowEngine(config, testDir, 'Test task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(mockRunReportPhase).not.toHaveBeenCalled();
    // needsStatusJudgmentPhase is called but returns false
    expect(mockRunStatusJudgmentPhase).not.toHaveBeenCalled();
  });
 });
 describe('Three-Phase Execution IT: phase1 + phase2 (report defined)', () => {
  let testDir: string;
  let agentPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPath = env.agentPath;
    mockNeedsStatusJudgmentPhase.mockReturnValue(false);
    mockRunReportPhase.mockResolvedValue(undefined);
    mockRunStatusJudgmentPhase.mockResolvedValue('');
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should run Phase 1 + Phase 2 when step has report', async () => {
    setMockScenario([
      { status: 'done', content: '[STEP:1]\n\nDone.' },
    ]);
    const config: WorkflowConfig = {
      name: 'it-phase1-2',
      description: 'Test',
      maxIterations: 5,
      initialStep: 'step',
      steps: [
        makeStep('step', agentPath, [
          makeRule('Done', 'COMPLETE'),
          makeRule('Not done', 'ABORT'),
        ], { report: 'test-report.md' }),
      ],
    };
    const engine = new WorkflowEngine(config, testDir, 'Test task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(mockRunReportPhase).toHaveBeenCalledTimes(1);
    expect(mockRunStatusJudgmentPhase).not.toHaveBeenCalled();
  });
  it('should run Phase 2 for multi-report step', async () => {
    setMockScenario([
      { status: 'done', content: '[STEP:1]\n\nDone.' },
    ]);
    const config: WorkflowConfig = {
      name: 'it-phase1-2-multi',
      description: 'Test',
      maxIterations: 5,
      initialStep: 'step',
      steps: [
        makeStep('step', agentPath, [
          makeRule('Done', 'COMPLETE'),
        ], { report: [{ label: 'Scope', path: 'scope.md' }, { label: 'Decisions', path: 'decisions.md' }] }),
      ],
    };
    const engine = new WorkflowEngine(config, testDir, 'Test task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(mockRunReportPhase).toHaveBeenCalledTimes(1);
  });
 });
 describe('Three-Phase Execution IT: phase1 + phase3 (tag rules defined)', () => {
  let testDir: string;
  let agentPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPath = env.agentPath;
    mockNeedsStatusJudgmentPhase.mockReturnValue(true);
    mockRunReportPhase.mockResolvedValue(undefined);
    // Phase 3 returns content with a tag
    mockRunStatusJudgmentPhase.mockResolvedValue('[STEP:1]');
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should run Phase 1 + Phase 3 when step has tag-based rules but no report', async () => {
    setMockScenario([
      // Phase 1: main content (no tag — Phase 3 will provide it)
      { status: 'done', content: 'Agent completed the work.' },
    ]);
    const config: WorkflowConfig = {
      name: 'it-phase1-3',
      description: 'Test',
      maxIterations: 5,
      initialStep: 'step',
      steps: [
        makeStep('step', agentPath, [
          makeRule('Done', 'COMPLETE'),
          makeRule('Not done', 'ABORT'),
        ]),
      ],
    };
    const engine = new WorkflowEngine(config, testDir, 'Test task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(mockRunReportPhase).not.toHaveBeenCalled();
    expect(mockRunStatusJudgmentPhase).toHaveBeenCalledTimes(1);
  });
 });
 describe('Three-Phase Execution IT: all three phases', () => {
  let testDir: string;
  let agentPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPath = env.agentPath;
    mockNeedsStatusJudgmentPhase.mockReturnValue(true);
    mockRunReportPhase.mockResolvedValue(undefined);
    mockRunStatusJudgmentPhase.mockResolvedValue('[STEP:1]');
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should run Phase 1 → Phase 2 → Phase 3 when step has report and tag rules', async () => {
    setMockScenario([
      { status: 'done', content: 'Agent completed the work.' },
    ]);
    const config: WorkflowConfig = {
      name: 'it-all-phases',
      description: 'Test',
      maxIterations: 5,
      initialStep: 'step',
      steps: [
        makeStep('step', agentPath, [
          makeRule('Done', 'COMPLETE'),
          makeRule('Not done', 'ABORT'),
        ], { report: 'test-report.md' }),
      ],
    };
    const engine = new WorkflowEngine(config, testDir, 'Test task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(mockRunReportPhase).toHaveBeenCalledTimes(1);
    expect(mockRunStatusJudgmentPhase).toHaveBeenCalledTimes(1);
    // Verify ordering: report phase is called before status judgment
    const reportCallOrder = mockRunReportPhase.mock.invocationCallOrder[0];
    const judgmentCallOrder = mockRunStatusJudgmentPhase.mock.invocationCallOrder[0];
    expect(reportCallOrder).toBeLessThan(judgmentCallOrder);
  });
 });
 describe('Three-Phase Execution IT: phase3 tag → rule match', () => {
  let testDir: string;
  let agentPath: string;
  beforeEach(() => {
    vi.clearAllMocks();
    const env = createTestEnv();
    testDir = env.dir;
    agentPath = env.agentPath;
    mockNeedsStatusJudgmentPhase.mockReturnValue(true);
    mockRunReportPhase.mockResolvedValue(undefined);
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should use Phase 3 tag for rule matching over Phase 1 content', async () => {
    // Phase 1 content has no tag → fallback
    setMockScenario([
      { status: 'done', content: 'Work done.' },
      { status: 'done', content: '[STEP2:1]\n\nChecked.' },
    ]);
    // Phase 3 returns rule 2 (ABORT)
    mockRunStatusJudgmentPhase.mockResolvedValue('[STEP1:2]');
    const config: WorkflowConfig = {
      name: 'it-phase3-tag',
      description: 'Test',
      maxIterations: 5,
      initialStep: 'step1',
      steps: [
        makeStep('step1', agentPath, [
          makeRule('Done', 'step2'),
          makeRule('Not done', 'ABORT'),
        ]),
        makeStep('step2', agentPath, [
          makeRule('Checked', 'COMPLETE'),
        ]),
      ],
    };
    const engine = new WorkflowEngine(config, testDir, 'Test task', {
      projectCwd: testDir,
      provider: 'mock',
    });
    const state = await engine.run();
    // Phase 3 returned [STEP1:2] → rule index 1 → "Not done" → ABORT
    expect(state.status).toBe('aborted');
    expect(state.iteration).toBe(1);
  });
 });
--- a/src/tests/it-workflow-loader.test.ts
+++ b/src/tests/it-workflow-loader.test.ts
@ -0,0 +1,380 @@
 /**
 * Workflow loader integration tests.
 *
 * Tests the 3-tier workflow resolution (project-local → user → builtin)
 * and YAML parsing including special rule syntax (ai(), all(), any()).
 *
 * Mocked: globalConfig (for language/builtins)
 * Not mocked: loadWorkflow, parseWorkflow, rule parsing
 */
 import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest';
 import { mkdtempSync, mkdirSync, writeFileSync, rmSync, existsSync } from 'node:fs';
 import { join } from 'node:path';
 import { tmpdir } from 'node:os';
 // --- Mocks ---
 vi.mock('../config/globalConfig.js', () => ({
  loadGlobalConfig: vi.fn().mockReturnValue({}),
  getLanguage: vi.fn().mockReturnValue('en'),
  getDisabledBuiltins: vi.fn().mockReturnValue([]),
 }));
 // --- Imports (after mocks) ---
 import { loadWorkflow } from '../config/workflowLoader.js';
 // --- Test helpers ---
 function createTestDir(): string {
  const dir = mkdtempSync(join(tmpdir(), 'takt-it-wfl-'));
  mkdirSync(join(dir, '.takt'), { recursive: true });
  return dir;
 }
 describe('Workflow Loader IT: builtin workflow loading', () => {
  let testDir: string;
  beforeEach(() => {
    testDir = createTestDir();
  });
  afterEach(() => {
    rmSync(testDir, { recursive: true, force: true });
  });
  const builtinNames = ['default', 'simple', 'expert', 'expert-cqrs', 'research', 'magi', 'review-only'];
  for (const name of builtinNames) {
    it(`should load builtin workflow: ${name}`, () => {
      const config = loadWorkflow(name, testDir);
      expect(config).not.toBeNull();
      expect(config!.name).toBe(name);
      expect(config!.steps.length).toBeGreaterThan(0);
      expect(config!.initialStep).toBeDefined();
      expect(config!.maxIterations).toBeGreaterThan(0);
    });
  }
  it('should return null for non-existent workflow', () => {
    const config = loadWorkflow('non-existent-workflow-xyz', testDir);
    expect(config).toBeNull();
  });
 });
 describe('Workflow Loader IT: project-local workflow override', () => {
  let testDir: string;
  beforeEach(() => {
    testDir = createTestDir();
  });
  afterEach(() => {
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should load project-local workflow from .takt/workflows/', () => {
    const workflowsDir = join(testDir, '.takt', 'workflows');
    mkdirSync(workflowsDir, { recursive: true });
    const agentsDir = join(testDir, 'agents');
    mkdirSync(agentsDir, { recursive: true });
    writeFileSync(join(agentsDir, 'custom.md'), 'Custom agent');
    writeFileSync(join(workflowsDir, 'custom-wf.yaml'), `
 name: custom-wf
 description: Custom project workflow
 max_iterations: 5
 initial_step: start
 steps:
  - name: start
    agent: ./agents/custom.md
    rules:
      - condition: Done
        next: COMPLETE
    instruction: "Do the work"
 `);
    const config = loadWorkflow('custom-wf', testDir);
    expect(config).not.toBeNull();
    expect(config!.name).toBe('custom-wf');
    expect(config!.steps.length).toBe(1);
    expect(config!.steps[0]!.name).toBe('start');
  });
 });
 describe('Workflow Loader IT: agent path resolution', () => {
  let testDir: string;
  beforeEach(() => {
    testDir = createTestDir();
  });
  afterEach(() => {
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should resolve relative agent paths from workflow YAML location', () => {
    const config = loadWorkflow('simple', testDir);
    expect(config).not.toBeNull();
    for (const step of config!.steps) {
      if (step.agentPath) {
        // Agent paths should be resolved to absolute paths
        expect(step.agentPath).toMatch(/^\//);
        // Agent files should exist
        expect(existsSync(step.agentPath)).toBe(true);
      }
      if (step.parallel) {
        for (const sub of step.parallel) {
          if (sub.agentPath) {
            expect(sub.agentPath).toMatch(/^\//);
            expect(existsSync(sub.agentPath)).toBe(true);
          }
        }
      }
    }
  });
 });
 describe('Workflow Loader IT: rule syntax parsing', () => {
  let testDir: string;
  beforeEach(() => {
    testDir = createTestDir();
  });
  afterEach(() => {
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should parse all() aggregate conditions from default workflow', () => {
    const config = loadWorkflow('default', testDir);
    expect(config).not.toBeNull();
    // Find the parallel reviewers step
    const reviewersStep = config!.steps.find(
      (s) => s.parallel && s.parallel.length > 0,
    );
    expect(reviewersStep).toBeDefined();
    // Should have aggregate rules
    const allRule = reviewersStep!.rules?.find(
      (r) => r.isAggregateCondition && r.aggregateType === 'all',
    );
    expect(allRule).toBeDefined();
    expect(allRule!.aggregateConditionText).toBe('approved');
  });
  it('should parse any() aggregate conditions from default workflow', () => {
    const config = loadWorkflow('default', testDir);
    expect(config).not.toBeNull();
    const reviewersStep = config!.steps.find(
      (s) => s.parallel && s.parallel.length > 0,
    );
    const anyRule = reviewersStep!.rules?.find(
      (r) => r.isAggregateCondition && r.aggregateType === 'any',
    );
    expect(anyRule).toBeDefined();
    expect(anyRule!.aggregateConditionText).toBe('needs_fix');
  });
  it('should parse standard rules with next step', () => {
    const config = loadWorkflow('simple', testDir);
    expect(config).not.toBeNull();
    const planStep = config!.steps.find((s) => s.name === 'plan');
    expect(planStep).toBeDefined();
    expect(planStep!.rules).toBeDefined();
    expect(planStep!.rules!.length).toBeGreaterThan(0);
    // Each rule should have condition and next
    for (const rule of planStep!.rules!) {
      expect(typeof rule.condition).toBe('string');
      expect(rule.condition.length).toBeGreaterThan(0);
    }
  });
 });
 describe('Workflow Loader IT: workflow config validation', () => {
  let testDir: string;
  beforeEach(() => {
    testDir = createTestDir();
  });
  afterEach(() => {
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should set max_iterations from YAML', () => {
    const config = loadWorkflow('simple', testDir);
    expect(config).not.toBeNull();
    expect(typeof config!.maxIterations).toBe('number');
    expect(config!.maxIterations).toBeGreaterThan(0);
  });
  it('should set initial_step from YAML', () => {
    const config = loadWorkflow('simple', testDir);
    expect(config).not.toBeNull();
    expect(typeof config!.initialStep).toBe('string');
    // initial_step should reference an existing step
    const stepNames = config!.steps.map((s) => s.name);
    expect(stepNames).toContain(config!.initialStep);
  });
  it('should preserve edit property on steps (review-only has no edit: true)', () => {
    const config = loadWorkflow('review-only', testDir);
    expect(config).not.toBeNull();
    // review-only: no step should have edit: true
    for (const step of config!.steps) {
      expect(step.edit).not.toBe(true);
      if (step.parallel) {
        for (const sub of step.parallel) {
          expect(sub.edit).not.toBe(true);
        }
      }
    }
    // expert: implement step should have edit: true
    const expertConfig = loadWorkflow('expert', testDir);
    expect(expertConfig).not.toBeNull();
    const implementStep = expertConfig!.steps.find((s) => s.name === 'implement');
    expect(implementStep).toBeDefined();
    expect(implementStep!.edit).toBe(true);
  });
  it('should set passPreviousResponse from YAML', () => {
    const config = loadWorkflow('simple', testDir);
    expect(config).not.toBeNull();
    // At least some steps should have passPreviousResponse set
    const stepsWithPassPrev = config!.steps.filter((s) => s.passPreviousResponse === true);
    expect(stepsWithPassPrev.length).toBeGreaterThan(0);
  });
 });
 describe('Workflow Loader IT: parallel step loading', () => {
  let testDir: string;
  beforeEach(() => {
    testDir = createTestDir();
  });
  afterEach(() => {
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should load parallel sub-steps from default workflow', () => {
    const config = loadWorkflow('default', testDir);
    expect(config).not.toBeNull();
    const parallelStep = config!.steps.find(
      (s) => s.parallel && s.parallel.length > 0,
    );
    expect(parallelStep).toBeDefined();
    expect(parallelStep!.parallel!.length).toBeGreaterThanOrEqual(2);
    // Each sub-step should have required fields
    for (const sub of parallelStep!.parallel!) {
      expect(sub.name).toBeDefined();
      expect(sub.agent).toBeDefined();
      expect(sub.rules).toBeDefined();
    }
  });
  it('should load 4 parallel reviewers from expert workflow', () => {
    const config = loadWorkflow('expert', testDir);
    expect(config).not.toBeNull();
    const parallelStep = config!.steps.find(
      (s) => s.parallel && s.parallel.length === 4,
    );
    expect(parallelStep).toBeDefined();
    const subNames = parallelStep!.parallel!.map((s) => s.name);
    expect(subNames).toContain('arch-review');
    expect(subNames).toContain('frontend-review');
    expect(subNames).toContain('security-review');
    expect(subNames).toContain('qa-review');
  });
 });
 describe('Workflow Loader IT: report config loading', () => {
  let testDir: string;
  beforeEach(() => {
    testDir = createTestDir();
  });
  afterEach(() => {
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should load single report config', () => {
    const config = loadWorkflow('simple', testDir);
    expect(config).not.toBeNull();
    // simple workflow: plan step has a report config
    const planStep = config!.steps.find((s) => s.name === 'plan');
    expect(planStep).toBeDefined();
    expect(planStep!.report).toBeDefined();
  });
  it('should load multi-report config from expert workflow', () => {
    const config = loadWorkflow('expert', testDir);
    expect(config).not.toBeNull();
    // implement step has multi-report: [Scope, Decisions]
    const implementStep = config!.steps.find((s) => s.name === 'implement');
    expect(implementStep).toBeDefined();
    expect(implementStep!.report).toBeDefined();
    expect(Array.isArray(implementStep!.report)).toBe(true);
    expect((implementStep!.report as unknown[]).length).toBe(2);
  });
 });
 describe('Workflow Loader IT: invalid YAML handling', () => {
  let testDir: string;
  beforeEach(() => {
    testDir = createTestDir();
  });
  afterEach(() => {
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should throw for workflow file with invalid YAML', () => {
    const workflowsDir = join(testDir, '.takt', 'workflows');
    mkdirSync(workflowsDir, { recursive: true });
    writeFileSync(join(workflowsDir, 'broken.yaml'), `
 name: broken
 this is not: valid yaml: [[[[
  - bad: {
 `);
    expect(() => loadWorkflow('broken', testDir)).toThrow();
  });
  it('should throw for workflow missing required fields', () => {
    const workflowsDir = join(testDir, '.takt', 'workflows');
    mkdirSync(workflowsDir, { recursive: true });
    writeFileSync(join(workflowsDir, 'incomplete.yaml'), `
 name: incomplete
 description: Missing steps
 `);
    expect(() => loadWorkflow('incomplete', testDir)).toThrow();
  });
 });
--- a/src/tests/it-workflow-patterns.test.ts
+++ b/src/tests/it-workflow-patterns.test.ts
@ -0,0 +1,355 @@
 /**
 * Workflow patterns integration tests.
 *
 * Tests that all builtin workflow definitions can be loaded and execute
 * the expected step transitions using WorkflowEngine + MockProvider + ScenarioQueue.
 *
 * Mocked: UI, session, phase-runner, notifications, config, callAiJudge
 * Not mocked: WorkflowEngine, runAgent, detectMatchedRule, rule-evaluator
 */
 import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest';
 import { mkdtempSync, mkdirSync, rmSync } from 'node:fs';
 import { join } from 'node:path';
 import { tmpdir } from 'node:os';
 import { setMockScenario, resetScenario } from '../mock/scenario.js';
 // --- Mocks ---
 vi.mock('../claude/client.js', async (importOriginal) => {
  const original = await importOriginal<typeof import('../claude/client.js')>();
  return {
    ...original,
    callAiJudge: vi.fn().mockResolvedValue(-1),
  };
 });
 vi.mock('../workflow/phase-runner.js', () => ({
  needsStatusJudgmentPhase: vi.fn().mockReturnValue(false),
  runReportPhase: vi.fn().mockResolvedValue(undefined),
  runStatusJudgmentPhase: vi.fn().mockResolvedValue(''),
 }));
 vi.mock('../utils/session.js', () => ({
  generateReportDir: vi.fn().mockReturnValue('test-report-dir'),
  generateSessionId: vi.fn().mockReturnValue('test-session-id'),
 }));
 vi.mock('../config/globalConfig.js', () => ({
  loadGlobalConfig: vi.fn().mockReturnValue({}),
  getLanguage: vi.fn().mockReturnValue('en'),
  getDisabledBuiltins: vi.fn().mockReturnValue([]),
 }));
 vi.mock('../config/projectConfig.js', () => ({
  loadProjectConfig: vi.fn().mockReturnValue({}),
 }));
 // --- Imports (after mocks) ---
 import { WorkflowEngine } from '../workflow/engine.js';
 import { loadWorkflow } from '../config/workflowLoader.js';
 import type { WorkflowConfig } from '../models/types.js';
 // --- Test helpers ---
 function createTestDir(): string {
  const dir = mkdtempSync(join(tmpdir(), 'takt-it-wfp-'));
  mkdirSync(join(dir, '.takt', 'reports', 'test-report-dir'), { recursive: true });
  return dir;
 }
 function createEngine(config: WorkflowConfig, dir: string, task: string): WorkflowEngine {
  return new WorkflowEngine(config, dir, task, {
    projectCwd: dir,
    provider: 'mock',
  });
 }
 describe('Workflow Patterns IT: simple workflow', () => {
  let testDir: string;
  beforeEach(() => {
    vi.clearAllMocks();
    testDir = createTestDir();
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should complete: plan → implement → ai_review → review → supervise → COMPLETE', async () => {
    const config = loadWorkflow('simple', testDir);
    expect(config).not.toBeNull();
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:1]\n\nRequirements are clear.' },
      { agent: 'coder', status: 'done', content: '[IMPLEMENT:1]\n\nImplementation complete.' },
      { agent: 'ai-antipattern-reviewer', status: 'done', content: '[AI_REVIEW:1]\n\nNo AI-specific issues.' },
      { agent: 'architecture-reviewer', status: 'done', content: '[REVIEW:1]\n\nNo issues found.' },
      { agent: 'supervisor', status: 'done', content: '[SUPERVISE:1]\n\nAll checks passed.' },
    ]);
    const engine = createEngine(config!, testDir, 'Test task');
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(state.iteration).toBe(5);
  });
  it('should ABORT when plan returns rule 3 (requirements unclear)', async () => {
    const config = loadWorkflow('simple', testDir);
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:3]\n\nRequirements unclear.' },
    ]);
    const engine = createEngine(config!, testDir, 'Vague task');
    const state = await engine.run();
    expect(state.status).toBe('aborted');
    expect(state.iteration).toBe(1);
  });
  it('should COMPLETE when plan detects a question (rule 2)', async () => {
    const config = loadWorkflow('simple', testDir);
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:2]\n\nUser is asking a question.' },
    ]);
    const engine = createEngine(config!, testDir, 'What is X?');
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(state.iteration).toBe(1);
  });
 });
 describe('Workflow Patterns IT: default workflow (parallel reviewers)', () => {
  let testDir: string;
  beforeEach(() => {
    vi.clearAllMocks();
    testDir = createTestDir();
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should complete with all("approved") in parallel review step', async () => {
    const config = loadWorkflow('default', testDir);
    expect(config).not.toBeNull();
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:1]\n\nClear.' },
      { agent: 'coder', status: 'done', content: '[IMPLEMENT:1]\n\nDone.' },
      { agent: 'ai-antipattern-reviewer', status: 'done', content: '[AI_REVIEW:1]\n\nNo issues.' },
      // Parallel reviewers: both approved
      { agent: 'architecture-reviewer', status: 'done', content: '[ARCH-REVIEW:1]\n\napproved' },
      { agent: 'security-reviewer', status: 'done', content: '[SECURITY-REVIEW:1]\n\napproved' },
      // Supervisor
      { agent: 'supervisor', status: 'done', content: '[SUPERVISE:1]\n\nAll checks passed.' },
    ]);
    const engine = createEngine(config!, testDir, 'Test task');
    const state = await engine.run();
    expect(state.status).toBe('completed');
  });
  it('should route to fix when any("needs_fix") in parallel review step', async () => {
    const config = loadWorkflow('default', testDir);
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:1]\n\nClear.' },
      { agent: 'coder', status: 'done', content: '[IMPLEMENT:1]\n\nDone.' },
      { agent: 'ai-antipattern-reviewer', status: 'done', content: '[AI_REVIEW:1]\n\nNo issues.' },
      // Parallel: arch approved, security needs_fix
      { agent: 'architecture-reviewer', status: 'done', content: '[ARCH-REVIEW:1]\n\napproved' },
      { agent: 'security-reviewer', status: 'done', content: '[SECURITY-REVIEW:2]\n\nneeds_fix' },
      // Fix step
      { agent: 'coder', status: 'done', content: '[FIX:1]\n\nFix complete.' },
      // Re-review: both approved
      { agent: 'architecture-reviewer', status: 'done', content: '[ARCH-REVIEW:1]\n\napproved' },
      { agent: 'security-reviewer', status: 'done', content: '[SECURITY-REVIEW:1]\n\napproved' },
      // Supervisor
      { agent: 'supervisor', status: 'done', content: '[SUPERVISE:1]\n\nAll checks passed.' },
    ]);
    const engine = createEngine(config!, testDir, 'Task needing security fix');
    const state = await engine.run();
    expect(state.status).toBe('completed');
  });
 });
 describe('Workflow Patterns IT: research workflow', () => {
  let testDir: string;
  beforeEach(() => {
    vi.clearAllMocks();
    testDir = createTestDir();
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should complete: plan → dig → supervise → COMPLETE', async () => {
    const config = loadWorkflow('research', testDir);
    expect(config).not.toBeNull();
    setMockScenario([
      { agent: 'research/planner', status: 'done', content: '[PLAN:1]\n\nPlanning is complete.' },
      { agent: 'research/digger', status: 'done', content: '[DIG:1]\n\nResearch is complete.' },
      { agent: 'research/supervisor', status: 'done', content: '[SUPERVISE:1]\n\nAdequate.' },
    ]);
    const engine = createEngine(config!, testDir, 'Research topic X');
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(state.iteration).toBe(3);
  });
  it('should loop: plan → dig → supervise (insufficient) → plan → dig → supervise → COMPLETE', async () => {
    const config = loadWorkflow('research', testDir);
    setMockScenario([
      { agent: 'research/planner', status: 'done', content: '[PLAN:1]\n\nPlanning is complete.' },
      { agent: 'research/digger', status: 'done', content: '[DIG:1]\n\nResearch is complete.' },
      { agent: 'research/supervisor', status: 'done', content: '[SUPERVISE:2]\n\nInsufficient.' },
      // Second pass
      { agent: 'research/planner', status: 'done', content: '[PLAN:1]\n\nRevised plan.' },
      { agent: 'research/digger', status: 'done', content: '[DIG:1]\n\nMore research.' },
      { agent: 'research/supervisor', status: 'done', content: '[SUPERVISE:1]\n\nAdequate now.' },
    ]);
    const engine = createEngine(config!, testDir, 'Research topic X');
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(state.iteration).toBe(6);
  });
 });
 describe('Workflow Patterns IT: magi workflow', () => {
  let testDir: string;
  beforeEach(() => {
    vi.clearAllMocks();
    testDir = createTestDir();
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should complete: melchior → balthasar → casper → COMPLETE', async () => {
    const config = loadWorkflow('magi', testDir);
    expect(config).not.toBeNull();
    setMockScenario([
      { agent: 'magi/melchior', status: 'done', content: '[MELCHIOR:1]\n\nJudgment completed.' },
      { agent: 'magi/balthasar', status: 'done', content: '[BALTHASAR:1]\n\nJudgment completed.' },
      { agent: 'magi/casper', status: 'done', content: '[CASPER:1]\n\nFinal judgment completed.' },
    ]);
    const engine = createEngine(config!, testDir, 'Deliberation topic');
    const state = await engine.run();
    expect(state.status).toBe('completed');
    expect(state.iteration).toBe(3);
  });
 });
 describe('Workflow Patterns IT: review-only workflow', () => {
  let testDir: string;
  beforeEach(() => {
    vi.clearAllMocks();
    testDir = createTestDir();
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should complete: plan → reviewers (all approved) → supervise → COMPLETE', async () => {
    const config = loadWorkflow('review-only', testDir);
    expect(config).not.toBeNull();
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:1]\n\nReview scope is clear.' },
      // Parallel reviewers: all approved
      { agent: 'architecture-reviewer', status: 'done', content: '[ARCH-REVIEW:1]\n\napproved' },
      { agent: 'security-reviewer', status: 'done', content: '[SECURITY-REVIEW:1]\n\napproved' },
      { agent: 'ai-antipattern-reviewer', status: 'done', content: '[AI-REVIEW:1]\n\napproved' },
      // Supervisor: approved (local review, no PR)
      { agent: 'supervisor', status: 'done', content: '[SUPERVISE:2]\n\napproved' },
    ]);
    const engine = createEngine(config!, testDir, 'Review the codebase');
    const state = await engine.run();
    expect(state.status).toBe('completed');
  });
  it('should verify no steps have edit: true', () => {
    const config = loadWorkflow('review-only', testDir);
    expect(config).not.toBeNull();
    for (const step of config!.steps) {
      expect(step.edit).not.toBe(true);
      if (step.parallel) {
        for (const subStep of step.parallel) {
          expect(subStep.edit).not.toBe(true);
        }
      }
    }
  });
 });
 describe('Workflow Patterns IT: expert workflow (4 parallel reviewers)', () => {
  let testDir: string;
  beforeEach(() => {
    vi.clearAllMocks();
    testDir = createTestDir();
  });
  afterEach(() => {
    resetScenario();
    rmSync(testDir, { recursive: true, force: true });
  });
  it('should complete with all("approved") in 4-parallel review', async () => {
    const config = loadWorkflow('expert', testDir);
    expect(config).not.toBeNull();
    setMockScenario([
      { agent: 'planner', status: 'done', content: '[PLAN:1]\n\nClear.' },
      { agent: 'coder', status: 'done', content: '[IMPLEMENT:1]\n\nDone.' },
      { agent: 'ai-antipattern-reviewer', status: 'done', content: '[AI_REVIEW:1]\n\nNo issues.' },
      // 4 parallel reviewers
      { agent: 'architecture-reviewer', status: 'done', content: '[ARCH-REVIEW:1]\n\napproved' },
      { agent: 'expert/frontend-reviewer', status: 'done', content: '[FRONTEND-REVIEW:1]\n\napproved' },
      { agent: 'expert/security-reviewer', status: 'done', content: '[SECURITY-REVIEW:1]\n\napproved' },
      { agent: 'expert/qa-reviewer', status: 'done', content: '[QA-REVIEW:1]\n\napproved' },
      // Supervisor
      { agent: 'expert/supervisor', status: 'done', content: '[SUPERVISE:1]\n\nAll validations pass.' },
    ]);
    const engine = createEngine(config!, testDir, 'Expert review task');
    const state = await engine.run();
    expect(state.status).toBe('completed');
  });
 });