diff --git a/.specflow/orchestration-state.json b/.specflow/orchestration-state.json
index 0cd0842..ce4416e 100644
--- a/.specflow/orchestration-state.json
+++ b/.specflow/orchestration-state.json
@@ -1,28 +1,41 @@
 {
   "schema_version": "3.0",
   "project": {
-    "id": "d9faf772-66c0-476e-bf4f-c9a33e7b248b",
+    "id": "75bd784a-8b56-459d-b272-44ad1e9d0364",
     "name": "specflow",
     "path": "/Users/ppatterson/dev/specflow"
   },
-  "last_updated": "2026-01-22T18:14:43.458Z",
+  "last_updated": "2026-01-24T21:57:04.195Z",
   "orchestration": {
     "phase": {
+      "id": null,
       "number": null,
       "name": null,
       "branch": null,
       "status": "not_started",
-      "userGateStatus": "confirmed"
+      "goals": [
+        "Trust step.status - If sub-command set it to complete, step is done",
+        "Complete decision matrix - Every state combination has explicit action",
+        "Fix question flow - Wire SSE data to DecisionToast (3 files)",
+        "Claude Helper for 3 cases only - With explicit fallback chains",
+        "Eliminate race conditions - Atomic writes, spawn intent pattern",
+        "Reduce code - Target simplicity"
+      ],
+      "hasUserGate": true
     },
     "next_phase": {
-      "number": "1056",
-      "name": "JSONL Watcher (Push Updates)"
+      "number": "1060",
+      "name": "Stats & Operations"
     },
     "step": {
       "current": "design",
       "index": 0,
       "status": "not_started"
     },
+    "analyze": {
+      "iteration": null,
+      "completedAt": 1769189896
+    },
     "implement": null,
     "progress": {
       "tasks_completed": 0,
@@ -32,272 +45,27 @@
     "steps": {}
   },
   "health": {
-    "status": "ready",
-    "last_check": "2026-01-18T04:04:09Z",
+    "status": "healthy",
+    "last_check": "2026-01-24T17:20:00.000Z",
     "issues": []
   },
   "actions": {
-    "available": [],
-    "pending": [],
     "history": [
       {
         "type": "phase_completed",
-        "phase_number": "0030",
-        "phase_name": "test-suite-completion",
-        "branch": "0030-test-suite-completion",
-        "completed_at": "2026-01-11T06:46:22Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0040",
-        "phase_name": "integration-options",
-        "branch": "0040-integration-options",
-        "completed_at": "2026-01-11T07:14:34Z",
-        "tasks_completed": 19,
-        "tasks_total": 19
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0041",
-        "phase_name": "code-review-findings",
-        "branch": "0041-code-review-findings",
-        "completed_at": "2026-01-11T08:23:30Z",
-        "tasks_completed": "0",
-        "tasks_total": "42"
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0050",
-        "phase_name": "ux-simplification",
-        "branch": "0050-ux-simplification",
-        "completed_at": "2026-01-11T20:26:26Z",
-        "tasks_completed": "0",
-        "tasks_total": "45"
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0060",
-        "phase_name": "constitution-compliance",
-        "branch": "0060-constitution-compliance",
-        "completed_at": "2026-01-11T22:19:01Z",
-        "tasks_completed": "58",
-        "tasks_total": "58"
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0060",
-        "phase_name": "0060-constitution-compliance",
-        "branch": null,
-        "completed_at": "2026-01-17T13:18:56Z",
-        "tasks_completed": 58,
-        "tasks_total": 58
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1010",
-        "phase_name": "core-ui-scaffold",
-        "branch": "1010-core-ui-scaffold",
-        "completed_at": "2026-01-17T14:34:20Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1020",
-        "phase_name": "real-time-file-watching",
-        "branch": "1020-real-time-file-watching",
-        "completed_at": "2026-01-17T15:11:16Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1030",
-        "phase_name": "project-detail-views",
-        "branch": "1030-project-detail-views",
-        "completed_at": "2026-01-17T18:07:56Z",
-        "tasks_completed": 29,
-        "tasks_total": 29
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1040",
-        "phase_name": "cli-actions-from-ui",
-        "branch": "1040-cli-actions-from-ui",
-        "completed_at": "2026-01-17T20:09:10Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1045",
-        "phase_name": "project-actions-health",
-        "branch": "1045-project-actions-health",
-        "completed_at": "2026-01-18T01:28:45Z",
-        "tasks_completed": 25,
-        "tasks_total": 25
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0070",
-        "phase_name": "preworkflow-consolidation",
-        "branch": "0070-preworkflow-consolidation",
-        "completed_at": "2026-01-18T03:34:08Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0072",
-        "phase_name": "workflow-consolidation",
-        "branch": "0072-workflow-consolidation",
-        "completed_at": "2026-01-18T04:04:09Z",
-        "tasks_completed": 39,
-        "tasks_total": 42
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0010",
-        "phase_name": "Roadmap Flexibility",
-        "branch": "0010-Roadmap Flexibility",
-        "completed_at": "2026-01-18T09:37:49.628Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0015",
-        "phase_name": "Workflow Commands",
-        "branch": "0015-Workflow Commands",
-        "completed_at": "2026-01-18T09:37:49.633Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0020",
-        "phase_name": "Onboarding Polish",
-        "branch": "0020-Onboarding Polish",
-        "completed_at": "2026-01-18T09:37:49.633Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0042",
-        "phase_name": "Code Review 2026-01-11",
-        "branch": "0042-Code Review 2026-01-11",
-        "completed_at": "2026-01-18T09:37:49.633Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0076",
-        "phase_name": "Command Rebrand",
-        "branch": "0076-Command Rebrand",
-        "completed_at": "2026-01-18T09:37:49.633Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0080",
-        "phase_name": "CLI TypeScript Migration",
-        "branch": "0080-CLI TypeScript Migration",
-        "completed_at": "2026-01-18T09:37:49.633Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "0082",
-        "phase_name": "Code Review 20260118",
-        "branch": "0082-code-review-20260118",
-        "completed_at": "2026-01-18T22:09:41.870Z",
-        "tasks_completed": "11",
-        "tasks_total": "53"
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1046",
-        "phase_name": "Command JSON Output",
-        "branch": "1046-command-json-output",
-        "completed_at": "2026-01-18T23:16:29.542Z",
-        "tasks_completed": 0,
-        "tasks_total": 13
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1047",
-        "phase_name": "Workflow Decomposition: Design",
-        "branch": "1047-workflow-decomposition-design",
-        "completed_at": "2026-01-19T03:50:36.982Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1048",
-        "phase_name": "Workflow Foundation",
-        "branch": "1048-workflow-foundation",
-        "completed_at": "2026-01-19T04:46:08.853Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1050",
-        "phase_name": "Workflow UI",
-        "branch": "1050-workflow-ui",
-        "completed_at": "2026-01-19T05:34:39.638Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1051",
-        "phase_name": "Questions & Notifications",
-        "branch": "1051-questions-notifications",
-        "completed_at": "2026-01-19T06:05:34.184Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1052",
-        "phase_name": "Session Viewer",
-        "branch": "1052-session-viewer",
-        "completed_at": "2026-01-19T07:30:21.594Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1053",
-        "phase_name": "Workflow-Session Unification",
-        "branch": "1053-workflow-session-unification",
-        "completed_at": "2026-01-20T04:25:45.063Z",
-        "tasks_completed": 0,
-        "tasks_total": 0
-      },
-      {
-        "type": "phase_completed",
-        "phase_number": "1054",
-        "phase_name": "Project Details Redesign",
-        "branch": "1054-project-details-redesign",
-        "completed_at": "2026-01-20T06:34:58.276Z",
+        "phase_number": "1056",
+        "phase_name": "jsonl-watcher",
+        "branch": "1056-jsonl-watcher-push-updates",
+        "completed_at": "2026-01-23T16:58:51.483Z",
         "tasks_completed": 0,
         "tasks_total": 0
       },
       {
         "type": "phase_completed",
-        "phase_number": "1055",
-        "phase_name": "Smart Batching & Orchestration",
-        "branch": "1055-smart-batching-orchestration",
-        "completed_at": "2026-01-22T18:14:43.457Z",
+        "phase_number": "1057",
+        "phase_name": "Orchestration Simplification",
+        "branch": "1057-orchestration-simplification",
+        "completed_at": "2026-01-24T21:57:04.195Z",
         "tasks_completed": 0,
         "tasks_total": 0
       }
diff --git a/.specify/archive/1056-jsonl-watcher/checklists/implementation.md b/.specify/archive/1056-jsonl-watcher/checklists/implementation.md
new file mode 100644
index 0000000..3e5fb5c
--- /dev/null
+++ b/.specify/archive/1056-jsonl-watcher/checklists/implementation.md
@@ -0,0 +1,36 @@
+# Implementation Checklist: JSONL File Watcher
+
+**Phase**: 1056-jsonl-watcher
+**Created**: 2026-01-22
+
+## Requirement Completeness
+
+- [x] I-001: All deprecated polling files identified for deletion (5 files)
+- [x] I-002: Session JSONL file path pattern defined (~/.claude/projects/{hash}/*.jsonl)
+- [x] I-003: New SSE event types fully specified (session:message, session:question, session:end)
+- [ ] I-004: Orchestration event types specified (orchestration:decision, orchestration:batch)
+- [x] I-005: Debounce values defined (200ms project, 100ms session)
+
+## Requirement Clarity
+
+- [x] I-006: Session message parsing format documented (JSONL line structure)
+- [x] I-007: Question detection criteria clear (AskUserQuestion tool call in message)
+- [x] I-008: Session end detection criteria clear (end marker in JSONL)
+- [x] I-009: Task count parsing format documented (- [ ] T### pattern)
+- [x] I-010: Artifact existence paths documented (spec.md, plan.md, tasks.md in specs/{phase}/)
+
+## Scenario Coverage
+
+- [x] I-011: Normal session message flow covered
+- [x] I-012: Question detection and notification flow covered
+- [x] I-013: Session end detection flow covered
+- [x] I-014: Orchestration decision flow covered (file change -> decision)
+- [x] I-015: Error handling for malformed JSONL covered
+
+## Edge Case Coverage
+
+- [x] I-016: Malformed JSONL line handling (skip, log warning)
+- [x] I-017: Missing session directory handling (create on first access)
+- [x] I-018: File watcher limit handling (glob patterns)
+- [x] I-019: SSE connection drop handling (auto-reconnect existing)
+- [x] I-020: Empty tasks.md handling (return 0/0 counts)
diff --git a/.specify/archive/1056-jsonl-watcher/checklists/verification.md b/.specify/archive/1056-jsonl-watcher/checklists/verification.md
new file mode 100644
index 0000000..59af348
--- /dev/null
+++ b/.specify/archive/1056-jsonl-watcher/checklists/verification.md
@@ -0,0 +1,60 @@
+# Verification Checklist: JSONL File Watcher
+
+**Phase**: 1056-jsonl-watcher
+**Created**: 2026-01-22
+
+## Acceptance Criteria Quality
+
+- [x] V-001: SC-001 measurable - Session message latency <500ms verified
+- [x] V-002: SC-002 measurable - Question detection latency <200ms verified
+- [x] V-003: SC-003 measurable - Orchestration decision latency <500ms verified
+- [x] V-004: SC-004 measurable - Subprocess calls = 0 verified
+- [x] V-005: SC-005 measurable - Polling loops = 0 verified
+- [x] V-006: SC-006 verified - Connection recovery on network interruption
+
+## Non-Functional Requirements
+
+- [x] V-007: Session message latency consistently under 500ms (NFR-001)
+- [x] V-008: Question detection latency consistently under 200ms (NFR-002)
+- [x] V-009: Orchestration decisions occur within 500ms of file change (NFR-003)
+- [x] V-010: Zero subprocess calls for status during orchestration (NFR-004)
+- [x] V-011: Zero setInterval polling loops for data fetching (NFR-005)
+- [x] V-012: File watcher uses glob patterns, within macOS 256 limit (NFR-006)
+- [x] V-013: Malformed JSONL lines skipped gracefully (NFR-007)
+
+## Phase Goal Verification
+
+- [x] V-014: Goal 1 - All polling replaced with file-watching
+- [x] V-015: Goal 2 - Zero polling loops remain in codebase
+- [x] V-016: Goal 3 - Session messages appear within 500ms
+- [x] V-017: Goal 4 - Questions appear instantly (<200ms)
+- [x] V-018: Goal 5 - Orchestration updates without polling
+- [x] V-019: Goal 6 - No specflow status --json subprocess calls
+
+## Functional Verification
+
+- [x] V-020: FR-001 - Deprecated polling hooks deleted (5 files)
+- [x] V-021: FR-002 - Session JSONL file watching active
+- [x] V-022: FR-003/004 - New SSE event types working
+- [x] V-023: FR-005-007 - Session events emitting correctly
+- [x] V-024: FR-008 - useSessionContent uses SSE
+- [x] V-025: FR-009 - useSSE handles new event types
+- [x] V-026: FR-010-013 - Orchestration runner event-driven
+
+## Build & Test Verification
+
+- [x] V-027: pnpm build:dashboard passes
+- [x] V-028: pnpm test:dashboard passes
+- [x] V-029: No TypeScript errors
+- [x] V-030: ESLint passes
+
+## USER GATE Verification
+
+These items require user confirmation before merge:
+
+- [ ] V-031: USER GATE - Session messages appear within 500ms
+- [ ] V-032: USER GATE - Questions appear instantly
+- [ ] V-033: USER GATE - Orchestration updates without polling
+- [ ] V-034: USER GATE - No specflow status --json subprocess calls
+- [ ] V-035: USER GATE - No setInterval polling loops remain
+- [ ] V-036: USER GATE - Connection recovers on network interruption
diff --git a/.specify/archive/1056-jsonl-watcher/discovery.md b/.specify/archive/1056-jsonl-watcher/discovery.md
new file mode 100644
index 0000000..61cffb6
--- /dev/null
+++ b/.specify/archive/1056-jsonl-watcher/discovery.md
@@ -0,0 +1,132 @@
+# Discovery: JSONL File Watcher & Polling Elimination
+
+**Phase**: `1056-jsonl-watcher`
+**Created**: 2026-01-22
+**Status**: Complete
+
+## Phase Context
+
+**Source**: ROADMAP phase 1056
+**Goal**: Replace all polling with file-watching. Zero polling loops when complete.
+
+---
+
+## Codebase Examination
+
+### Related Implementations
+
+| Location | Description | Relevance |
+|----------|-------------|-----------|
+| `src/lib/watcher.ts:550-609` | Existing chokidar file watcher | Core infrastructure to extend |
+| `src/app/api/events/route.ts` | SSE endpoint `/api/events` | Broadcast mechanism for new events |
+| `src/hooks/use-sse.ts:44-128` | Client-side SSE connection hook | Need to handle new event types |
+| `src/lib/services/orchestration-runner.ts:273-284` | Subprocess calls `specflow status --json` | Critical bottleneck to eliminate |
+| `src/lib/session-polling-manager.ts` | Singleton session polling | To be replaced with file watching |
+| `packages/shared/src/schemas/events.ts:157-165` | Current SSE event type definitions | Need new session/orchestration types |
+
+### Existing Patterns & Conventions
+
+- **Event broadcasting**: Watcher uses listener pattern with debounced file change handlers
+- **Debouncing**: 200ms delay for file changes, proven stable in production
+- **State management**: SSE context provides real-time state to React components
+- **Polling pattern**: Deprecated hooks use setInterval with cleanup on unmount
+
+### Integration Points
+
+- **Chokidar watcher**: Add session JSONL file paths to existing watcher
+- **SSE endpoint**: Extend event handlers for new event types
+- **useSSE hook**: Add case handlers for session:message, session:question, etc.
+- **UnifiedDataContext**: Store session content from SSE events
+
+### Constraints Discovered
+
+- **macOS file watcher limit**: 256 file descriptors - must use glob patterns not individual watchers
+- **Session file location**: `~/.claude/projects/{hash}/*.jsonl` - outside project directories
+- **Debounce tradeoff**: 200ms for project files, 100ms for session files (higher write frequency)
+
+---
+
+## Requirements Sources
+
+### From ROADMAP/Phase File
+
+1. Replace all polling with file-watching
+2. Zero polling loops when complete
+3. Session messages appear within 500ms
+4. Questions appear instantly (<200ms)
+5. Orchestration updates without polling
+6. No `specflow status --json` subprocess calls
+
+### From Analysis Document
+
+**Source**: `.specify/phases/polling-consolidation-analysis.md`
+
+| Polling Source | Interval | Impact | Migration |
+|----------------|----------|--------|-----------|
+| Orchestration runner subprocess | 3s | 1-2s latency per call | Watch files directly |
+| Session polling manager | 5s | Delayed session updates | Watch JSONL files |
+| useWorkflowExecution | 3s | Deprecated | Delete |
+| useWorkflowList | 3s | Deprecated | Delete |
+| useSessionHistory | 5s | Deprecated | Delete |
+| useSessionMessages | 3s | Deprecated | Delete |
+
+### From Memory Documents
+
+- **Constitution Principle VIII**: Keep session JSONL as operational state
+- **Constitution Principle VI**: Graceful degradation - fallback polling if chokidar fails
+- **Tech Stack**: chokidar v3.x approved for file watching
+
+---
+
+## Scope Clarification
+
+### Confirmed Understanding
+
+**What the user wants to achieve**:
+Replace all polling mechanisms in the dashboard with file-watching via chokidar, achieving sub-500ms latency for all real-time updates.
+
+**How it relates to existing code**:
+- Extend existing `watcher.ts` chokidar infrastructure
+- Add new SSE event types for sessions and orchestration
+- Delete deprecated polling hooks
+- Modify orchestration-runner to be event-driven
+
+**Key constraints and requirements**:
+- No subprocess calls for `specflow status --json`
+- Session JSONL files must be watched in `~/.claude/projects/`
+- Must handle macOS file watcher limits via glob patterns
+- Graceful degradation if file watching fails
+
+**Technical approach**:
+1. Delete deprecated polling hooks first (clean slate)
+2. Add session JSONL watching to watcher.ts
+3. Create new SSE event types
+4. Convert orchestration runner to event-driven
+5. Update client hooks to use SSE data
+
+---
+
+## Recommendations for SPECIFY
+
+### Should Include in Spec
+
+- FR: Delete 5 deprecated polling hooks
+- FR: Add session JSONL file watching to chokidar
+- FR: New SSE event types (session:message, session:question, session:end)
+- FR: Event-driven orchestration runner (no subprocess)
+- FR: Derive task counts from tasks.md parsing (not subprocess)
+- NFR: <500ms session message latency
+- NFR: <200ms question detection latency
+- NFR: Zero subprocess calls for status
+
+### Should Exclude from Spec (Non-Goals)
+
+- Backward compatibility with old polling APIs
+- Migration period with parallel systems
+- Fallback polling (single user, just make it work)
+
+### Potential Risks
+
+- **File watcher limits**: Mitigated by glob patterns
+- **JSONL parse errors**: Handle malformed lines gracefully
+- **Connection interruption**: SSE auto-reconnects (existing behavior)
diff --git a/.specify/archive/1056-jsonl-watcher/plan.md b/.specify/archive/1056-jsonl-watcher/plan.md
new file mode 100644
index 0000000..b5a4b3d
--- /dev/null
+++ b/.specify/archive/1056-jsonl-watcher/plan.md
@@ -0,0 +1,187 @@
+# Implementation Plan: JSONL File Watcher & Polling Elimination
+
+**Branch**: `1056-jsonl-watcher-push-updates` | **Date**: 2026-01-22 | **Spec**: [spec.md](spec.md)
+
+## Summary
+
+Replace all polling mechanisms in the SpecFlow dashboard with file-watching via chokidar. The orchestration runner will become fully event-driven, eliminating subprocess calls to `specflow status --json`. Session JSONL files will be watched to provide sub-500ms real-time updates.
+
+## Technical Context
+
+**Language/Version**: TypeScript 5.x (strict mode, ESM)
+**Primary Dependencies**: chokidar v3.x (existing), EventSource (SSE)
+**Storage**: File system watching (no database)
+**Testing**: Vitest (existing)
+**Target Platform**: Node.js 20.x, macOS/Linux
+**Project Type**: Monorepo (packages/dashboard, packages/shared)
+**Performance Goals**: <500ms latency for all real-time updates
+**Constraints**: macOS 256 file watcher limit, 200ms debounce
+**Scale/Scope**: Single user dashboard, ~10 concurrent projects max
+
+## Constitution Check
+
+- **Principle VIII** (Repo Knowledge vs Operational State): Session JSONL files are operational state - watched, not archived
+- **Principle VI** (Graceful Degradation): SSE auto-reconnects on failure
+- **Principle IIa** (TypeScript): All changes use TypeScript with strict mode
+
+## Project Structure
+
+### Documentation (this feature)
+
+```text
+specs/1056-jsonl-watcher/
+├── discovery.md         # Codebase examination findings
+├── spec.md              # Feature specification
+├── requirements.md      # Requirements checklist
+├── plan.md              # This file
+├── tasks.md             # Task breakdown
+└── checklists/          # Implementation & verification checklists
+```
+
+### Source Code (repository root)
+
+```text
+packages/dashboard/
+├── src/
+│   ├── app/api/events/route.ts    # SSE endpoint - emit new events
+│   ├── hooks/
+│   │   ├── use-sse.ts             # Handle new event types
+│   │   ├── use-session-content.ts # Convert to SSE-based
+│   │   ├── use-workflow-execution.ts  # DELETE
+│   │   ├── use-workflow-list.ts       # DELETE
+│   │   ├── use-session-history.ts     # DELETE
+│   │   └── use-session-messages.ts    # DELETE
+│   ├── lib/
+│   │   ├── watcher.ts             # Add session JSONL watching
+│   │   ├── session-polling-manager.ts  # DELETE
+│   │   └── services/
+│   │       └── orchestration-runner.ts # Event-driven conversion
+│   └── contexts/
+│       └── unified-data-context.tsx   # Session content from SSE
+
+packages/shared/
+└── src/schemas/
+    └── events.ts              # New SSE event type definitions
+```
+
+**Structure Decision**: Web app (backend + frontend in packages/dashboard)
+
+## Implementation Phases
+
+### Phase 0.5: Delete Polling Hooks
+
+Delete deprecated hooks first to establish clean baseline:
+- `use-workflow-execution.ts` - replaced by useProjectData
+- `use-workflow-list.ts` - replaced by useUnifiedData
+- `use-session-history.ts` - replaced by useProjectData.sessions
+- `use-session-messages.ts` - replaced by useSessionContent (SSE)
+- `session-polling-manager.ts` - replaced by file watching
+
+Fix any import errors after deletion.
+
+### Phase 1: Event Types & Schemas
+
+Add new SSE event types to `packages/shared/src/schemas/events.ts`:
+
+```typescript
+// Session events
+| { type: 'session:message'; projectId: string; sessionId: string; data: SessionMessage[] }
+| { type: 'session:question'; projectId: string; sessionId: string; data: Question }
+| { type: 'session:end'; projectId: string; sessionId: string }
+
+// Orchestration events
+| { type: 'orchestration:decision'; projectId: string; data: DecisionLogEntry }
+| { type: 'orchestration:batch'; projectId: string; data: BatchProgress }
+```
+
+### Phase 2: Session File Watching
+
+Extend watcher.ts to watch session JSONL files:
+
+1. Calculate session directory: `~/.claude/projects/{projectHash}/`
+2. Add glob pattern: `${sessionDir}/*.jsonl`
+3. On change: parse new lines, emit session:* events
+4. 100ms debounce for session files (faster than 200ms for project files)
+
+### Phase 3: Orchestration Runner Conversion
+
+Replace polling loop with event-driven:
+
+1. Subscribe to file change events
+2. Derive task counts from tasks.md parsing (no subprocess)
+3. Derive artifact existence from file system checks
+4. Replace `while(running) { sleep }` with event handlers
+5. Delete `getSpecflowStatus()` subprocess function
+
+### Phase 4: Client Hook Updates
+
+1. Update useSSE to handle session:* and orchestration:* events
+2. Update useSessionContent to read from SSE context
+3. Update unified-data-context to store session content
+
+## File Change Summary
+
+| File | Action | Purpose |
+|------|--------|---------|
+| `use-workflow-execution.ts` | DELETE | Deprecated polling |
+| `use-workflow-list.ts` | DELETE | Deprecated polling |
+| `use-session-history.ts` | DELETE | Deprecated polling |
+| `use-session-messages.ts` | DELETE | Deprecated polling |
+| `session-polling-manager.ts` | DELETE | Polling manager |
+| `packages/shared/src/schemas/events.ts` | MODIFY | New event types |
+| `src/lib/watcher.ts` | MODIFY | Session JSONL watching |
+| `src/app/api/events/route.ts` | MODIFY | Emit new events |
+| `src/hooks/use-sse.ts` | MODIFY | Handle new events |
+| `src/hooks/use-session-content.ts` | MODIFY | SSE-based |
+| `src/lib/services/orchestration-runner.ts` | MODIFY | Event-driven |
+| `src/contexts/unified-data-context.tsx` | MODIFY | Session from SSE |
+
+## Key Technical Decisions
+
+### Session Directory Calculation
+
+Use existing `calculateProjectHash()` from `src/lib/project-hash.ts`:
+
+```typescript
+import { getProjectSessionDir } from '@/lib/project-hash';
+
+// Claude stores session files in ~/.claude/projects/{dirName}/
+// where dirName is the project path with slashes replaced by dashes
+// e.g., /Users/dev/myproject -> -Users-dev-myproject
+
+const sessionDir = getProjectSessionDir(projectPath);
+// Returns: ~/.claude/projects/-Users-dev-myproject/
+```
+
+### Task Count Derivation
+
+```typescript
+import { readFile } from 'fs/promises';
+
+async function getTaskCounts(tasksPath: string): Promise<{ completed: number; total: number }> {
+  const content = await readFile(tasksPath, 'utf-8');
+  const lines = content.split('\n');
+
+  let total = 0;
+  let completed = 0;
+
+  for (const line of lines) {
+    const match = line.match(/^- \[([ xX])\] T\d{3}/);
+    if (match) {
+      total++;
+      if (match[1].toLowerCase() === 'x') completed++;
+    }
+  }
+
+  return { completed, total };
+}
+```
+
+### Debounce Configuration
+
+```typescript
+const DEBOUNCE_MS = {
+  project: 200,  // Existing, proven stable
+  session: 100,  // Faster for real-time feel
+};
+```
diff --git a/.specify/archive/1056-jsonl-watcher/requirements.md b/.specify/archive/1056-jsonl-watcher/requirements.md
new file mode 100644
index 0000000..f6ce248
--- /dev/null
+++ b/.specify/archive/1056-jsonl-watcher/requirements.md
@@ -0,0 +1,41 @@
+# Requirements Checklist: JSONL File Watcher
+
+**Phase**: 1056-jsonl-watcher
+**Created**: 2026-01-22
+
+## Functional Requirements
+
+- [ ] FR-001: Delete deprecated polling hooks (5 files)
+- [ ] FR-002: Add session JSONL file watching to chokidar
+- [ ] FR-003: Define session SSE event types (session:message, session:question, session:end)
+- [ ] FR-004: Define orchestration SSE event types (orchestration:decision, orchestration:batch)
+- [ ] FR-005: Emit session:message events on JSONL changes
+- [ ] FR-006: Parse JSONL to extract questions, emit session:question
+- [ ] FR-007: Detect session end markers, emit session:end
+- [ ] FR-008: Update useSessionContent to use SSE
+- [ ] FR-009: Update useSSE to handle new event types
+- [ ] FR-010: Remove subprocess calls from orchestration runner
+- [ ] FR-011: Derive task counts from tasks.md parsing
+- [ ] FR-012: Derive artifact existence from file system
+- [ ] FR-013: Event-driven orchestration loop
+- [ ] FR-014: Watch tasks.md per-phase
+- [ ] FR-015: Debounce 200ms project, 100ms session
+
+## Non-Functional Requirements
+
+- [ ] NFR-001: Session message latency <500ms
+- [ ] NFR-002: Question detection latency <200ms
+- [ ] NFR-003: Orchestration decision latency <500ms
+- [ ] NFR-004: Zero subprocess calls for status
+- [ ] NFR-005: Zero polling loops
+- [ ] NFR-006: Glob patterns for file watching (macOS limit)
+- [ ] NFR-007: Graceful JSONL parse error handling
+
+## Success Criteria
+
+- [ ] SC-001: Session latency 10x improvement
+- [ ] SC-002: Question detection 25x improvement
+- [ ] SC-003: Orchestration decision 6-10x improvement
+- [ ] SC-004: Subprocess calls eliminated
+- [ ] SC-005: Polling loops eliminated
+- [ ] SC-006: Connection recovery preserved
diff --git a/.specify/archive/1056-jsonl-watcher/spec.md b/.specify/archive/1056-jsonl-watcher/spec.md
new file mode 100644
index 0000000..a26b1c3
--- /dev/null
+++ b/.specify/archive/1056-jsonl-watcher/spec.md
@@ -0,0 +1,129 @@
+# Feature Specification: JSONL File Watcher & Polling Elimination
+
+**Feature Branch**: `1056-jsonl-watcher-push-updates`
+**Created**: 2026-01-22
+**Status**: Draft
+
+## ID Format Reference
+
+| ID Format | Type | Example | Used For |
+|-----------|------|---------|----------|
+| `FR-###` | Functional Requirement | FR-001 | Must-have functionality |
+| `NFR-###` | Non-Functional Requirement | NFR-001 | Performance, security, etc. |
+| `SC-###` | Success Criteria | SC-001 | Measurable outcomes |
+| `US-###` | User Story | US-001 | User journeys |
+
+**Traceability chain**: Phase Goal -> FR-### -> T### -> V-###
+
+---
+
+## User Scenarios & Testing
+
+### User Story 1 - Real-time Session Messages (Priority: P1)
+
+When a Claude Code session is running, the user sees session messages in the dashboard within 500ms of them being written to the JSONL file, without any polling.
+
+**Why this priority**: Core user experience - the dashboard exists to monitor sessions in real-time.
+
+**Independent Test**: Start a session, type a message, observe it appearing in the dashboard within 500ms.
+
+**Acceptance Scenarios**:
+
+1. **Given** a running Claude Code session, **When** Claude writes a message to the JSONL file, **Then** the message appears in the dashboard within 500ms
+2. **Given** a running session, **When** a question (AskUserQuestion tool) is written, **Then** the question notification appears within 200ms
+3. **Given** a running session, **When** the session ends (end marker written), **Then** the session status updates immediately
+
+---
+
+### User Story 2 - Event-Driven Orchestration (Priority: P1)
+
+The orchestration runner reacts to file changes instantly instead of polling every 3 seconds with a subprocess call.
+
+**Why this priority**: Performance bottleneck - eliminates ~20 subprocess calls/minute.
+
+**Independent Test**: Run orchestration, observe zero `specflow status --json` subprocess calls and decisions happening within 500ms of file changes.
+
+**Acceptance Scenarios**:
+
+1. **Given** orchestration is running, **When** tasks.md is updated, **Then** orchestration detects the change within 500ms without subprocess
+2. **Given** orchestration is in implement phase, **When** all tasks are marked complete in tasks.md, **Then** orchestration advances to verify phase
+3. **Given** orchestration is running, **When** spec.md/plan.md are created, **Then** orchestration detects artifacts exist
+
+---
+
+### User Story 3 - Clean Polling Removal (Priority: P2)
+
+All deprecated polling hooks are deleted and replaced with SSE-based alternatives.
+
+**Why this priority**: Technical debt cleanup - polling code is redundant with SSE infrastructure.
+
+**Independent Test**: Grep for setInterval in hooks, find zero polling loops.
+
+**Acceptance Scenarios**:
+
+1. **Given** the codebase, **When** searching for deprecated polling hooks, **Then** use-workflow-execution.ts, use-workflow-list.ts, use-session-history.ts, use-session-messages.ts, session-polling-manager.ts do not exist
+2. **Given** any component that used polling hooks, **When** rendered, **Then** it uses useUnifiedData or useSSE instead
+
+---
+
+### Edge Cases
+
+- What happens when a JSONL file is malformed? -> Skip malformed lines, log warning
+- What happens when chokidar fails to initialize? -> Graceful degradation, log error, dashboard shows stale data
+- What happens when too many files are watched (macOS limit)? -> Use glob patterns, monitor watcher count
+- What happens when SSE connection drops? -> Auto-reconnect (existing behavior), show stale data during disconnection
+
+## Requirements
+
+### Functional Requirements
+
+- **FR-001**: System MUST delete deprecated polling hooks: use-workflow-execution.ts, use-workflow-list.ts, use-session-history.ts, use-session-messages.ts, session-polling-manager.ts
+- **FR-002**: System MUST add session JSONL file watching to chokidar watcher for paths `~/.claude/projects/{hash}/*.jsonl`
+- **FR-003**: System MUST define new SSE event types: session:message, session:question, session:end
+- **FR-004**: System MUST define new SSE event types: orchestration:decision, orchestration:batch
+- **FR-005**: System MUST emit session:message events when JSONL file content changes
+- **FR-006**: System MUST parse JSONL files to extract questions (AskUserQuestion tool calls) and emit session:question events
+- **FR-007**: System MUST detect session end markers in JSONL and emit session:end events
+- **FR-008**: System MUST update useSessionContent hook to consume SSE events instead of polling
+- **FR-009**: System MUST update useSSE hook to handle new session and orchestration event types
+- **FR-010**: Orchestration runner MUST NOT call `specflow status --json` subprocess
+- **FR-011**: Orchestration runner MUST derive task counts by parsing tasks.md directly
+- **FR-012**: Orchestration runner MUST derive artifact existence by checking file system directly
+- **FR-013**: Orchestration runner MUST use event-driven loop (file change triggers decision) instead of sleep-poll loop
+- **FR-014**: System MUST watch tasks.md files per-phase for orchestration task tracking
+- **FR-015**: System MUST use 200ms debounce for project files, 100ms for session files
+
+### Non-Functional Requirements
+
+- **NFR-001**: Session message latency MUST be <500ms from file write to UI update
+- **NFR-002**: Question detection latency MUST be <200ms from file write to notification
+- **NFR-003**: Orchestration decision latency MUST be <500ms from file change to decision
+- **NFR-004**: System MUST use zero subprocess calls for status during orchestration
+- **NFR-005**: System MUST have zero polling loops (setInterval for data fetching)
+- **NFR-006**: File watcher MUST use glob patterns to stay within macOS 256 watcher limit
+- **NFR-007**: System MUST handle malformed JSONL lines gracefully (skip, don't crash)
+
+### Key Entities
+
+- **SessionFile**: JSONL file at `~/.claude/projects/{hash}/{sessionId}.jsonl` containing session messages
+- **SessionMessage**: Individual line in JSONL file representing a message, tool call, or event
+- **SSEEvent**: Server-sent event with type discriminator (session:message, session:question, etc.)
+
+## Success Criteria
+
+### Measurable Outcomes
+
+- **SC-001**: Session message latency 0-5s -> <500ms (10x improvement)
+- **SC-002**: Question detection latency 0-5s -> <200ms (25x improvement)
+- **SC-003**: Orchestration decision latency 3-5s -> <500ms (6-10x improvement)
+- **SC-004**: Subprocess calls per minute ~20 -> 0 (complete elimination)
+- **SC-005**: Polling loops in codebase 9+ -> 0 (complete elimination)
+- **SC-006**: Connection recovery works on network interruption (existing behavior preserved)
+
+---
+
+## Memory Promotion Markers
+
+`[PROMOTE]` File watching with 200ms debounce is proven stable for project files; use 100ms for higher-frequency session files.
+
+`[PROMOTE]` Use glob patterns for file watching to avoid macOS 256 watcher limit.
diff --git a/.specify/archive/1056-jsonl-watcher/tasks.md b/.specify/archive/1056-jsonl-watcher/tasks.md
new file mode 100644
index 0000000..c24445d
--- /dev/null
+++ b/.specify/archive/1056-jsonl-watcher/tasks.md
@@ -0,0 +1,166 @@
+# Tasks: JSONL File Watcher & Polling Elimination
+
+## Phase Goals Coverage
+
+| # | Phase Goal | Spec Requirement(s) | Task(s) | Status |
+|---|------------|---------------------|---------|--------|
+| 1 | Replace all polling with file-watching | FR-002, FR-013, FR-014, FR-015 | T008-T015, T021-T026 | COVERED |
+| 2 | Zero polling loops when complete | FR-001, NFR-005 | T001-T007 | COVERED |
+| 3 | Session messages appear within 500ms | FR-002, FR-005, FR-008, NFR-001 | T008-T012, T018-T020 | COVERED |
+| 4 | Questions appear instantly (<200ms) | FR-006, NFR-002 | T010, T011 | COVERED |
+| 5 | Orchestration updates without polling | FR-010, FR-011, FR-012, FR-013, NFR-003 | T021-T026 | COVERED |
+| 6 | No specflow status --json subprocess calls | FR-010, FR-011, FR-012, NFR-004 | T022-T024 | COVERED |
+
+Coverage: 6/6 goals (100%)
+
+---
+
+## Progress Dashboard
+
+> Last updated: 2026-01-22 | Run `specflow tasks sync` to refresh
+
+| Phase | Status | Progress |
+|-------|--------|----------|
+| Setup | PENDING | 0/0 |
+| Phase 0.5: Delete Polling | PENDING | 0/7 |
+| US1: Session Watching | PENDING | 0/12 |
+| US2: Event-Driven Orchestration | PENDING | 0/6 |
+| US3: Clean Polling Removal | PENDING | 0/4 |
+| Polish | PENDING | 0/2 |
+
+**Overall**: 0/31 (0%) | **Current**: None
+
+---
+
+## Phase 0.5: Delete Polling Hooks (Clean Slate)
+
+**Purpose**: Remove deprecated polling code before building new infrastructure
+
+- [x] T001 [P] [US3] Delete packages/dashboard/src/hooks/use-workflow-execution.ts
+- [x] T002 [P] [US3] Delete packages/dashboard/src/hooks/use-workflow-list.ts
+- [x] T003 [P] [US3] Delete packages/dashboard/src/hooks/use-session-history.ts
+- [x] T004 [P] [US3] Delete packages/dashboard/src/hooks/use-session-messages.ts
+- [x] T005 [P] [US3] Delete packages/dashboard/src/lib/session-polling-manager.ts
+- [x] T006 [US3] Fix import errors from deleted files in packages/dashboard/src/
+- [x] T007 [US3] Verify build passes with pnpm build:dashboard
+
+**Checkpoint**: All polling code deleted, build passes
+
+---
+
+## Phase 1: Session File Watching (Priority: P1)
+
+**Goal**: Watch session JSONL files and emit SSE events
+
+**Independent Test**: Start session, type message, see it in dashboard within 500ms
+
+### Event Schema Updates
+
+- [x] T008 [P] [US1] Add SessionMessageSchema to packages/shared/src/schemas/events.ts
+- [x] T009 [P] [US1] Add session:message, session:question, session:end event types to SSEEventSchema
+- [x] T010 [US1] Add QuestionSchema for AskUserQuestion detection in packages/shared/src/schemas/events.ts
+
+### Watcher Extension
+
+- [x] T011 [US1] Add getSessionDirectory() function to packages/dashboard/src/lib/watcher.ts
+- [x] T012 [US1] Add watchSessionFiles() to watch ~/.claude/projects/{hash}/*.jsonl in watcher.ts
+- [x] T013 [US1] Implement handleSessionFileChange() to parse JSONL and detect new messages in watcher.ts
+- [x] T014 [US1] Add parseSessionLines() to extract messages from JSONL content in watcher.ts
+- [x] T015 [US1] Add extractQuestions() to detect AskUserQuestion tool calls in watcher.ts
+
+### SSE Endpoint Updates
+
+- [x] T016 [US1] Add session event handlers to packages/dashboard/src/app/api/events/route.ts
+- [x] T017 [US1] Broadcast session:message events when session content changes in route.ts
+
+### Client Hook Updates
+
+- [x] T018 [US1] Add session:message case handler to packages/dashboard/src/hooks/use-sse.ts
+- [x] T019 [US1] Update useSessionContent to read from SSE context in packages/dashboard/src/hooks/use-session-content.ts
+- [x] T020 [US1] Add sessionContent Map to unified-data-context.tsx
+
+**Checkpoint**: Session messages appear in dashboard within 500ms of file write
+
+---
+
+## Phase 2: Event-Driven Orchestration (Priority: P1)
+
+**Goal**: Orchestration runner reacts to file changes, no subprocess
+
+**Independent Test**: Run orchestration, observe zero subprocess calls, decisions within 500ms
+
+### Subprocess Elimination
+
+- [x] T021 [US2] Add getTaskCounts() function to parse tasks.md directly in packages/dashboard/src/lib/services/orchestration-runner.ts
+- [x] T022 [US2] Add checkArtifactExistence() to check spec.md/plan.md/tasks.md via fs in orchestration-runner.ts
+- [x] T023 [US2] Delete getSpecflowStatus() subprocess function from orchestration-runner.ts
+- [x] T024 [US2] Replace specflow status --json calls with getTaskCounts() + checkArtifactExistence()
+
+### Event-Driven Loop
+
+- [x] T025 [US2] Add subscribeToFileEvents() to listen for watcher events in orchestration-runner.ts
+- [x] T026 [US2] Replace while(running) { sleep } loop with event-triggered decision cycle in orchestration-runner.ts
+
+**Checkpoint**: Orchestration runs with zero subprocess calls, 500ms decision latency
+
+---
+
+## Phase 3: Clean Polling Removal (Priority: P2)
+
+**Goal**: Verify zero polling loops remain
+
+**Independent Test**: grep for setInterval in src/hooks, find zero data-polling loops
+
+- [x] T027 [US3] Audit all useEffect with setInterval patterns in packages/dashboard/src/hooks/
+- [x] T028 [US3] Remove any remaining polling patterns (except UI animation timers)
+- [x] T029 [US3] Update components that imported deleted hooks to use SSE alternatives
+- [x] T030 [US3] Add eslint rule to prevent setInterval in hooks (optional)
+
+**Checkpoint**: Zero setInterval patterns for data fetching
+
+---
+
+## Phase 4: Polish & Verification
+
+**Purpose**: Final cleanup and verification
+
+- [x] T031 Run pnpm test:dashboard to verify all tests pass
+- [x] T032 Manual verification: start session, verify <500ms message latency
+
+---
+
+## Dependencies & Execution Order
+
+### Phase Dependencies
+
+- **Phase 0.5 (Delete Polling)**: No dependencies - start immediately
+- **Phase 1 (Session Watching)**: Depends on T008-T010 (schemas) before T011-T020
+- **Phase 2 (Orchestration)**: Can run parallel to Phase 1 after Phase 0.5
+- **Phase 3 (Clean Removal)**: Depends on Phase 1 & 2 completion
+- **Phase 4 (Polish)**: Depends on all above
+
+### Task Dependencies
+
+- T006 depends on T001-T005 (fix imports after deletion)
+- T007 depends on T006 (verify build after fixes)
+- T011-T015 depend on T008-T010 (schemas first)
+- T016-T017 depend on T011-T015 (watcher before SSE)
+- T018-T020 depend on T016-T017 (SSE before hooks)
+- T024 depends on T021-T023 (helpers before replacement)
+- T026 depends on T024-T025 (event subscription before loop)
+
+### Parallel Opportunities
+
+- T001-T005: All file deletions can run in parallel
+- T008-T010: All schema additions can run in parallel
+- T021-T022: Both helper functions can be written in parallel
+- Phase 1 & Phase 2 can run in parallel after Phase 0.5
+
+---
+
+## Notes
+
+- [P] tasks = different files, no dependencies
+- [US#] = User Story mapping for traceability
+- Commit after each phase completion
+- 100ms debounce for session files, 200ms for project files
diff --git a/.specify/archive/1057-orchestration-simplification/SIMPLIFICATION_PLAN.md b/.specify/archive/1057-orchestration-simplification/SIMPLIFICATION_PLAN.md
new file mode 100644
index 0000000..b25fbc3
--- /dev/null
+++ b/.specify/archive/1057-orchestration-simplification/SIMPLIFICATION_PLAN.md
@@ -0,0 +1,365 @@
+# Orchestration Simplification Plan
+
+## Problem Statement
+
+The dashboard's orchestration system has become a mess of hacks working around edge cases instead of having a clean design. There are multiple sources of truth (CLI state file vs dashboard OrchestrationExecution), reconciliation hacks, guards that block decisions after they're already wrong, and a Claude analyzer as a fallback when nothing makes sense.
+
+## Goals
+
+1. **Single source of truth**: `.specflow/orchestration-state.json` is THE state
+2. **Dead simple flow**: design → analyze → implement (batches) → verify → merge
+3. **Trust sub-commands**: They update step.status; dashboard auto-heals if needed
+4. **Clean decision logic**: No hacks, no guards, no reconciliation between parallel states
+
+---
+
+## Architecture Overview
+
+```
+┌─────────────────────────────────────────────────────────────────────┐
+│                         Dashboard                                    │
+│  ┌─────────────────┐    ┌──────────────────┐    ┌───────────────┐  │
+│  │  Orchestration  │───>│  Claude CLI      │───>│  specflow CLI │  │
+│  │  Runner         │    │  Session         │    │  state set    │  │
+│  └────────┬────────┘    └──────────────────┘    └───────┬───────┘  │
+│           │                                              │          │
+│           │ watches                                      │ writes   │
+│           ▼                                              ▼          │
+│  ┌─────────────────────────────────────────────────────────────┐   │
+│  │              .specflow/orchestration-state.json              │   │
+│  │  (SINGLE SOURCE OF TRUTH)                                    │   │
+│  └─────────────────────────────────────────────────────────────┘   │
+└─────────────────────────────────────────────────────────────────────┘
+```
+
+**Flow**:
+1. Dashboard reads state file
+2. Dashboard decides what to spawn based on state
+3. Dashboard spawns Claude CLI session with skill (/flow.design, etc.)
+4. Claude CLI runs skill, skill calls `specflow state set` to update state
+5. Dashboard watches state file for changes
+6. When session ends AND step.status=complete, move to next step
+7. If state doesn't match expectations, auto-heal (simple rules, Claude fallback)
+
+---
+
+## Phase 1: Consolidate State (Remove OrchestrationExecution)
+
+### Current Problem
+- `OrchestrationExecution` in dashboard maintains: currentPhase, batches, status, config, executions, decisionLog, totalCostUsd
+- CLI state file maintains: step.current, step.status, step.index, phase info
+- These drift apart, causing confusion
+
+### Solution
+Extend the CLI state schema to include dashboard-specific fields:
+
+```typescript
+// Add to orchestration section of state file
+orchestration: {
+  // ... existing fields (step, phase, progress, etc.)
+
+  // NEW: Dashboard orchestration tracking
+  dashboard: {
+    // Active orchestration (null if none)
+    active: {
+      id: string;              // UUID for this orchestration run
+      startedAt: string;       // ISO timestamp
+      config: OrchestrationConfig;  // User's config choices
+    } | null;
+
+    // Batch tracking for implement phase
+    batches: {
+      total: number;
+      current: number;
+      items: Array<{
+        section: string;
+        taskIds: string[];
+        status: 'pending' | 'running' | 'completed' | 'failed' | 'healed';
+        workflowId?: string;
+        healAttempts: number;
+      }>;
+    };
+
+    // Cost tracking
+    cost: {
+      total: number;
+      perBatch: number[];
+    };
+
+    // Decision log (last 20)
+    decisionLog: Array<{
+      timestamp: string;
+      action: string;
+      reason: string;
+    }>;
+
+    // Last workflow tracking
+    lastWorkflow: {
+      id: string;
+      skill: string;
+      status: 'running' | 'completed' | 'failed' | 'cancelled';
+    } | null;
+  }
+}
+```
+
+### Tasks
+1. [ ] Update `OrchestrationStateSchema` in `packages/shared/src/schemas/events.ts`
+2. [ ] Add `specflow state set orchestration.dashboard.*` support
+3. [ ] Remove `OrchestrationExecution` type and storage
+4. [ ] Update `orchestration-service.ts` to read/write via specflow CLI (or direct file with schema validation)
+5. [ ] Remove `orchestration-execution.ts` schema
+
+---
+
+## Phase 2: Simplify Decision Logic
+
+### Current Problem
+- `orchestration-decisions.ts` has complex logic
+- `orchestration-runner.ts` has legacy `makeDecision()` plus adapter pattern
+- Guards that block transitions after wrong decisions
+- Claude analyzer fallback when state is unclear
+
+### Solution
+Simple decision matrix based on state file:
+
+```typescript
+function getNextAction(state: OrchestrationState): Decision {
+  const { step, dashboard } = state.orchestration;
+  const workflow = dashboard?.lastWorkflow;
+
+  // 1. If no active orchestration, nothing to do
+  if (!dashboard?.active) {
+    return { action: 'idle', reason: 'No active orchestration' };
+  }
+
+  // 2. If workflow is running, wait
+  if (workflow?.status === 'running') {
+    return { action: 'wait', reason: 'Workflow running' };
+  }
+
+  // 3. Based on current step and status
+  switch (step.current) {
+    case 'design':
+      if (step.status === 'complete') return transition('analyze');
+      if (step.status === 'failed') return heal('design');
+      if (!workflow) return spawn('flow.design');
+      return { action: 'wait', reason: 'Design in progress' };
+
+    case 'analyze':
+      if (step.status === 'complete') return transition('implement');
+      if (step.status === 'failed') return heal('analyze');
+      if (!workflow) return spawn('flow.analyze');
+      return { action: 'wait', reason: 'Analyze in progress' };
+
+    case 'implement':
+      return handleImplementBatches(state);
+
+    case 'verify':
+      if (step.status === 'complete') return mergeOrWait(state);
+      if (step.status === 'failed') return heal('verify');
+      if (!workflow) return spawn('flow.verify');
+      return { action: 'wait', reason: 'Verify in progress' };
+
+    default:
+      return { action: 'wait', reason: 'Unknown step' };
+  }
+}
+
+function handleImplementBatches(state): Decision {
+  const { batches } = state.orchestration.dashboard;
+
+  // All batches done?
+  if (allBatchesComplete(batches)) {
+    return transition('verify');
+  }
+
+  const currentBatch = batches.items[batches.current];
+
+  // Current batch failed?
+  if (currentBatch.status === 'failed') {
+    if (canHeal(currentBatch)) return healBatch(batches.current);
+    return { action: 'needs_attention', reason: 'Batch failed' };
+  }
+
+  // Current batch pending?
+  if (currentBatch.status === 'pending') {
+    return spawnBatch(currentBatch);
+  }
+
+  // Current batch complete? Move to next
+  if (currentBatch.status === 'completed') {
+    return advanceBatch();
+  }
+
+  return { action: 'wait', reason: 'Batch in progress' };
+}
+```
+
+### Tasks
+1. [ ] Rewrite `orchestration-decisions.ts` with simplified logic above
+2. [ ] Remove legacy `makeDecision()` from runner
+3. [ ] Remove `createDecisionInput()` adapter
+4. [ ] Remove guards that block after-the-fact
+5. [ ] Remove Claude analyzer fallback (replaced by simple heal logic)
+
+---
+
+## Phase 3: Fix State Transitions
+
+### Current Problem
+- Dashboard tries to reconcile its currentPhase with CLI's step.current
+- Hack at line 889-893: "if mismatch, treat as not_started"
+- `isPhaseComplete()` checks artifacts instead of trusting state
+
+### Solution
+Trust the state file. Period.
+
+```typescript
+// REMOVE THIS:
+const stepStatus = (stateFileStep === orchestration.currentPhase && rawStatus && ...)
+  ? rawStatus
+  : 'not_started';  // HACK
+
+// REPLACE WITH:
+const stepStatus = state.orchestration.step.status;
+const stepCurrent = state.orchestration.step.current;
+// That's it. Trust the state.
+```
+
+### Auto-Heal Rules (Simple)
+
+After a workflow ends, check state matches expectations:
+
+| Skill | Expected State | Auto-Heal If |
+|-------|---------------|--------------|
+| flow.design | step.current=design, step.status=complete | status != complete → set to complete |
+| flow.analyze | step.current=analyze, step.status=complete | status != complete → set to complete |
+| flow.implement | (batch-specific) | batch status not updated → mark complete |
+| flow.verify | step.current=verify, step.status=complete | status != complete → set to complete |
+
+If heal rule doesn't apply (ambiguous case), spawn Claude helper to analyze and fix.
+
+### Tasks
+1. [ ] Remove `isPhaseComplete()` function (or make it only check state)
+2. [ ] Remove state reconciliation hack (line 889-893)
+3. [ ] Add `autoHealAfterWorkflow()` function with simple rules
+4. [ ] Add Claude helper fallback for ambiguous cases only
+
+---
+
+## Phase 4: Clean Up Batch Handling
+
+### Current Problem
+- Batch completion uses `every()` on empty array (returns true = bug)
+- Guards prevent implement→verify transition when batches incomplete
+- Batches initialized late (during implement transition)
+
+### Solution
+Initialize batches when orchestration starts, track in state file:
+
+```typescript
+async function startOrchestration(projectPath: string, config: OrchestrationConfig) {
+  // 1. Parse batches from tasks.md NOW
+  const batchPlan = parseBatchesFromProject(projectPath, config.batchSizeFallback);
+
+  // 2. Initialize state with batches
+  await execAsync(`specflow state set \
+    orchestration.dashboard.active.id=${uuid()} \
+    orchestration.dashboard.active.startedAt=${new Date().toISOString()} \
+    orchestration.dashboard.batches.total=${batchPlan.batches.length} \
+    orchestration.dashboard.batches.current=0 \
+    orchestration.dashboard.batches.items='${JSON.stringify(batchPlan.batches)}'
+  `);
+
+  // 3. Start from current step (trust state file)
+  // Decision logic will spawn appropriate workflow
+}
+```
+
+### Tasks
+1. [ ] Move batch initialization to orchestration start
+2. [ ] Update batch status via `specflow state set` not direct writes
+3. [ ] Remove empty array guards (not needed if initialized properly)
+4. [ ] Remove batch-specific guards in executeDecision
+
+---
+
+## Phase 5: Remove Hacks
+
+List of specific hacks to remove once above is implemented:
+
+| Location | Hack | Remove When |
+|----------|------|-------------|
+| runner:889-893 | State reconciliation | Phase 3 complete |
+| runner:1134-1142 | Workflow lookup fallback | Phase 1 complete (tracked in state) |
+| runner:1450-1454 | Claude analyzer fallback | Phase 2 complete |
+| runner:1570-1584 | Batch completion guard | Phase 4 complete |
+| runner:1030-1037 | Empty array guard | Phase 4 complete |
+| service:291-295 | Circular phase completion | Phase 3 complete |
+
+---
+
+## Phase 6: UI Enhancements
+
+### Manual Step Override
+Add ability for user to manually go back to a previous step:
+
+```tsx
+// In OrchestrationProgress or similar
+<Button onClick={() => setStep('analyze')}>
+  Go back to Analyze
+</Button>
+```
+
+Implementation:
+```typescript
+async function setStepManually(step: string) {
+  await execAsync(`specflow state set \
+    orchestration.step.current=${step} \
+    orchestration.step.status=not_started
+  `);
+  // Orchestration runner will detect change and spawn appropriate workflow
+}
+```
+
+### Tasks
+1. [ ] Add step override buttons to UI
+2. [ ] Show current state clearly (what step we're on, what status)
+3. [ ] Add warning when external changes detected
+
+---
+
+## Implementation Order
+
+1. **Phase 1**: Consolidate state (biggest change, enables everything else)
+2. **Phase 4**: Clean up batch handling (depends on Phase 1)
+3. **Phase 3**: Fix state transitions (depends on Phase 1)
+4. **Phase 2**: Simplify decision logic (depends on Phase 1, 3, 4)
+5. **Phase 5**: Remove hacks (depends on all above)
+6. **Phase 6**: UI enhancements (can be parallel)
+
+---
+
+## Success Criteria
+
+- [ ] Single state file (no OrchestrationExecution)
+- [ ] Decision logic < 100 lines (currently ~700)
+- [ ] No reconciliation hacks
+- [ ] No guards that block after wrong decisions
+- [ ] No Claude analyzer fallback (simple heal rules only)
+- [ ] User can manually override step if needed
+- [ ] External runs (manual /flow.implement) don't break orchestration
+
+---
+
+## Scope Clarifications
+
+**In Scope (if needed for state management)**:
+- Updates to /flow.* commands for state-setting logic
+- Updates to specflow CLI core commands for state management
+- Schema extensions for dashboard tracking
+
+**Out of Scope**:
+- Major UI redesign (just adding step override)
+- Changes to /flow.* command core logic (design artifacts, TDD workflow, etc.)
diff --git a/.specify/archive/1057-orchestration-simplification/checklists/implementation.md b/.specify/archive/1057-orchestration-simplification/checklists/implementation.md
new file mode 100644
index 0000000..1f4060d
--- /dev/null
+++ b/.specify/archive/1057-orchestration-simplification/checklists/implementation.md
@@ -0,0 +1,94 @@
+# Implementation Checklist: Orchestration Simplification
+
+**Purpose**: Verify requirements quality and implementation readiness before coding begins
+**Created**: 2026-01-23
+**Feature**: [plan.md](../plan.md)
+**Phase**: 1057
+
+**Note**: This checklist is generated by `/flow.design` and verified during `/flow.implement`.
+
+## Checklist ID Format
+
+All items use `I-###` prefix (e.g., I-001, I-002).
+Mark complete with: `specflow mark I-001`
+
+---
+
+## Requirements Completeness
+
+Verify all necessary requirements are present in plan.md:
+
+- [ ] I-001 Decision matrix conditions (G1.1-G1.18) are fully specified
+- [ ] I-002 Batch state machine conditions (G2.1-G2.10) are fully specified
+- [ ] I-003 Claude Helper use cases (G3.1-G3.17) are fully specified
+- [ ] I-004 Question flow data plumbing (G4.1-G4.8) is documented
+- [ ] I-005 Race mitigation patterns (G5.1-G5.13) are documented
+
+## Requirements Clarity
+
+Verify requirements are specific and unambiguous:
+
+- [ ] I-010 Stale threshold is explicit: 10 minutes fixed (not configurable)
+- [ ] I-011 Valid step values are explicit: design, analyze, implement, verify, merge
+- [ ] I-012 Valid status values are explicit: not_started, pending, in_progress, complete, failed, blocked, skipped
+- [ ] I-013 Atomic write pattern is specified: write to .tmp, then rename
+- [ ] I-014 Claude Helper budget limits are specified: $1.0 for state recovery, $0.5 for stale diagnosis
+
+## Scenario Coverage
+
+Verify all conditions in decision matrix:
+
+- [ ] I-020 Running workflow scenarios covered (G1.4-G1.7)
+- [ ] I-021 Step complete scenarios covered (G1.8-G1.12)
+- [ ] I-022 Error state scenarios covered (G1.13-G1.14)
+- [ ] I-023 Spawn scenarios covered (G1.15-G1.17)
+- [ ] I-024 Batch scenarios covered (G2.1-G2.10)
+
+## Dependencies & Assumptions
+
+Verify external dependencies are documented:
+
+- [ ] I-030 Claude Helper API requirements documented
+- [ ] I-031 File watching requirements (chokidar) documented
+- [ ] I-032 State file format (OrchestrationStateSchema, OrchestrationExecutionSchema) documented
+- [ ] I-033 SSE event types documented (session:question, session:created, session:activity)
+- [ ] I-034 Project hash algorithm for CLI session detection documented
+
+## Task Readiness
+
+Verify tasks.md is implementation-ready:
+
+- [ ] I-040 Every task has clear file path
+- [ ] I-041 Task dependencies are explicit (phases ordered by dependency)
+- [ ] I-042 Parallel opportunities marked with [P]
+- [ ] I-043 Tasks are sized appropriately (single concern per task)
+- [ ] I-044 Test tasks identified with test file locations
+
+---
+
+## Architecture Readiness
+
+Verify pure function extraction is planned:
+
+- [ ] I-050 `makeDecision()` is designed as pure function (no I/O)
+- [ ] I-051 `handleImplementBatching()` is designed as pure function
+- [ ] I-052 `validateState()` is designed as pure function
+- [ ] I-053 `OrchestrationDeps` interface is designed for DI
+- [ ] I-054 Clock abstraction is included in deps for time-based logic
+
+## State Ownership
+
+Verify state ownership pattern is clear:
+
+- [ ] I-060 Orchestrate owns step transitions (step.current, step.index)
+- [ ] I-061 Sub-commands only update step.status
+- [ ] I-062 Two state files relationship is documented
+- [ ] I-063 Cross-file invariants are specified
+
+---
+
+## Notes
+
+- Address any unchecked items before starting implementation
+- Items blocking implementation should be resolved by updating plan.md
+- Use `specflow mark I-### --blocked "reason"` for items that cannot be resolved
diff --git a/.specify/archive/1057-orchestration-simplification/checklists/verification.md b/.specify/archive/1057-orchestration-simplification/checklists/verification.md
new file mode 100644
index 0000000..88ccef2
--- /dev/null
+++ b/.specify/archive/1057-orchestration-simplification/checklists/verification.md
@@ -0,0 +1,169 @@
+# Verification Checklist: Orchestration Simplification
+
+**Purpose**: Verify implementation quality and completeness after coding is done
+**Created**: 2026-01-23
+**Feature**: [plan.md](../plan.md)
+**Phase**: 1057
+
+**Note**: This checklist is verified during `/flow.verify` before phase completion.
+
+## Checklist ID Format
+
+All items use `V-###` prefix (e.g., V-001, V-002).
+Mark complete with: `specflow mark V-001`
+
+---
+
+## Phase Goal Verification
+
+Verify all phase goals from `.specify/phases/1057-orchestration-simplification.md` are achieved:
+
+- [ ] V-001 Goal 1: Trust step.status - orchestration advances based on step.status, not artifact existence
+- [ ] V-002 Goal 2: Complete decision matrix - every state combination has explicit action
+- [ ] V-003 Goal 3: Fix question flow - question toast appears when workflow needs input
+- [ ] V-004 Goal 4: Claude Helper for 3 cases only - with explicit fallback chains
+- [ ] V-005 Goal 5: Eliminate race conditions - atomic writes, spawn intent pattern working
+- [ ] V-006 Goal 6: Code simplified - duplicate logic consolidated
+
+## Decision Matrix Verification (G1)
+
+Verify all decision matrix conditions work correctly:
+
+- [ ] V-010 [G1.1] Budget exceeded → fail action triggers
+- [ ] V-011 [G1.2] Duration > 4 hours → needs_attention triggers
+- [ ] V-012 [G1.4] Running workflow + recent activity → wait action
+- [ ] V-013 [G1.5] Stale workflow (>10 min) → recover_stale triggers
+- [ ] V-014 [G1.8] Verify complete + USER_GATE pending → wait_user_gate
+- [ ] V-015 [G1.9] Verify complete + autoMerge=false → wait_merge
+- [ ] V-016 [G1.10] Verify complete + autoMerge=true → transitions to merge
+- [ ] V-017 [G1.13-14] Failed/blocked step → recover_failed triggers
+
+## Batch State Machine Verification (G2)
+
+Verify batch handling works correctly:
+
+- [ ] V-020 [G2.1] No batches → initialize_batches triggers
+- [ ] V-021 [G2.4] Pending batch + no workflow → spawn_batch triggers
+- [ ] V-022 [G2.6] Batch complete + pauseBetweenBatches → pause triggers
+- [ ] V-023 [G2.7] Batch complete + continue → advance_batch triggers
+- [ ] V-024 [G2.9-10] Failed batch → heal or recover_failed based on attempts
+
+## Claude Helper Verification (G3)
+
+Verify Claude Helper works for exactly 3 cases:
+
+- [ ] V-030 [G3.2] State recovery creates .bak backup BEFORE recovery
+- [ ] V-031 [G3.5] State recovery fallback to heuristic is silent
+- [ ] V-032 [G3.10] Stale workflow fallback to needs_attention is silent
+- [ ] V-033 [G3.15-16] Failed step fallback to retry or needs_attention is silent
+- [ ] V-034 [G3.17] Grep shows Claude Helper ONLY called for these 3 cases
+
+## Question Flow Verification (G4)
+
+Verify question data flows to UI:
+
+- [ ] V-040 [G4.1] Watcher detects questions and emits session:question event
+- [ ] V-041 [G4.3] use-sse.ts populates sessionQuestions on event
+- [ ] V-042 [G4.6] decisionQuestions is NOT hardcoded to []
+- [ ] V-043 [G4.8] Questions cleared from map after user answers
+
+## Race Mitigation Verification (G5)
+
+Verify race conditions are prevented:
+
+- [ ] V-050 [G5.1-2] State writes use atomic temp file + rename pattern
+- [ ] V-051 [G5.3-7] Spawn intent pattern prevents duplicate spawns
+- [ ] V-052 [G5.8-10] Runner state persists across dashboard restart
+- [ ] V-053 [G5.11-13] Event sleep uses Set of callbacks (not single)
+
+## Session Tracking Verification (G6)
+
+Verify unified session tracking works:
+
+- [ ] V-060 [G6.1-5] External CLI sessions detected via JSONL watching
+- [ ] V-061 [G6.6-7] Omnibox commands update orchestration state
+- [ ] V-062 [G6.8-11] Pause/play button works, omnibox can resume
+
+## State Validation Verification (G7)
+
+Verify state validation catches errors:
+
+- [ ] V-070 [G7.1] Invalid step.index is detected
+- [ ] V-071 [G7.5] Invalid batches.current is detected
+- [ ] V-072 [G7.6] Missing recoveryContext when needs_attention is detected
+- [ ] V-073 [G7.7] Cross-file inconsistency is detected
+
+## Code Quality
+
+Verify implementation meets coding standards:
+
+- [ ] V-080 All tests pass (`pnpm test:dashboard`)
+- [ ] V-081 No linting errors (`pnpm lint`)
+- [ ] V-082 Type checking passes (`pnpm typecheck`)
+- [ ] V-083 No TODO/FIXME comments remain in new code
+
+## Code Cleanup Verification (G10)
+
+Verify obsolete code is removed:
+
+- [ ] V-090 [G10.1] No hasPlan/hasTasks/hasSpec checks in decision logic: `grep -n "hasPlan\|hasTasks\|hasSpec" orchestration-runner.ts` returns nothing
+- [ ] V-091 [G10.2-3] Duplicate functions consolidated
+- [ ] V-092 [G10.4] orchestration-service.ts contains only persistence logic
+
+## Test Coverage Verification (G11)
+
+Verify tests exist and pass:
+
+- [ ] V-100 [G11.1] Unit tests for makeDecision() cover all conditions
+- [ ] V-101 [G11.2] Unit tests for handleImplementBatching() cover all conditions
+- [ ] V-102 [G11.3] Unit tests for validateState() cover all conditions
+- [ ] V-103 [G11.5] Happy path integration test passes
+- [ ] V-104 [G11.12] Race condition test prevents duplicate spawns
+
+---
+
+## USER GATE Verification
+
+**USER GATE**: User must manually verify these items:
+
+- [ ] V-GATE-01 Start orchestration on a test phase
+- [ ] V-GATE-02 Orchestration advances based on step.status (not artifacts)
+- [ ] V-GATE-03 Batch handling: implement with multiple batches → each spawned sequentially
+- [ ] V-GATE-04 When workflow needs input, question toast appears
+- [ ] V-GATE-05 Answer question, workflow resumes
+- [ ] V-GATE-06 If step fails, Claude Helper diagnoses and recovers (silent fallback if Claude fails)
+- [ ] V-GATE-07 With autoMerge=false: verify complete → wait_merge → user triggers
+- [ ] V-GATE-08 With autoMerge=true: verify complete → merge runs automatically (no prompt)
+- [ ] V-GATE-09 Rapid triggers don't spawn duplicate workflows
+- [ ] V-GATE-10 Pause button → Play button when paused
+- [ ] V-GATE-11 Omnibox command resumes paused orchestration
+- [ ] V-GATE-12 Start session from external CLI terminal → dashboard detects it
+- [ ] V-GATE-13 Decision log appears correctly in Phase Completion card
+- [ ] V-GATE-14 Orchestration completes successfully
+
+---
+
+## Quick Verification Commands
+
+```bash
+# V-090: No artifact checks in decision logic
+grep -n "hasPlan\|hasTasks\|hasSpec" packages/dashboard/src/lib/services/orchestration-runner.ts
+
+# V-034: Claude Helper only called for 3 cases
+grep -r "claudeHelper\|claude-helper" packages/dashboard/src/lib/services/ --include="*.ts" -l
+
+# V-042: No hardcoded empty questions array
+grep -n "decisionQuestions = \[\]" packages/dashboard/src/
+
+# V-050: Atomic writes exist
+grep -n "\.tmp\|rename" packages/dashboard/src/lib/services/orchestration-service.ts
+```
+
+---
+
+## Notes
+
+- All V-### items must be checked before `/flow.merge`
+- Items that fail should be fixed or deferred with `specflow phase defer "reason"`
+- Use `specflow mark V-### --blocked "reason"` for items that cannot be verified
+- USER GATE items require manual testing by the user
diff --git a/.specify/archive/1057-orchestration-simplification/plan.md b/.specify/archive/1057-orchestration-simplification/plan.md
new file mode 100644
index 0000000..afddf05
--- /dev/null
+++ b/.specify/archive/1057-orchestration-simplification/plan.md
@@ -0,0 +1,1698 @@
+# Orchestration Simplification Plan
+
+## Problem Statement
+
+The dashboard orchestration-runner (1,412 lines) reimplements /flow.orchestrate logic poorly:
+
+1. `isPhaseComplete()` checks artifacts instead of trusting `step.status`
+2. Question flow is broken (watcher detects questions but data never reaches UI - needs verification)
+3. No recovery path when things go wrong
+4. 2,343 lines of redundant code between runner and service
+5. Race conditions in workflow spawning and state file access
+6. Batch handling logic scattered and incomplete
+7. No detection of sessions started/resumed from external Claude CLI
+8. Dashboard and CLI should work identically - terminal is just manual orchestration
+
+## The Fix
+
+Trust the state file. Sub-commands set `step.status=complete` when done. The runner just:
+1. Reads state (with atomic file access)
+2. Validates state consistency
+3. Spawns workflows (with spawn intent pattern to prevent races)
+4. Transitions when `step.status=complete`
+5. Uses Claude Helper for exactly 3 recovery scenarios
+6. Tracks ALL session activity (dashboard workflows, omnibox commands, external CLI)
+
+## Key Alignment Decisions
+
+| Topic | Decision |
+|-------|----------|
+| Auto-merge | Fully automatic when `autoMerge=true` (no confirmation prompt) |
+| Question flow | Needs testing to verify watcher detection works |
+| Claude Helper failures | Silent fallback (don't clutter UI with failure details) |
+| Race fixes | Must-have for this phase |
+| Stale threshold | 10 minutes fixed |
+| Batch pause/resume | Existing pause→play button, also omnibox resume |
+| Code size | Focus on simplicity, not line count |
+| External CLI | Watch `~/.claude/projects/{hash}/` for JSONL creation AND modification |
+| Decision log | Wire up correctly in UI, make improvements if needed |
+| Testing | Both unit tests AND integration tests |
+| Features | Keep cost tracking, heal attempts - improve implementation, don't neuter |
+
+---
+
+## State Files Overview
+
+There are TWO state files that must stay consistent:
+
+| File | Schema | Purpose |
+|------|--------|---------|
+| `.specflow/orchestration-state.json` | `OrchestrationStateSchema` | Project-level: phase, step, progress |
+| `.specflow/workflows/orchestration-{id}.json` | `OrchestrationExecutionSchema` | Per-run: batches, costs, decision log |
+
+**Invariants that must hold:**
+- `step.index === STEP_INDEX_MAP[step.current]`
+- `OrchestrationState.phase.number === OrchestrationExecution.currentPhase` (when linked)
+- `batches.current < batches.total` (unless all complete)
+- `recoveryContext` must exist when `status === 'needs_attention'`
+
+---
+
+## Core Decision Loop
+
+```typescript
+async function runOrchestrationLoop(orchestrationId: string, projectId: string) {
+  // Persist runner state to survive dashboard restarts
+  await persistRunnerState(orchestrationId, { startedAt: Date.now(), pid: process.pid });
+
+  while (true) {
+    // ═══════════════════════════════════════════════════════════════════
+    // 1. READ STATE (with atomic access)
+    // ═══════════════════════════════════════════════════════════════════
+    let state: OrchestrationState;
+    try {
+      state = await readOrchestrationState(projectPath); // Uses file locking
+    } catch (error) {
+      // CORRUPT/MISSING STATE: Use Claude Helper to rebuild
+      await createStateBackup(projectPath); // .bak before any recovery
+      state = await recoverStateWithClaudeHelper(projectPath, error);
+      if (!state) {
+        await setOrchestrationStatus('failed', 'Could not recover state');
+        break;
+      }
+    }
+
+    const { step, phase } = state.orchestration;
+    const execution = await readOrchestrationExecution(orchestrationId);
+
+    // ═══════════════════════════════════════════════════════════════════
+    // 2. PRE-DECISION GATES (checked before decision matrix)
+    // ═══════════════════════════════════════════════════════════════════
+
+    // Budget gate
+    if (execution.totalCostUsd >= execution.config.budget.maxTotal) {
+      await setOrchestrationStatus('failed', `Budget exceeded: $${execution.totalCostUsd.toFixed(2)}`);
+      break;
+    }
+
+    // Duration gate (4 hour max)
+    const duration = Date.now() - new Date(execution.startedAt).getTime();
+    if (duration > MAX_ORCHESTRATION_DURATION_MS) {
+      await setOrchestrationStatus('needs_attention', 'Orchestration running too long');
+      break;
+    }
+
+    // ═══════════════════════════════════════════════════════════════════
+    // 3. VALIDATE STATE CONSISTENCY
+    // ═══════════════════════════════════════════════════════════════════
+    const validation = validateState(state, execution);
+    if (!validation.valid) {
+      const fixed = await fixStateWithClaudeHelper(projectPath, state, validation.issues);
+      if (!fixed) {
+        await setOrchestrationStatus('needs_attention', validation.issues.join(', '));
+        await sleep(POLL_INTERVAL);
+        continue;
+      }
+      state = fixed;
+    }
+
+    // ═══════════════════════════════════════════════════════════════════
+    // 4. CHECK TERMINAL CONDITIONS
+    // ═══════════════════════════════════════════════════════════════════
+    if (execution.status === 'completed') break;
+    if (execution.status === 'cancelled') break;
+    if (execution.status === 'paused') {
+      await sleep(POLL_INTERVAL);
+      continue;
+    }
+
+    // ═══════════════════════════════════════════════════════════════════
+    // 5. MAKE DECISION (complete matrix, no ambiguity)
+    // ═══════════════════════════════════════════════════════════════════
+    const decision = makeDecision(step, phase, execution);
+
+    // ═══════════════════════════════════════════════════════════════════
+    // 6. EXECUTE DECISION
+    // ═══════════════════════════════════════════════════════════════════
+    await executeDecision(decision, orchestrationId, projectId);
+
+    // ═══════════════════════════════════════════════════════════════════
+    // 7. WAIT FOR EVENT OR TIMEOUT
+    // ═══════════════════════════════════════════════════════════════════
+    await waitForEventOrTimeout(orchestrationId, POLL_INTERVAL);
+  }
+
+  // Cleanup runner state
+  await clearRunnerState(orchestrationId);
+}
+```
+
+---
+
+## Decision Matrix
+
+This is the COMPLETE decision logic. Every possible state combination has an explicit action.
+
+```typescript
+const STEP_INDEX_MAP = { design: 0, analyze: 1, implement: 2, verify: 3, merge: 4 };
+const STALE_THRESHOLD_MS = 10 * 60 * 1000; // 10 minutes (increased from 5)
+
+function makeDecision(step: Step, phase: Phase, execution: OrchestrationExecution): Decision {
+  const { current, status } = step;
+  const workflow = getActiveWorkflow(execution);
+  const config = execution.config;
+
+  // ═══════════════════════════════════════════════════════════════════
+  // IMPLEMENT PHASE: BATCH HANDLING (checked first)
+  // ═══════════════════════════════════════════════════════════════════
+  if (current === 'implement') {
+    const batchDecision = handleImplementBatching(step, execution, workflow);
+    if (batchDecision) return batchDecision;
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW IS RUNNING
+  // ═══════════════════════════════════════════════════════════════════
+  if (workflow?.status === 'running') {
+    const lastActivity = getLastFileChangeTime(projectPath);
+    const staleDuration = Date.now() - lastActivity;
+
+    if (staleDuration > STALE_THRESHOLD_MS) {
+      return {
+        action: 'recover_stale',
+        reason: `No activity for ${Math.round(staleDuration / 60000)} minutes`,
+        workflowId: workflow.id
+      };
+    }
+
+    return { action: 'wait', reason: 'Workflow running' };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW NEEDS INPUT
+  // ═══════════════════════════════════════════════════════════════════
+  if (workflow?.status === 'waiting_for_input') {
+    return { action: 'wait', reason: 'Waiting for user input' };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW ID EXISTS BUT LOOKUP FAILS
+  // ═══════════════════════════════════════════════════════════════════
+  if (execution.executions[current] && !workflow) {
+    // Workflow ID in state but can't find workflow - wait with backoff
+    return {
+      action: 'wait_with_backoff',
+      reason: `Workflow ${execution.executions[current]} lookup failed, waiting...`,
+      backoffMs: calculateExponentialBackoff(execution.lookupFailures || 0)
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // STEP IS COMPLETE - DETERMINE NEXT ACTION
+  // ═══════════════════════════════════════════════════════════════════
+  if (status === 'complete') {
+    const nextStep = getNextStep(current);
+
+    // All steps done (after merge completes)
+    if (nextStep === null) {
+      return { action: 'complete', reason: 'All steps finished' };
+    }
+
+    // Verify complete → check USER_GATE before merge
+    if (current === 'verify' && nextStep === 'merge') {
+      // USER_GATE requires explicit confirmation
+      if (phase.hasUserGate && phase.userGateStatus !== 'confirmed') {
+        return { action: 'wait_user_gate', reason: 'USER_GATE requires confirmation' };
+      }
+      // autoMerge disabled → wait for user to trigger
+      if (!config.autoMerge) {
+        return { action: 'wait_merge', reason: 'Auto-merge disabled, waiting for user' };
+      }
+      // autoMerge enabled → transition to merge step
+      return {
+        action: 'transition',
+        nextStep: 'merge',
+        nextIndex: STEP_INDEX_MAP.merge,
+        reason: 'Verify complete, auto-merge enabled'
+      };
+    }
+
+    // Normal step transition
+    return {
+      action: 'transition',
+      nextStep,
+      nextIndex: STEP_INDEX_MAP[nextStep],
+      reason: `${current} complete, advancing to ${nextStep}`
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // STEP FAILED OR BLOCKED
+  // ═══════════════════════════════════════════════════════════════════
+  if (status === 'failed' || status === 'blocked') {
+    return {
+      action: 'recover_failed',
+      reason: `Step ${current} is ${status}`,
+      error: step.error
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // STEP IN PROGRESS BUT NO WORKFLOW
+  // ═══════════════════════════════════════════════════════════════════
+  if (status === 'in_progress' && !workflow) {
+    return { action: 'spawn', skill: getSkillForStep(current) };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // STEP NOT STARTED - SPAWN WORKFLOW
+  // ═══════════════════════════════════════════════════════════════════
+  if (status === 'not_started' || status === null || status === undefined) {
+    // Initialize batches when entering implement
+    if (current === 'implement' && execution.batches.total === 0) {
+      return { action: 'initialize_batches', reason: 'Entering implement, need to populate batches' };
+    }
+    return { action: 'spawn', skill: getSkillForStep(current) };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // UNKNOWN STATUS - BUG, USE CLAUDE HELPER
+  // ═══════════════════════════════════════════════════════════════════
+  console.error(`Unknown step.status: ${status}`);
+  return {
+    action: 'recover_unknown',
+    reason: `Unknown status: ${status}`
+  };
+}
+```
+
+---
+
+## Implement Phase: Batch Handling
+
+Batching has its own state machine within the implement phase:
+
+```typescript
+function handleImplementBatching(
+  step: Step,
+  execution: OrchestrationExecution,
+  workflow: Workflow | null
+): Decision | null {
+  const { batches, config } = execution;
+
+  // No batches yet - need to initialize
+  if (batches.total === 0) {
+    return { action: 'initialize_batches', reason: 'No batches populated' };
+  }
+
+  const currentBatch = batches.items[batches.current];
+  const allBatchesComplete = batches.items.every(
+    b => b.status === 'completed' || b.status === 'healed'
+  );
+
+  // All batches done → step is complete
+  if (allBatchesComplete) {
+    // Trust sub-command to set step.status=complete
+    // But if it didn't, force it
+    if (step.status !== 'complete') {
+      return { action: 'force_step_complete', reason: 'All batches complete but step.status not updated' };
+    }
+    return null; // Let normal decision matrix handle transition
+  }
+
+  // Current batch running with active workflow → wait
+  if (currentBatch?.status === 'running' && workflow?.status === 'running') {
+    return null; // Let normal staleness check handle this
+  }
+
+  // Current batch completed → advance to next batch
+  if (currentBatch?.status === 'completed' || currentBatch?.status === 'healed') {
+    // Check pauseBetweenBatches config
+    if (config.pauseBetweenBatches) {
+      return { action: 'pause', reason: 'Batch complete, pauseBetweenBatches enabled' };
+    }
+
+    const nextBatchIndex = batches.current + 1;
+    if (nextBatchIndex < batches.total) {
+      return {
+        action: 'advance_batch',
+        batchIndex: nextBatchIndex,
+        reason: `Batch ${batches.current} complete, advancing to batch ${nextBatchIndex}`
+      };
+    }
+  }
+
+  // Current batch pending + no workflow → spawn batch
+  if (currentBatch?.status === 'pending' && !workflow) {
+    return {
+      action: 'spawn_batch',
+      batch: currentBatch,
+      skill: 'flow.implement',
+      context: `Execute tasks ${currentBatch.taskIds.join(', ')} in section "${currentBatch.section}"`
+    };
+  }
+
+  // Current batch failed → try healing
+  if (currentBatch?.status === 'failed') {
+    if (config.autoHealEnabled && currentBatch.healAttempts < config.maxHealAttempts) {
+      return { action: 'heal_batch', batchIndex: batches.current, reason: 'Batch failed, attempting heal' };
+    }
+    return {
+      action: 'recover_failed',
+      reason: `Batch ${batches.current} failed after ${currentBatch.healAttempts} heal attempts`,
+      error: currentBatch.error
+    };
+  }
+
+  return null; // No batch-specific decision, use normal matrix
+}
+```
+
+---
+
+## Execute Decision
+
+Each decision action has a specific handler:
+
+```typescript
+async function executeDecision(decision: Decision, orchestrationId: string, projectId: string) {
+  // Log every decision for debugging
+  await logDecision(orchestrationId, decision);
+
+  switch (decision.action) {
+    case 'wait':
+      // Do nothing, loop will sleep
+      break;
+
+    case 'wait_with_backoff':
+      await incrementLookupFailures(orchestrationId);
+      await sleep(decision.backoffMs);
+      break;
+
+    case 'transition':
+      await transitionToStep(decision.nextStep, decision.nextIndex);
+      await spawnWorkflowWithIntent(getSkillForStep(decision.nextStep)); // Atomic spawn
+      break;
+
+    case 'spawn':
+      await spawnWorkflowWithIntent(decision.skill); // Uses spawn intent pattern
+      break;
+
+    case 'spawn_batch':
+      await linkBatchToWorkflow(decision.batch.index);
+      await spawnWorkflowWithIntent(decision.skill, decision.context);
+      break;
+
+    case 'advance_batch':
+      await advanceBatchIndex(decision.batchIndex);
+      // Next iteration will spawn the batch
+      break;
+
+    case 'initialize_batches':
+      const batches = parseBatchesFromProject(projectPath, config.batchSizeFallback);
+      await setBatches(orchestrationId, batches);
+      break;
+
+    case 'force_step_complete':
+      await setStepStatus('complete');
+      break;
+
+    case 'heal_batch':
+      await incrementBatchHealAttempts(decision.batchIndex);
+      await spawnHealerWorkflow(decision.batchIndex);
+      break;
+
+    case 'pause':
+      await setOrchestrationStatus('paused');
+      break;
+
+    case 'wait_merge':
+      await setOrchestrationStatus('waiting_merge');
+      break;
+
+    case 'wait_user_gate':
+      await setOrchestrationStatus('waiting_user_gate');
+      break;
+
+    case 'complete':
+      await setOrchestrationStatus('completed');
+      break;
+
+    case 'recover_stale':
+      await handleStaleWorkflow(decision.workflowId);
+      break;
+
+    case 'recover_failed':
+      await handleFailedStep(decision.error);
+      break;
+
+    case 'recover_unknown':
+      await handleUnknownState(decision.reason);
+      break;
+  }
+}
+```
+
+---
+
+## Atomic Workflow Spawning
+
+Prevent race conditions with spawn intent pattern:
+
+```typescript
+async function spawnWorkflowWithIntent(skill: string, context?: string): Promise<void> {
+  const intentKey = `spawn_intent_${orchestrationId}`;
+
+  // 1. Check if spawn already in progress
+  const existingIntent = await getSpawnIntent(intentKey);
+  if (existingIntent && Date.now() - existingIntent.timestamp < 30000) {
+    console.log('Spawn already in progress, skipping');
+    return;
+  }
+
+  // 2. Check if workflow already active
+  if (workflowService.hasActiveWorkflow(projectId, orchestrationId)) {
+    console.log('Workflow already active, skipping spawn');
+    return;
+  }
+
+  // 3. Write spawn intent BEFORE spawning
+  await setSpawnIntent(intentKey, { skill, timestamp: Date.now() });
+
+  try {
+    // 4. Actually spawn
+    await workflowService.start({ projectId, skill, orchestrationId, context });
+  } finally {
+    // 5. Clear intent regardless of success/failure
+    await clearSpawnIntent(intentKey);
+  }
+}
+```
+
+---
+
+## Claude Helper: Specific Use Cases
+
+Claude Helper is used for THREE specific scenarios only. Each has a defined contract and fallback.
+
+### 1. Recover Corrupt/Missing State File
+
+**When**: `readOrchestrationState()` throws an error
+
+**Fallback Chain**:
+1. Try Claude Helper → if success + confidence > 0.7 → use recovered state
+2. If Claude Helper fails → try heuristic recovery (read ROADMAP.md, git branch)
+3. If heuristic fails → return null → escalate to `needs_attention`
+
+**Always**: Create `.bak` backup BEFORE any recovery attempt
+
+```typescript
+async function recoverStateWithClaudeHelper(projectPath: string, error: Error): Promise<OrchestrationState | null> {
+  // Always backup first
+  await createStateBackup(projectPath);
+
+  const availableFiles = await scanProjectFiles(projectPath);
+
+  try {
+    const result = await claudeHelper.ask({
+      task: 'recover_state',
+      context: { projectPath, error: error.message, availableFiles },
+      model: 'sonnet',
+      tools: ['Read', 'Grep', 'Glob'],
+      maxTurns: 5,
+      maxBudgetUsd: 1.0,
+      responseSchema: RecoverStateResponseSchema,
+    });
+
+    if (result.recoverable && result.confidence > 0.7) {
+      await writeOrchestrationState(result.state);
+      logDecision('state_recovered', { confidence: result.confidence, reasoning: result.reasoning });
+      return result.state;
+    }
+
+    logDecision('state_low_confidence', { confidence: result.confidence, reasoning: result.reasoning });
+  } catch (e) {
+    console.error('Claude Helper failed for state recovery:', e);
+  }
+
+  // FALLBACK: Heuristic recovery
+  const heuristicState = await tryHeuristicStateRecovery(projectPath);
+  if (heuristicState) {
+    logDecision('state_heuristic_recovered', { method: 'roadmap_git_branch' });
+    return heuristicState;
+  }
+
+  return null; // Caller will escalate to needs_attention
+}
+```
+
+### 2. Recover Stale Workflow
+
+**When**: Workflow `status === 'running'` but no file changes for > 10 minutes
+
+**Fallback**: If Claude Helper fails → conservative action: `needs_attention`
+
+```typescript
+async function handleStaleWorkflow(workflowId: string) {
+  const workflow = await getWorkflow(workflowId);
+  const lastMessages = await getLastSessionMessages(workflow.sessionId, 10);
+  const staleDuration = Date.now() - new Date(workflow.lastActivityAt).getTime();
+
+  try {
+    const result = await claudeHelper.ask({
+      task: 'diagnose_stale_workflow',
+      context: {
+        workflowId,
+        sessionId: workflow.sessionId,
+        lastActivity: workflow.lastActivityAt,
+        staleDuration,
+        lastMessages,
+        currentStep: orchestration.step.current,
+        currentTask: orchestration.implement?.currentTask
+      },
+      model: 'haiku', // Quick decision
+      tools: ['Read'],
+      maxTurns: 3,
+      maxBudgetUsd: 0.5,
+      responseSchema: DiagnoseStaleResponseSchema,
+    });
+
+    switch (result.action) {
+      case 'continue':
+        logDecision('stale_false_alarm', { reasoning: result.reasoning });
+        break;
+
+      case 'restart_task':
+        await killWorkflow(workflowId);
+        await spawnWorkflowWithIntent('flow.implement');
+        logDecision('stale_restart', { reasoning: result.reasoning });
+        break;
+
+      case 'skip_task':
+        await killWorkflow(workflowId);
+        await markTaskBlocked(orchestration.implement.currentTask, result.blockReason);
+        await spawnWorkflowWithIntent('flow.implement');
+        logDecision('stale_skip', { task: orchestration.implement.currentTask, reason: result.blockReason });
+        break;
+
+      case 'abort':
+        await killWorkflow(workflowId);
+        await setOrchestrationStatus('needs_attention', result.reasoning);
+        logDecision('stale_abort', { reasoning: result.reasoning });
+        break;
+    }
+  } catch (e) {
+    console.error('Claude Helper failed for stale diagnosis:', e);
+    // FALLBACK: Conservative - notify user
+    await setOrchestrationStatus('needs_attention',
+      `Workflow appears stale for ${Math.round(staleDuration / 60000)} minutes - diagnosis failed`);
+  }
+}
+```
+
+### 3. Recover Failed Step
+
+**When**: `step.status === 'failed'` or `step.status === 'blocked'`
+
+**Pre-check**: If max heal attempts reached, skip Claude Helper and go straight to `needs_attention`
+
+**Fallback**: If Claude Helper fails → simple retry if within limits → else `needs_attention`
+
+```typescript
+async function handleFailedStep(error: string) {
+  const step = orchestration.step;
+
+  // Pre-check: Max attempts already reached?
+  if (execution.healAttempts >= execution.config.maxHealAttempts) {
+    await setOrchestrationStatus('needs_attention', `Max heal attempts (${execution.config.maxHealAttempts}) reached`);
+    return;
+  }
+
+  const workflow = getLastWorkflowForStep(step.current);
+
+  try {
+    const result = await claudeHelper.ask({
+      task: 'diagnose_failed_step',
+      context: {
+        step: step.current,
+        status: step.status,
+        error,
+        lastWorkflowOutput: workflow?.output,
+        failedTasks: execution.implement?.failedTasks || [],
+        passedTasks: execution.implement?.passedTasks || [],
+        healAttempts: execution.healAttempts || 0,
+        maxHealAttempts: execution.config.maxHealAttempts
+      },
+      model: 'sonnet',
+      tools: ['Read', 'Grep', 'Glob'],
+      maxTurns: 5,
+      maxBudgetUsd: 1.0,
+      responseSchema: DiagnoseFailedResponseSchema,
+    });
+
+    switch (result.action) {
+      case 'retry':
+        await incrementHealAttempts();
+        await setStepStatus('in_progress');
+        await spawnWorkflowWithIntent(getSkillForStep(step.current));
+        logDecision('failed_retry', { attempt: execution.healAttempts + 1, reasoning: result.reasoning });
+        break;
+
+      case 'skip_tasks':
+        for (const taskId of result.tasksToSkip || []) {
+          await markTaskBlocked(taskId, result.reasoning);
+        }
+        await setStepStatus('in_progress');
+        await spawnWorkflowWithIntent('flow.implement');
+        logDecision('failed_skip_tasks', { tasks: result.tasksToSkip, reasoning: result.reasoning });
+        break;
+
+      case 'run_prerequisite':
+        await transitionToStep(result.prerequisiteStep, STEP_INDEX_MAP[result.prerequisiteStep]);
+        await spawnWorkflowWithIntent(getSkillForStep(result.prerequisiteStep));
+        logDecision('failed_prerequisite', { step: result.prerequisiteStep, reasoning: result.reasoning });
+        break;
+
+      case 'abort':
+        await setOrchestrationStatus('needs_attention', result.reasoning);
+        logDecision('failed_abort', { reasoning: result.reasoning });
+        break;
+    }
+  } catch (e) {
+    console.error('Claude Helper failed for failure diagnosis:', e);
+    // FALLBACK: Simple retry if within limits
+    if (execution.healAttempts < execution.config.maxHealAttempts) {
+      await incrementHealAttempts();
+      await setStepStatus('in_progress');
+      await spawnWorkflowWithIntent(getSkillForStep(step.current));
+      logDecision('failed_fallback_retry', { reason: 'Claude Helper unavailable, attempting simple retry' });
+    } else {
+      await setOrchestrationStatus('needs_attention', error);
+    }
+  }
+}
+```
+
+---
+
+## Question Flow (Fixed)
+
+### The Problem
+
+The watcher CORRECTLY detects questions from JSONL. The SSE event is broadcast. But:
+1. `use-sse.ts` receives `session:question` and DROPS IT (does nothing)
+2. `page.tsx` has hardcoded `decisionQuestions = []`
+
+### The Fix (Data Plumbing)
+
+**use-sse.ts** - Add state and handler:
+```typescript
+// Add to hook state
+const [sessionQuestions, setSessionQuestions] = useState<Map<string, SessionQuestion[]>>(new Map());
+
+// In event handler switch:
+case 'session:question':
+  setSessionQuestions((prev) => {
+    const next = new Map(prev);
+    next.set(data.sessionId, data.data.questions);
+    return next;
+  });
+  break;
+
+// Return in hook result
+return { ..., sessionQuestions };
+```
+
+**unified-data-context.tsx** - Export questions:
+```typescript
+// Add to context value
+<UnifiedDataContext.Provider value={{ ..., sessionQuestions }}>
+```
+
+**page.tsx** - Replace hardcoded array:
+```typescript
+// Before (BROKEN):
+const decisionQuestions = useMemo(() => {
+  return [] as Array<...>  // HARDCODED EMPTY
+}, []);
+
+// After (FIXED):
+const { sessionQuestions } = useUnifiedData();
+const decisionQuestions = useMemo(() => {
+  if (!consoleSessionId) return [];
+  return sessionQuestions.get(consoleSessionId) ?? [];
+}, [consoleSessionId, sessionQuestions]);
+
+// Clear questions after answer
+async function handleDecisionAnswer(answers: Record<string, string>) {
+  await submitAnswers(workflowId, answers);
+  setSessionQuestions((prev) => {
+    const next = new Map(prev);
+    next.delete(consoleSessionId);
+    return next;
+  });
+}
+```
+
+---
+
+## State Validation
+
+Validate BOTH state files and their consistency:
+
+```typescript
+const STEP_INDEX_MAP = { design: 0, analyze: 1, implement: 2, verify: 3, merge: 4 };
+const VALID_STEPS = ['design', 'analyze', 'implement', 'verify', 'merge'];
+const VALID_STATUSES = ['not_started', 'pending', 'in_progress', 'complete', 'failed', 'blocked', 'skipped'];
+
+function validateState(state: OrchestrationState, execution: OrchestrationExecution): ValidationResult {
+  const issues: string[] = [];
+
+  // ═══════════════════════════════════════════════════════════════════
+  // ORCHESTRATION STATE VALIDATION
+  // ═══════════════════════════════════════════════════════════════════
+
+  // Check phase exists
+  if (!state.orchestration?.phase?.number) {
+    issues.push('No active phase');
+  }
+
+  // Check step is valid
+  const stepCurrent = state.orchestration?.step?.current;
+  if (stepCurrent && !VALID_STEPS.includes(stepCurrent)) {
+    issues.push(`Invalid step: ${stepCurrent}`);
+  }
+
+  // Check status is valid
+  const stepStatus = state.orchestration?.step?.status;
+  if (stepStatus && !VALID_STATUSES.includes(stepStatus)) {
+    issues.push(`Invalid status: ${stepStatus}`);
+  }
+
+  // Check step.index matches step.current
+  const expectedIndex = STEP_INDEX_MAP[stepCurrent];
+  const actualIndex = state.orchestration?.step?.index;
+  if (expectedIndex !== undefined && actualIndex !== expectedIndex) {
+    issues.push(`Step index mismatch: ${stepCurrent} should be ${expectedIndex}, got ${actualIndex}`);
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // EXECUTION STATE VALIDATION
+  // ═══════════════════════════════════════════════════════════════════
+
+  // Check batch indices
+  execution.batches.items.forEach((batch, index) => {
+    if (batch.index !== index) {
+      issues.push(`Batch index mismatch: position ${index} has index ${batch.index}`);
+    }
+  });
+
+  // Check batches.current is valid
+  if (execution.batches.current >= execution.batches.total && execution.batches.total > 0) {
+    issues.push(`Batch current (${execution.batches.current}) >= total (${execution.batches.total})`);
+  }
+
+  // Check recovery context when needed
+  if (execution.status === 'needs_attention' && !execution.recoveryContext) {
+    issues.push('needs_attention status requires recoveryContext');
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // CROSS-FILE CONSISTENCY
+  // ═══════════════════════════════════════════════════════════════════
+
+  // Phase alignment (when execution is linked)
+  if (state.orchestration?.phase?.number && execution.currentPhase) {
+    const statePhase = state.orchestration.phase.number;
+    const execPhase = execution.currentPhase;
+    // Note: execution.currentPhase is the step name, not phase number
+    // This check ensures we're on the same step
+    if (stepCurrent && stepCurrent !== execPhase && execPhase !== 'complete') {
+      issues.push(`Step mismatch: state has ${stepCurrent}, execution has ${execPhase}`);
+    }
+  }
+
+  return {
+    valid: issues.length === 0,
+    issues
+  };
+}
+```
+
+---
+
+## Race Condition Mitigations
+
+### 1. Atomic State File Writes
+
+```typescript
+async function writeOrchestrationState(state: OrchestrationState): Promise<void> {
+  const statePath = join(projectPath, '.specflow/orchestration-state.json');
+  const tempPath = `${statePath}.tmp.${Date.now()}`;
+
+  // Write to temp file
+  await writeFile(tempPath, JSON.stringify(state, null, 2));
+
+  // Atomic rename
+  await rename(tempPath, statePath);
+}
+```
+
+### 2. Spawn Intent Pattern
+
+See `spawnWorkflowWithIntent()` above.
+
+### 3. Persistent Runner State
+
+```typescript
+interface RunnerState {
+  orchestrationId: string;
+  pid: number;
+  startedAt: number;
+}
+
+async function persistRunnerState(orchestrationId: string, state: RunnerState): Promise<void> {
+  const runnerPath = join(projectPath, `.specflow/runner-${orchestrationId}.json`);
+  await writeFile(runnerPath, JSON.stringify(state));
+}
+
+// On dashboard startup, check for orphaned runners
+async function reconcileRunners(): Promise<void> {
+  const runnerFiles = await glob('.specflow/runner-*.json', { cwd: projectPath });
+  for (const file of runnerFiles) {
+    const state = JSON.parse(await readFile(file, 'utf-8'));
+    if (!isPidAlive(state.pid)) {
+      // Runner died, clean up
+      await unlink(file);
+      // Optionally restart orchestration
+    }
+  }
+}
+```
+
+### 4. Fix Event Sleep Callback Bug
+
+```typescript
+// Current (broken): Overwrites previous callback
+const eventSignals = new Map<string, () => void>();
+
+// Fixed: Use array of callbacks
+const eventSignals = new Map<string, Set<() => void>>();
+
+function eventDrivenSleep(ms: number, orchestrationId: string): Promise<void> {
+  return new Promise((resolve) => {
+    const timeout = setTimeout(resolve, ms);
+
+    const cleanup = () => {
+      clearTimeout(timeout);
+      resolve();
+    };
+
+    // Add to set instead of replacing
+    if (!eventSignals.has(orchestrationId)) {
+      eventSignals.set(orchestrationId, new Set());
+    }
+    eventSignals.get(orchestrationId)!.add(cleanup);
+  });
+}
+
+function wakeUp(orchestrationId: string): void {
+  const callbacks = eventSignals.get(orchestrationId);
+  if (callbacks) {
+    callbacks.forEach(cb => cb());
+    callbacks.clear();
+  }
+}
+```
+
+---
+
+## Unified Session Tracking
+
+The dashboard and CLI should work identically. Terminal is just the manual version of dashboard automation.
+
+### What to Watch
+
+Watch `~/.claude/projects/{project-hash}/` for:
+1. **New JSONL files created** - User started a new session from CLI
+2. **Existing JSONL files modified** - User resumed/continued a session
+
+### Detection Requirements
+
+```typescript
+// Session activity sources to track:
+type SessionActivitySource =
+  | 'dashboard_workflow'     // Started via dashboard workflow API
+  | 'dashboard_omnibox'      // User typed in omnibox on session viewer
+  | 'external_cli_new'       // User started new session from terminal
+  | 'external_cli_resume';   // User resumed session from terminal
+
+// All sources should update orchestration's view of session state
+```
+
+### Integration with Orchestration
+
+When orchestration is running:
+1. If user interacts with session via omnibox → orchestration sees activity, updates lastActivity
+2. If user resumes session from CLI terminal → orchestration detects JSONL changes, knows session is active
+3. Pause button → Play button when paused → resume via click OR omnibox command
+
+### Implementation Approach
+
+```typescript
+// In watcher.ts or new session-watcher.ts
+function watchProjectSessions(projectPath: string) {
+  const claudeProjectsDir = join(homedir(), '.claude/projects');
+  const projectHash = getProjectHash(projectPath);
+  const sessionDir = join(claudeProjectsDir, projectHash);
+
+  // Watch for new files (new sessions) and modifications (activity)
+  const watcher = chokidar.watch(sessionDir, {
+    ignored: /^\./,
+    persistent: true,
+    ignoreInitial: true,
+    awaitWriteFinish: { stabilityThreshold: 500 }
+  });
+
+  watcher.on('add', (filePath) => {
+    if (filePath.endsWith('.jsonl')) {
+      // New session started externally
+      broadcast({ type: 'session:created', sessionId: extractSessionId(filePath) });
+    }
+  });
+
+  watcher.on('change', (filePath) => {
+    if (filePath.endsWith('.jsonl')) {
+      // Session activity detected
+      broadcast({ type: 'session:activity', sessionId: extractSessionId(filePath) });
+    }
+  });
+}
+```
+
+---
+
+## Files to Modify
+
+| File | Changes |
+|------|---------|
+| `orchestration-runner.ts` | Rewrite with complete decision matrix, atomic spawning, batch handling |
+| `orchestration-service.ts` | Thin to persistence only, remove duplicate logic |
+| `watcher.ts` | Add project session watching for external CLI detection |
+| `use-sse.ts` | Add `sessionQuestions` state, handle `session:question` event |
+| `unified-data-context.tsx` | Export `sessionQuestions` from context |
+| `page.tsx` | Replace hardcoded `[]` with context data, clear on answer |
+| `claude-helper.ts` | Add fallback chains (silent), backup before recovery |
+| `session-viewer-drawer.tsx` | Verify omnibox commands update orchestration state |
+
+---
+
+## Verifiable Goals Checklist
+
+Each item below is concrete and can be verified by an agent reading code, running tests, or checking behavior.
+
+---
+
+### G1. Decision Matrix (in `makeDecision()`)
+
+**Pre-decision gates:**
+- [ ] G1.1: Budget check exists before matrix - if `totalCostUsd >= budget.maxTotal` → return `{ action: 'fail' }`
+- [ ] G1.2: Duration check exists - if orchestration running > 4 hours → return `{ action: 'needs_attention' }`
+
+**Implement phase checked first:**
+- [ ] G1.3: If `step.current === 'implement'`, calls `handleImplementBatching()` before other checks
+
+**Workflow status checks:**
+- [ ] G1.4: `workflow.status === 'running'` + activity within 10min → returns `{ action: 'wait' }`
+- [ ] G1.5: `workflow.status === 'running'` + no activity for >10min → returns `{ action: 'recover_stale' }`
+- [ ] G1.6: `workflow.status === 'waiting_for_input'` → returns `{ action: 'wait' }`
+- [ ] G1.7: Workflow ID in state but `getWorkflow()` returns null → returns `{ action: 'wait_with_backoff' }`
+
+**Step complete transitions:**
+- [ ] G1.8: `step.status === 'complete'` + `current === 'verify'` + `phase.hasUserGate && userGateStatus !== 'confirmed'` → returns `{ action: 'wait_user_gate' }`
+- [ ] G1.9: `step.status === 'complete'` + `current === 'verify'` + `!config.autoMerge` → returns `{ action: 'wait_merge' }`
+- [ ] G1.10: `step.status === 'complete'` + `current === 'verify'` + `config.autoMerge` → returns `{ action: 'transition', nextStep: 'merge' }`
+- [ ] G1.11: `step.status === 'complete'` + `current === 'merge'` → returns `{ action: 'complete' }`
+- [ ] G1.12: `step.status === 'complete'` + other steps → returns `{ action: 'transition', nextStep: getNextStep(current) }`
+
+**Error states:**
+- [ ] G1.13: `step.status === 'failed'` → returns `{ action: 'recover_failed' }`
+- [ ] G1.14: `step.status === 'blocked'` → returns `{ action: 'recover_failed' }`
+
+**Spawn conditions:**
+- [ ] G1.15: `step.status === 'in_progress'` + no active workflow → returns `{ action: 'spawn' }`
+- [ ] G1.16: `step.status === 'not_started'` → returns `{ action: 'spawn' }` (with batch init if implement)
+- [ ] G1.17: `step.status === null/undefined` → returns `{ action: 'spawn' }`
+
+**No catch-all:**
+- [ ] G1.18: There is NO generic `else` or `default` case that handles "unknown" without logging an error
+
+---
+
+### G2. Batch State Machine (in `handleImplementBatching()`)
+
+- [ ] G2.1: `batches.total === 0` → returns `{ action: 'initialize_batches' }`
+- [ ] G2.2: All batches `status === 'completed' || 'healed'` + `step.status !== 'complete'` → returns `{ action: 'force_step_complete' }`
+- [ ] G2.3: All batches complete + `step.status === 'complete'` → returns `null` (let main matrix handle)
+- [ ] G2.4: `currentBatch.status === 'pending'` + no workflow → returns `{ action: 'spawn_batch' }`
+- [ ] G2.5: `currentBatch.status === 'running'` + workflow running → returns `null` (let staleness check handle)
+- [ ] G2.6: `currentBatch.status === 'completed'` + `config.pauseBetweenBatches` → returns `{ action: 'pause' }`
+- [ ] G2.7: `currentBatch.status === 'completed'` + `!pauseBetweenBatches` + more batches → returns `{ action: 'advance_batch' }`
+- [ ] G2.8: `currentBatch.status === 'healed'` + more batches → returns `{ action: 'advance_batch' }`
+- [ ] G2.9: `currentBatch.status === 'failed'` + `healAttempts < maxHealAttempts` → returns `{ action: 'heal_batch' }`
+- [ ] G2.10: `currentBatch.status === 'failed'` + `healAttempts >= maxHealAttempts` → returns `{ action: 'recover_failed' }`
+
+---
+
+### G3. Claude Helper (exactly 3 cases, silent fallbacks)
+
+**Case 1: Corrupt/Missing State**
+- [ ] G3.1: `recoverStateWithClaudeHelper()` function exists
+- [ ] G3.2: Creates `.bak` backup BEFORE attempting recovery
+- [ ] G3.3: Calls Claude Helper with `task: 'recover_state'`
+- [ ] G3.4: If Claude Helper succeeds + confidence > 0.7 → uses recovered state
+- [ ] G3.5: If Claude Helper fails → tries `tryHeuristicStateRecovery()` (silent, no UI notification)
+- [ ] G3.6: If heuristic fails → returns null (caller sets `needs_attention`)
+
+**Case 2: Stale Workflow**
+- [ ] G3.7: `handleStaleWorkflow()` function exists
+- [ ] G3.8: Calls Claude Helper with `task: 'diagnose_stale_workflow'`
+- [ ] G3.9: Handles response actions: `continue`, `restart_task`, `skip_task`, `abort`
+- [ ] G3.10: If Claude Helper fails → sets `needs_attention` (silent, no error toast)
+
+**Case 3: Failed Step**
+- [ ] G3.11: `handleFailedStep()` function exists
+- [ ] G3.12: Pre-checks `healAttempts >= maxHealAttempts` → skips Claude Helper, goes to `needs_attention`
+- [ ] G3.13: Calls Claude Helper with `task: 'diagnose_failed_step'`
+- [ ] G3.14: Handles response actions: `retry`, `skip_tasks`, `run_prerequisite`, `abort`
+- [ ] G3.15: If Claude Helper fails + heal attempts remaining → simple retry (silent)
+- [ ] G3.16: If Claude Helper fails + no attempts remaining → `needs_attention` (silent)
+
+**No other Claude Helper calls:**
+- [ ] G3.17: Grep codebase - Claude Helper is NOT called for any other scenarios
+
+---
+
+### G4. Question Flow (data plumbing)
+
+**Pre-verification:**
+- [ ] G4.1: Manual test confirms watcher.ts detects questions and emits `session:question` SSE event
+
+**use-sse.ts:**
+- [ ] G4.2: `sessionQuestions` state exists (type: `Map<string, SessionQuestion[]>`)
+- [ ] G4.3: `session:question` case in switch populates `sessionQuestions` map
+- [ ] G4.4: `sessionQuestions` is returned from hook
+
+**unified-data-context.tsx:**
+- [ ] G4.5: `sessionQuestions` is included in context value
+
+**page.tsx:**
+- [ ] G4.6: `decisionQuestions` is NOT hardcoded to `[]`
+- [ ] G4.7: `decisionQuestions` reads from `sessionQuestions.get(consoleSessionId)`
+- [ ] G4.8: After user answers, questions are cleared from map
+
+---
+
+### G5. Race Condition Mitigations
+
+**Atomic state writes:**
+- [ ] G5.1: `writeOrchestrationState()` writes to `.tmp` file first
+- [ ] G5.2: `writeOrchestrationState()` uses `rename()` for atomic swap
+
+**Spawn intent pattern:**
+- [ ] G5.3: `spawnWorkflowWithIntent()` function exists
+- [ ] G5.4: Checks for existing spawn intent before spawning
+- [ ] G5.5: Checks `hasActiveWorkflow()` before spawning
+- [ ] G5.6: Writes spawn intent to file/state BEFORE calling `workflowService.start()`
+- [ ] G5.7: Clears spawn intent in `finally` block (regardless of success/failure)
+
+**Persistent runner state:**
+- [ ] G5.8: `persistRunnerState()` writes `runner-{orchestrationId}.json` with PID and startedAt
+- [ ] G5.9: `clearRunnerState()` removes file when loop exits
+- [ ] G5.10: Dashboard startup calls `reconcileRunners()` to detect orphans
+
+**Event sleep fix:**
+- [ ] G5.11: `eventSignals` uses `Map<string, Set<() => void>>` (not single callback)
+- [ ] G5.12: `eventDrivenSleep()` adds callback to Set
+- [ ] G5.13: `wakeUp()` iterates Set and calls all callbacks
+
+---
+
+### G6. Unified Session Tracking
+
+**File watching:**
+- [ ] G6.1: Watches `~/.claude/projects/{hash}/` directory
+- [ ] G6.2: Detects new `.jsonl` files (new sessions from CLI)
+- [ ] G6.3: Detects modified `.jsonl` files (session activity from CLI)
+- [ ] G6.4: Emits `session:created` SSE event for new files
+- [ ] G6.5: Emits `session:activity` SSE event for modifications
+
+**Orchestration integration:**
+- [ ] G6.6: External session activity updates `lastActivity` in orchestration
+- [ ] G6.7: Omnibox commands in session viewer update orchestration state
+
+**Pause/Resume UI:**
+- [ ] G6.8: Pause button exists and sets `status: 'paused'`
+- [ ] G6.9: When paused, pause button becomes Play button
+- [ ] G6.10: Play button click resumes orchestration
+- [ ] G6.11: Omnibox command while paused resumes orchestration
+
+---
+
+### G7. State Validation
+
+- [ ] G7.1: `validateState()` checks `step.index === STEP_INDEX_MAP[step.current]`
+- [ ] G7.2: `validateState()` checks `step.current` is in `['design', 'analyze', 'implement', 'verify', 'merge']`
+- [ ] G7.3: `validateState()` checks `step.status` is in valid statuses
+- [ ] G7.4: `validateState()` checks `batches.items[i].index === i`
+- [ ] G7.5: `validateState()` checks `batches.current < batches.total` (unless all complete)
+- [ ] G7.6: `validateState()` checks `recoveryContext` exists when `status === 'needs_attention'`
+- [ ] G7.7: `validateState()` checks cross-file consistency (state step vs execution phase)
+
+---
+
+### G8. Decision Log UI
+
+- [ ] G8.1: `logDecision()` writes to `orchestration.decisionLog` array
+- [ ] G8.2: Phase Completion card reads from `decisionLog`
+- [ ] G8.3: New decision matrix decisions appear in UI
+- [ ] G8.4: Log entries include timestamp, action, and reason
+
+---
+
+### G9. Features Preserved
+
+**Cost tracking:**
+- [ ] G9.1: `addCost()` is called after workflow completes
+- [ ] G9.2: `totalCostUsd` accumulates across workflows
+- [ ] G9.3: Budget exceeded triggers `fail` action (from G1.1)
+
+**Heal attempts:**
+- [ ] G9.4: `healAttempts` counter exists in execution state
+- [ ] G9.5: `incrementHealAttempts()` is called before retry
+- [ ] G9.6: Max heal attempts check prevents infinite loops (from G3.12)
+- [ ] G9.7: Batch-level `healAttempts` tracked separately from step-level
+
+---
+
+### G10. Code Cleanup
+
+- [ ] G10.1: `isPhaseComplete()` artifact checks are REMOVED
+- [ ] G10.2: Duplicate `getNextPhase()` functions consolidated
+- [ ] G10.3: Duplicate `isStepComplete()` functions consolidated
+- [ ] G10.4: `orchestration-service.ts` contains only persistence logic (no decision logic)
+
+---
+
+### G11. Tests Exist
+
+**Unit tests:**
+- [ ] G11.1: Test for `makeDecision()` covers all G1.* conditions
+- [ ] G11.2: Test for `handleImplementBatching()` covers all G2.* conditions
+- [ ] G11.3: Test for `validateState()` covers all G7.* conditions
+- [ ] G11.4: Test for `spawnWorkflowWithIntent()` prevents duplicate spawns
+
+**Integration tests:**
+- [ ] G11.5: Happy path test: design → analyze → implement → verify → merge (autoMerge=true)
+- [ ] G11.6: Manual merge test: verify → wait_merge (autoMerge=false)
+- [ ] G11.7: USER_GATE test: verify → wait_user_gate → confirm → merge
+- [ ] G11.8: Question flow test: workflow asks → toast appears → answer → resumes
+- [ ] G11.9: Batch test: implement with multiple batches sequentially
+- [ ] G11.10: Pause/resume test: pause button → play button → resume
+- [ ] G11.11: External CLI test: start session from terminal → dashboard detects
+- [ ] G11.12: Race condition test: rapid spawn triggers → only one workflow
+
+---
+
+## Verification Commands
+
+Agents can verify goals using:
+
+```bash
+# G1-G2: Check decision matrix completeness
+grep -n "action:" orchestration-runner.ts | wc -l  # Should cover all cases
+
+# G3.17: Verify Claude Helper only called for 3 cases
+grep -r "claudeHelper" packages/dashboard/src/ --include="*.ts"
+
+# G4.6: Verify no hardcoded empty array
+grep -n "decisionQuestions = \[\]" packages/dashboard/src/
+
+# G5.1-G5.2: Verify atomic writes
+grep -n "\.tmp" orchestration-service.ts
+grep -n "rename" orchestration-service.ts
+
+# G10.1: Verify artifact checks removed
+grep -n "hasPlan\|hasTasks\|hasSpec" orchestration-runner.ts  # Should return nothing
+```
+
+---
+
+## Testing Infrastructure
+
+The current runner is hard to test because logic is intertwined with I/O. The simplification enables proper testing.
+
+### Pure Function Extraction
+
+Extract decision logic into pure functions with no side effects:
+
+```typescript
+// PURE FUNCTIONS (unit testable, no I/O)
+function makeDecision(
+  step: Step,
+  phase: Phase,
+  execution: OrchestrationExecution,
+  workflow: Workflow | null,
+  config: { staleDurationMs: number }
+): Decision
+
+function handleImplementBatching(
+  step: Step,
+  execution: OrchestrationExecution,
+  workflow: Workflow | null
+): Decision | null
+
+function validateState(
+  state: OrchestrationState,
+  execution: OrchestrationExecution
+): ValidationResult
+```
+
+### Dependency Injection
+
+The orchestration loop takes dependencies as parameters for easy mocking:
+
+```typescript
+interface OrchestrationDeps {
+  readState: () => Promise<OrchestrationState>;
+  readExecution: () => Promise<OrchestrationExecution>;
+  writeState: (state: OrchestrationState) => Promise<void>;
+  getWorkflow: (id: string) => Promise<Workflow | null>;
+  spawnWorkflow: (skill: string, context?: string) => Promise<string>;
+  killWorkflow: (id: string) => Promise<void>;
+  claudeHelper: {
+    recoverState: (error: Error) => Promise<OrchestrationState | null>;
+    diagnoseStale: (context: StaleContext) => Promise<StaleResponse>;
+    diagnoseFailed: (context: FailedContext) => Promise<FailedResponse>;
+  };
+  clock: { now: () => number };  // For testing time-based logic
+}
+
+async function runOrchestrationLoop(
+  orchestrationId: string,
+  projectPath: string,
+  deps: OrchestrationDeps
+) {
+  // Uses deps.* instead of direct imports
+}
+```
+
+### Test Project: ~/dev/test-app/
+
+Use existing test project with git tags for state reset:
+
+```bash
+# Setup tags for different test scenarios
+cd ~/dev/test-app
+
+# Tag: Clean slate - no orchestration state
+git tag test/clean-slate
+
+# Tag: Design phase complete
+git tag test/design-complete
+
+# Tag: Implement with 3 batches, batch 1 complete
+git tag test/implement-batch-1-done
+
+# Tag: Verify complete, USER_GATE pending
+git tag test/verify-user-gate
+
+# Tag: Corrupt state file
+git tag test/corrupt-state
+
+# Reset to a tag for testing
+git checkout test/design-complete
+git checkout -b test-run-$(date +%s)
+```
+
+### Unit Tests (Pure Functions)
+
+```typescript
+// packages/dashboard/tests/orchestration/decision-matrix.test.ts
+
+describe('makeDecision', () => {
+  // G1.4: workflow running + recent activity → wait
+  it('waits when workflow is running with recent activity', () => {
+    const step = { current: 'implement', status: 'in_progress', index: 2 };
+    const workflow = { status: 'running', lastActivityAt: Date.now() - 1000 };
+    const execution = createMockExecution();
+
+    const decision = makeDecision(step, mockPhase, execution, workflow, { staleDurationMs: 600000 });
+
+    expect(decision).toEqual({ action: 'wait', reason: 'Workflow running' });
+  });
+
+  // G1.5: workflow running + stale → recover_stale
+  it('recovers when workflow is stale for 10+ minutes', () => {
+    const step = { current: 'implement', status: 'in_progress', index: 2 };
+    const workflow = {
+      id: 'wf-123',
+      status: 'running',
+      lastActivityAt: Date.now() - 11 * 60 * 1000
+    };
+
+    const decision = makeDecision(step, mockPhase, execution, workflow, { staleDurationMs: 600000 });
+
+    expect(decision.action).toBe('recover_stale');
+    expect(decision.workflowId).toBe('wf-123');
+  });
+
+  // ... tests for all 18 G1.* items
+});
+
+describe('handleImplementBatching', () => {
+  // G2.1: no batches → initialize
+  it('initializes batches when total is 0', () => {
+    const execution = createMockExecution({ batches: { total: 0, current: 0, items: [] } });
+
+    const decision = handleImplementBatching(mockStep, execution, null);
+
+    expect(decision).toEqual({ action: 'initialize_batches', reason: expect.any(String) });
+  });
+
+  // ... tests for all 10 G2.* items
+});
+```
+
+### Integration Tests (Mocked Dependencies)
+
+```typescript
+// packages/dashboard/tests/orchestration/integration.test.ts
+
+describe('orchestration loop integration', () => {
+  // G11.5: Happy path
+  it('completes full orchestration: design → merge', async () => {
+    const stateSequence = [
+      fixtures.state.designNotStarted,
+      fixtures.state.designComplete,
+      fixtures.state.analyzeComplete,
+      fixtures.state.implementComplete,
+      fixtures.state.verifyComplete,
+      fixtures.state.mergeComplete,
+    ];
+    let stateIndex = 0;
+
+    const deps = createMockDeps({
+      readState: vi.fn(() => Promise.resolve(stateSequence[stateIndex++])),
+      spawnWorkflow: vi.fn().mockResolvedValue('wf-123'),
+    });
+
+    await runOrchestrationLoop('orch-1', '/test/path', deps);
+
+    expect(deps.spawnWorkflow).toHaveBeenCalledWith('flow.design');
+    expect(deps.spawnWorkflow).toHaveBeenCalledWith('flow.analyze');
+    expect(deps.spawnWorkflow).toHaveBeenCalledWith('flow.implement');
+    expect(deps.spawnWorkflow).toHaveBeenCalledWith('flow.verify');
+    expect(deps.spawnWorkflow).toHaveBeenCalledWith('flow.merge');
+  });
+
+  // G11.12: Race condition prevention
+  it('prevents duplicate workflow spawns on rapid triggers', async () => {
+    const deps = createMockDeps({
+      readState: vi.fn().mockResolvedValue(fixtures.state.designNotStarted),
+      spawnWorkflow: vi.fn().mockImplementation(async () => {
+        await sleep(100); // Simulate spawn delay
+        return 'wf-123';
+      }),
+    });
+
+    // Trigger loop twice rapidly
+    const loop1 = runSingleIteration('orch-1', '/test', deps);
+    const loop2 = runSingleIteration('orch-1', '/test', deps);
+
+    await Promise.all([loop1, loop2]);
+
+    // Should only spawn once due to spawn intent pattern
+    expect(deps.spawnWorkflow).toHaveBeenCalledTimes(1);
+  });
+});
+```
+
+### Test Fixtures (in repo)
+
+```
+packages/dashboard/tests/fixtures/orchestration/
+├── state/
+│   ├── design-not-started.json
+│   ├── design-complete.json
+│   ├── implement-batch-1-of-3.json
+│   ├── verify-complete-user-gate.json
+│   ├── verify-complete-auto-merge.json
+│   └── corrupt.json
+├── execution/
+│   ├── running-design.json
+│   ├── running-implement-batches.json
+│   └── needs-attention.json
+├── workflows/
+│   ├── running.json
+│   ├── waiting-for-input.json
+│   └── completed.json
+└── helpers.ts  # createMockDeps(), createMockExecution(), etc.
+```
+
+### Git Tags for ~/dev/test-app/
+
+| Tag | State | Use Case |
+|-----|-------|----------|
+| `test/clean-slate` | No .specflow/, fresh project | Start orchestration test |
+| `test/design-complete` | Design done, analyze not started | Transition tests |
+| `test/implement-batch-1` | Batch 1 complete, batch 2 pending | Batch handling tests |
+| `test/implement-batch-failed` | Batch 2 failed, heal attempts = 1 | Heal/recovery tests |
+| `test/verify-user-gate` | Verify complete, USER_GATE pending | Gate tests |
+| `test/verify-auto-merge` | Verify complete, autoMerge=true | Auto-merge tests |
+| `test/corrupt-state` | Invalid JSON in state file | Recovery tests |
+| `test/stale-workflow` | Running workflow, old timestamps | Staleness tests |
+| `test/paused` | Orchestration status=paused | Pause/resume tests |
+| `test/verify-manual-merge` | Verify complete, autoMerge=false | Manual merge flow |
+| `test/waiting-for-input` | Workflow waiting, question in JSONL | Question flow tests |
+
+### External CLI / JSONL Testing
+
+Git tags only cover project state (`.specflow/`). Session data lives in `~/.claude/projects/{hash}/` and needs separate setup.
+
+**JSONL Test Fixtures** (in repo, copied to ~/.claude/ during tests):
+
+```
+packages/dashboard/tests/fixtures/jsonl/
+├── session-with-question.jsonl     # Contains AskUserQuestion tool call
+├── session-running.jsonl           # Active session with recent messages
+├── session-completed.jsonl         # Finished session
+└── session-external-cli.jsonl      # Simulates session started from terminal
+```
+
+**JSONL with question example:**
+```jsonl
+{"type":"assistant","message":{"role":"assistant","content":[{"type":"tool_use","id":"toolu_123","name":"AskUserQuestion","input":{"questions":[{"question":"Which approach should we use?","header":"Approach","options":[{"label":"Option A","description":"Fast but limited"},{"label":"Option B","description":"Comprehensive"}],"multiSelect":false}]}}]}}
+```
+
+**Setup script for external CLI testing:**
+```bash
+#!/bin/bash
+# packages/dashboard/tests/setup-jsonl-fixtures.sh
+
+TEST_APP_PATH="$HOME/dev/test-app"
+PROJECT_HASH=$(echo -n "$TEST_APP_PATH" | shasum -a 256 | cut -c1-16)
+CLAUDE_SESSION_DIR="$HOME/.claude/projects/$PROJECT_HASH"
+
+mkdir -p "$CLAUDE_SESSION_DIR"
+
+# Copy fixtures
+cp packages/dashboard/tests/fixtures/jsonl/*.jsonl "$CLAUDE_SESSION_DIR/"
+
+echo "JSONL fixtures installed to $CLAUDE_SESSION_DIR"
+```
+
+### E2E Test Harness
+
+Script to run E2E tests against ~/dev/test-app/:
+
+```typescript
+// packages/dashboard/tests/e2e/orchestration-harness.ts
+
+import { spawn } from 'child_process';
+
+interface E2ETestCase {
+  name: string;
+  gitTag: string;
+  jsonlFixtures?: string[];  // Copy these to ~/.claude/projects/
+  actions: E2EAction[];
+  assertions: E2EAssertion[];
+}
+
+const testCases: E2ETestCase[] = [
+  {
+    name: 'G11.5: Happy path design → merge',
+    gitTag: 'test/clean-slate',
+    actions: [
+      { type: 'start_orchestration', config: { autoMerge: true } },
+      { type: 'wait_for_status', status: 'completed', timeout: 300000 },
+    ],
+    assertions: [
+      { type: 'step_reached', step: 'merge' },
+      { type: 'status_is', status: 'completed' },
+    ],
+  },
+  {
+    name: 'G11.6: Manual merge (autoMerge=false)',
+    gitTag: 'test/verify-manual-merge',
+    actions: [
+      { type: 'start_orchestration', config: { autoMerge: false } },
+      { type: 'wait_for_status', status: 'waiting_merge', timeout: 60000 },
+    ],
+    assertions: [
+      { type: 'status_is', status: 'waiting_merge' },
+      { type: 'step_is', step: 'verify' },
+    ],
+  },
+  {
+    name: 'G11.8: Question flow',
+    gitTag: 'test/waiting-for-input',
+    jsonlFixtures: ['session-with-question.jsonl'],
+    actions: [
+      { type: 'wait_for_sse_event', event: 'session:question', timeout: 5000 },
+    ],
+    assertions: [
+      { type: 'question_displayed_in_ui' },
+    ],
+  },
+  {
+    name: 'G11.10: Pause/resume',
+    gitTag: 'test/paused',
+    actions: [
+      { type: 'click_play_button' },
+      { type: 'wait_for_status', status: 'running', timeout: 5000 },
+    ],
+    assertions: [
+      { type: 'status_is', status: 'running' },
+    ],
+  },
+  {
+    name: 'G11.11: External CLI detection',
+    gitTag: 'test/design-complete',
+    jsonlFixtures: ['session-external-cli.jsonl'],
+    actions: [
+      { type: 'simulate_jsonl_modification', file: 'session-external-cli.jsonl' },
+      { type: 'wait_for_sse_event', event: 'session:activity', timeout: 2000 },
+    ],
+    assertions: [
+      { type: 'session_activity_detected' },
+    ],
+  },
+];
+
+async function runE2ETests() {
+  for (const testCase of testCases) {
+    console.log(`Running: ${testCase.name}`);
+
+    // 1. Reset test-app to git tag
+    await exec(`cd ~/dev/test-app && git checkout ${testCase.gitTag} -f`);
+
+    // 2. Setup JSONL fixtures if needed
+    if (testCase.jsonlFixtures) {
+      await setupJsonlFixtures(testCase.jsonlFixtures);
+    }
+
+    // 3. Start dashboard in test mode
+    const dashboard = spawn('pnpm', ['dev:dashboard'], {
+      env: { ...process.env, TEST_MODE: 'true' }
+    });
+
+    // 4. Execute actions
+    for (const action of testCase.actions) {
+      await executeAction(action);
+    }
+
+    // 5. Run assertions
+    for (const assertion of testCase.assertions) {
+      await runAssertion(assertion);
+    }
+
+    // 6. Cleanup
+    dashboard.kill();
+  }
+}
+```
+
+### Test Coverage Matrix
+
+| Test Type | What It Tests | Runs Against | Speed |
+|-----------|---------------|--------------|-------|
+| **Unit** | Pure functions (makeDecision, validateState) | In-memory fixtures | <1s |
+| **Integration** | Orchestration loop with mocked deps | Mocked OrchestrationDeps | <5s |
+| **E2E** | Full system with real files | ~/dev/test-app + git tags | 30s-5min |
+
+**Coverage by Goal:**
+
+| Goal | Unit | Integration | E2E |
+|------|------|-------------|-----|
+| G1.* Decision Matrix | ✓ | ✓ | - |
+| G2.* Batch Handling | ✓ | ✓ | - |
+| G3.* Claude Helper | - | ✓ (mocked) | - |
+| G4.* Question Flow | - | - | ✓ |
+| G5.* Race Conditions | ✓ | ✓ | - |
+| G6.* Session Tracking | - | - | ✓ |
+| G7.* State Validation | ✓ | - | - |
+| G11.5-12 Integration | - | ✓ | ✓ |
+
+---
+
+## Verifiable Testing Goals
+
+**Pure function extraction:**
+- [ ] G12.1: `makeDecision()` is a pure function (no direct I/O calls)
+- [ ] G12.2: `handleImplementBatching()` is a pure function
+- [ ] G12.3: `validateState()` is a pure function
+- [ ] G12.4: `runOrchestrationLoop()` accepts `OrchestrationDeps` parameter
+
+**Test fixtures in repo:**
+- [ ] G12.5: State fixtures exist in `packages/dashboard/tests/fixtures/orchestration/state/`
+- [ ] G12.6: Execution fixtures exist in `packages/dashboard/tests/fixtures/orchestration/execution/`
+- [ ] G12.7: Workflow fixtures exist in `packages/dashboard/tests/fixtures/orchestration/workflows/`
+- [ ] G12.8: JSONL fixtures exist in `packages/dashboard/tests/fixtures/jsonl/`
+- [ ] G12.9: `helpers.ts` exports `createMockDeps()`, `createMockExecution()`, `createMockState()`
+
+**Unit tests:**
+- [ ] G12.10: Unit tests exist for all 18 G1.* decision matrix conditions
+- [ ] G12.11: Unit tests exist for all 10 G2.* batch handling conditions
+- [ ] G12.12: Unit tests exist for all 7 G7.* state validation checks
+- [ ] G12.13: Unit test for spawn intent pattern (G5.3-G5.7)
+
+**Integration tests (mocked deps):**
+- [ ] G12.14: Integration tests use `OrchestrationDeps` mocks (no real file I/O)
+- [ ] G12.15: Happy path test: design → merge with autoMerge=true
+- [ ] G12.16: Manual merge test: verify → wait_merge with autoMerge=false
+- [ ] G12.17: Race condition test: rapid triggers spawn only once
+
+**Git tags in ~/dev/test-app/:**
+- [ ] G12.18: Tag `test/clean-slate` exists (no .specflow/)
+- [ ] G12.19: Tag `test/design-complete` exists
+- [ ] G12.20: Tag `test/implement-batch-1` exists
+- [ ] G12.21: Tag `test/implement-batch-failed` exists
+- [ ] G12.22: Tag `test/verify-user-gate` exists
+- [ ] G12.23: Tag `test/verify-auto-merge` exists
+- [ ] G12.24: Tag `test/verify-manual-merge` exists
+- [ ] G12.25: Tag `test/corrupt-state` exists
+- [ ] G12.26: Tag `test/stale-workflow` exists
+- [ ] G12.27: Tag `test/paused` exists
+- [ ] G12.28: Tag `test/waiting-for-input` exists
+
+**E2E test harness:**
+- [ ] G12.29: `setup-jsonl-fixtures.sh` script exists and works
+- [ ] G12.30: E2E harness can reset to git tag
+- [ ] G12.31: E2E harness can setup JSONL fixtures in ~/.claude/projects/
+- [ ] G12.32: E2E harness can start/stop dashboard
+- [ ] G12.33: E2E harness can wait for SSE events
+
+**All tests pass:**
+- [ ] G12.34: `pnpm test:dashboard` passes all unit + integration tests
+- [ ] G12.35: E2E test harness passes all scenarios
diff --git a/.specify/archive/1057-orchestration-simplification/spec.md b/.specify/archive/1057-orchestration-simplification/spec.md
new file mode 100644
index 0000000..61b1679
--- /dev/null
+++ b/.specify/archive/1057-orchestration-simplification/spec.md
@@ -0,0 +1,227 @@
+# Specification: Orchestration Simplification
+
+**Phase**: 1057
+**Created**: 2026-01-23
+**Status**: In Progress
+
+---
+
+## Overview
+
+Refactor dashboard orchestration to trust state file, fix question flow, add Claude Helper for specific recovery scenarios, eliminate race conditions, and unify session tracking across dashboard and CLI.
+
+### Problem Statement
+
+The orchestration-runner (1,412 lines) reimplements /flow.orchestrate logic poorly:
+
+1. `isPhaseComplete()` checks artifacts instead of trusting `step.status`
+2. Question flow is broken (watcher detects questions but data never reaches UI)
+3. No recovery path when things go wrong
+4. 2,343 lines of redundant code between runner and service
+5. Race conditions in workflow spawning and state file access
+6. Batch handling logic scattered and incomplete
+7. No detection of sessions started/resumed from external Claude CLI
+
+### Solution
+
+Trust the state file. Sub-commands set `step.status=complete` when done. The runner:
+1. Reads state (with atomic file access)
+2. Validates state consistency
+3. Spawns workflows (with spawn intent pattern to prevent races)
+4. Transitions when `step.status=complete`
+5. Uses Claude Helper for exactly 3 recovery scenarios
+6. Tracks ALL session activity (dashboard workflows, omnibox commands, external CLI)
+
+---
+
+## Functional Requirements
+
+### FR-001: Trust Step Status
+
+The orchestration runner MUST advance based on `step.status`, not artifact existence.
+
+**Acceptance Criteria:**
+- When sub-command sets `step.status=complete`, orchestration transitions to next step
+- No checks for `hasPlan`, `hasTasks`, `hasSpec` in decision logic
+- `grep "hasPlan\|hasTasks\|hasSpec" orchestration-runner.ts` returns no results
+
+### FR-002: Complete Decision Matrix
+
+Every state combination MUST have an explicit action in `makeDecision()`.
+
+**Acceptance Criteria:**
+- Pre-decision gates: budget check, duration gate (4 hour max)
+- Workflow running: wait (recent) or recover_stale (>10 min)
+- Workflow waiting for input: wait
+- Workflow lookup failure: wait_with_backoff
+- Step complete + verify + USER_GATE: wait_user_gate
+- Step complete + verify + autoMerge=false: wait_merge
+- Step complete + verify + autoMerge=true: transition to merge
+- Step complete + merge: complete
+- Step complete + other: transition to next
+- Step failed/blocked: recover_failed
+- Step in_progress + no workflow: spawn
+- Step not_started: spawn (init batches if implement)
+- No generic else/default that handles "unknown"
+
+### FR-003: Batch State Machine
+
+Implement phase MUST handle batches through complete state machine.
+
+**Acceptance Criteria:**
+- No batches: initialize_batches
+- Pending batch + no workflow: spawn_batch
+- Running batch + workflow running: let staleness check handle
+- Completed batch + pauseBetweenBatches: pause
+- Completed batch + continue: advance_batch
+- Healed batch + more batches: advance_batch
+- Failed batch + heal attempts remaining: heal_batch
+- Failed batch + no attempts: recover_failed
+- All batches complete + step not complete: force_step_complete
+
+### FR-004: Question Flow
+
+Questions from workflows MUST display in UI.
+
+**Acceptance Criteria:**
+- use-sse.ts has `sessionQuestions` state
+- `session:question` event populates the map
+- unified-data-context.tsx exports `sessionQuestions`
+- page.tsx reads from context (NOT hardcoded `[]`)
+- Questions clear after user answers
+
+### FR-005: Claude Helper (Exactly 3 Cases)
+
+Claude Helper MUST only be called for these 3 scenarios:
+
+**Case 1: Corrupt/Missing State**
+- Creates .bak backup BEFORE recovery
+- Calls Claude Helper with `task: 'recover_state'`
+- Fallback to heuristic recovery (silent)
+- Fallback to null → needs_attention
+
+**Case 2: Stale Workflow**
+- Calls Claude Helper with `task: 'diagnose_stale_workflow'`
+- Handles: continue, restart_task, skip_task, abort
+- Fallback to needs_attention (silent)
+
+**Case 3: Failed Step**
+- Pre-checks max heal attempts before calling Claude Helper
+- Calls Claude Helper with `task: 'diagnose_failed_step'`
+- Handles: retry, skip_tasks, run_prerequisite, abort
+- Fallback to simple retry or needs_attention (silent)
+
+**Verification:**
+- `grep -r "claudeHelper" packages/dashboard/src/lib/services/` shows exactly 3 call sites
+
+### FR-006: Race Condition Mitigations
+
+Race conditions MUST be prevented via:
+
+**Atomic State Writes:**
+- Write to `.tmp` file first
+- Use `rename()` for atomic swap
+
+**Spawn Intent Pattern:**
+- Check for existing spawn intent before spawning
+- Check hasActiveWorkflow before spawning
+- Write spawn intent BEFORE calling workflowService.start()
+- Clear intent in finally block
+
+**Persistent Runner State:**
+- Write runner-{orchestrationId}.json with PID and startedAt
+- Reconcile orphaned runners on dashboard startup
+
+**Event Sleep Fix:**
+- Use `Map<string, Set<() => void>>` for eventSignals
+- Multiple callbacks supported
+
+### FR-007: Unified Session Tracking
+
+Dashboard MUST detect sessions from all sources:
+
+**File Watching:**
+- Watch `~/.claude/projects/{hash}/` for new JSONL files (new CLI sessions)
+- Watch for JSONL modifications (CLI session activity)
+- Emit session:created and session:activity SSE events
+
+**Orchestration Integration:**
+- External session activity updates lastActivity
+- Omnibox commands update orchestration state
+
+**Pause/Resume:**
+- Pause button sets status: 'paused'
+- When paused, pause button becomes Play button
+- Play click or omnibox command resumes
+
+---
+
+## Non-Functional Requirements
+
+### NFR-001: Code Simplicity
+
+Reduce complexity through:
+- Pure functions for decision logic (makeDecision, handleImplementBatching, validateState)
+- Dependency injection for testability
+- orchestration-service.ts contains only persistence logic (no decision logic)
+- Consolidate duplicate getNextPhase(), isStepComplete() functions
+
+### NFR-002: State Validation
+
+Validate state consistency:
+- step.index === STEP_INDEX_MAP[step.current]
+- step.current is valid (design, analyze, implement, verify, merge)
+- step.status is valid
+- batches.items[i].index === i
+- batches.current < batches.total (unless all complete)
+- recoveryContext exists when status === 'needs_attention'
+- Cross-file consistency: state step vs execution phase
+
+### NFR-003: Testability
+
+Support comprehensive testing:
+- Pure functions can be unit tested in isolation
+- OrchestrationDeps interface enables mocking
+- Clock abstraction for time-based logic
+- Test fixtures for various states
+
+---
+
+## Success Criteria
+
+### SC-001: Step Advancement
+
+Orchestration advances through steps based solely on `step.status` values.
+
+### SC-002: Question Display
+
+When workflow calls AskUserQuestion, question appears in UI within 2 seconds.
+
+### SC-003: No Duplicate Spawns
+
+Rapid triggers (e.g., multiple button clicks) spawn only one workflow.
+
+### SC-004: External CLI Detection
+
+Session started from external Claude CLI terminal is detected by dashboard within 5 seconds.
+
+### SC-005: Test Coverage
+
+Unit tests cover all decision matrix conditions (G1.1-G1.18, G2.1-G2.10).
+
+---
+
+## Out of Scope
+
+- Changing the workflow spawning mechanism itself
+- Modifying how Claude Helper calls the API
+- UI redesign (only fixing data plumbing)
+- New features beyond fixing existing broken functionality
+
+---
+
+## References
+
+- **Detailed Plan**: [plan.md](plan.md) - Contains 146 verifiable goals (G1-G12)
+- **Phase Document**: `.specify/phases/1057-orchestration-simplification.md`
+- **State Ownership Pattern**: commands/flow.orchestrate.md
diff --git a/.specify/archive/1057-orchestration-simplification/tasks.md b/.specify/archive/1057-orchestration-simplification/tasks.md
new file mode 100644
index 0000000..1aba8cb
--- /dev/null
+++ b/.specify/archive/1057-orchestration-simplification/tasks.md
@@ -0,0 +1,400 @@
+# Tasks: Phase 1057 - Orchestration Simplification
+
+## Phase Goals Coverage
+
+Phase: 1057 - Orchestration Simplification
+Source: `.specify/phases/1057-orchestration-simplification.md`
+
+| # | Phase Goal | Spec Requirement(s) | Task(s) | Status |
+|---|------------|---------------------|---------|--------|
+| 1 | Trust step.status - If sub-command set it to complete, step is done | FR-001 | T001-T023 | COVERED |
+| 2 | Complete decision matrix - Every state combination has explicit action | FR-002, FR-003 | T005-T033 | COVERED |
+| 3 | Fix question flow - Wire SSE data to DecisionToast (3 files) | FR-004 | T051-T058 | COVERED |
+| 4 | Claude Helper for 3 cases only - With explicit fallback chains | FR-005 | T034-T050 | COVERED |
+| 5 | Eliminate race conditions - Atomic writes, spawn intent pattern | FR-006 | T059-T071 | COVERED |
+| 6 | Reduce code - Target simplicity | NFR-001 | T101-T104 | COVERED |
+
+Coverage: 6/6 goals (100%)
+
+---
+
+## Progress Dashboard
+
+> Last updated: 2026-01-23 | Run `specflow status` to refresh
+
+| Phase | Status | Progress |
+|-------|--------|----------|
+| Setup | PENDING | 0/4 |
+| Decision Logic | PENDING | 0/19 |
+| Batch State Machine | PENDING | 0/10 |
+| Claude Helper | PENDING | 0/17 |
+| Question Flow | PENDING | 0/8 |
+| Race Mitigations | PENDING | 0/13 |
+| Session Tracking | PENDING | 0/11 |
+| State Validation | PENDING | 0/7 |
+| Decision Log UI | PENDING | 0/4 |
+| Features Preserved | PENDING | 0/7 |
+| Code Cleanup | PENDING | 0/4 |
+| Tests | PENDING | 0/12 |
+| Testing Infrastructure | PENDING | 0/7 |
+
+**Overall**: 0/123 (0%) | **Current**: T001
+
+---
+
+## Phase 1: Setup
+
+**Purpose**: Extract pure functions and set up dependency injection for testability
+
+- [x] T001 [P] Extract `makeDecision()` as pure function in `packages/dashboard/src/lib/services/orchestration-decisions.ts`
+- [x] T002 [P] Extract `handleImplementBatching()` as pure function in `packages/dashboard/src/lib/services/orchestration-decisions.ts`
+- [x] T003 [P] Extract `validateState()` as pure function in `packages/dashboard/src/lib/services/orchestration-validation.ts`
+- [x] T004 Create `OrchestrationDeps` interface for dependency injection in `packages/dashboard/src/lib/services/orchestration-types.ts`
+
+**Checkpoint**: Pure functions ready for unit testing
+
+---
+
+## Phase 2: Decision Logic (G1)
+
+**Purpose**: Implement complete decision matrix - every state combination has explicit action
+
+### Pre-decision Gates
+
+- [x] T005 [G1.1] Add budget exceeded check before matrix - if `totalCostUsd >= budget.maxTotal` → return `fail` action in `makeDecision()`
+- [x] T006 [G1.2] Add duration gate (4 hour max) - if orchestration running > 4 hours → return `needs_attention` in `makeDecision()`
+
+### Implement Phase Handling (checked first)
+
+- [x] T007 [G1.3] Add implement phase branch - if `step.current === 'implement'`, call `handleImplementBatching()` before other checks
+
+### Workflow Status Checks
+
+- [x] T008 [G1.4] Handle running workflow with recent activity - `workflow.status === 'running'` + activity within 10min → `wait`
+- [x] T009 [G1.5] Handle stale running workflow - `workflow.status === 'running'` + no activity for >10min → `recover_stale`
+- [x] T010 [G1.6] Handle waiting for input - `workflow.status === 'waiting_for_input'` → `wait`
+- [x] T011 [G1.7] Handle workflow lookup failure - workflow ID in state but `getWorkflow()` returns null → `wait_with_backoff`
+
+### Step Complete Transitions
+
+- [x] T012 [G1.8] Handle verify complete with USER_GATE - `step.status === 'complete'` + `current === 'verify'` + `phase.hasUserGate && userGateStatus !== 'confirmed'` → `wait_user_gate`
+- [x] T013 [G1.9] Handle verify complete with autoMerge disabled - `step.status === 'complete'` + `current === 'verify'` + `!config.autoMerge` → `wait_merge`
+- [x] T014 [G1.10] Handle verify complete with autoMerge enabled - `step.status === 'complete'` + `current === 'verify'` + `config.autoMerge` → `transition` to merge
+- [x] T015 [G1.11] Handle merge complete - `step.status === 'complete'` + `current === 'merge'` → `complete`
+- [x] T016 [G1.12] Handle other step completions - `step.status === 'complete'` + other steps → `transition` to next step
+
+### Error States
+
+- [x] T017 [G1.13] Handle failed step - `step.status === 'failed'` → `recover_failed`
+- [x] T018 [G1.14] Handle blocked step - `step.status === 'blocked'` → `recover_failed`
+
+### Spawn Conditions
+
+- [x] T019 [G1.15] Handle in_progress with no workflow - `step.status === 'in_progress'` + no active workflow → `spawn`
+- [x] T020 [G1.16] Handle not_started - `step.status === 'not_started'` → `spawn` (with batch init if implement)
+- [x] T021 [G1.17] Handle null/undefined status - `step.status === null/undefined` → `spawn`
+
+### No Catch-all
+
+- [x] T022 [G1.18] Remove generic else/default case - ensure NO "unknown" handling without logging error
+
+### REMOVE Artifact Checks
+
+- [x] T023 [G10.1] Remove `isPhaseComplete()` artifact checks (`hasPlan`, `hasTasks`, `hasSpec`) from decision logic
+
+**Checkpoint**: Decision matrix complete - all conditions explicitly handled
+
+---
+
+## Phase 3: Batch State Machine (G2)
+
+**Purpose**: Complete batch handling for implement phase
+
+- [x] T024 [G2.1] Handle no batches - `batches.total === 0` → `initialize_batches`
+- [x] T025 [G2.2] Handle all batches complete but step not updated - all batches `completed`/`healed` + `step.status !== 'complete'` → `force_step_complete`
+- [x] T026 [G2.3] Handle all batches complete with step complete - all batches complete + `step.status === 'complete'` → return `null` (let main matrix handle)
+- [x] T027 [G2.4] Handle pending batch with no workflow - `currentBatch.status === 'pending'` + no workflow → `spawn_batch`
+- [x] T028 [G2.5] Handle running batch - `currentBatch.status === 'running'` + workflow running → return `null` (let staleness check handle)
+- [x] T029 [G2.6] Handle completed batch with pause enabled - `currentBatch.status === 'completed'` + `config.pauseBetweenBatches` → `pause`
+- [x] T030 [G2.7] Handle completed batch without pause - `currentBatch.status === 'completed'` + `!pauseBetweenBatches` + more batches → `advance_batch`
+- [x] T031 [G2.8] Handle healed batch - `currentBatch.status === 'healed'` + more batches → `advance_batch`
+- [x] T032 [G2.9] Handle failed batch with attempts remaining - `currentBatch.status === 'failed'` + `healAttempts < maxHealAttempts` → `heal_batch`
+- [x] T033 [G2.10] Handle failed batch with no attempts - `currentBatch.status === 'failed'` + `healAttempts >= maxHealAttempts` → `recover_failed`
+
+**Checkpoint**: Batch state machine complete
+
+---
+
+## Phase 4: Claude Helper (G3)
+
+**Purpose**: Exactly 3 Claude Helper use cases with silent fallbacks
+
+### Case 1: Corrupt/Missing State
+
+- [x] T034 [G3.1] Create `recoverStateWithClaudeHelper()` function in `packages/dashboard/src/lib/services/claude-helper.ts`
+- [x] T035 [G3.2] Create `.bak` backup BEFORE attempting recovery
+- [x] T036 [G3.3] Call Claude Helper with `task: 'recover_state'`
+- [x] T037 [G3.4] If Claude Helper succeeds + confidence > 0.7 → use recovered state
+- [x] T038 [G3.5] If Claude Helper fails → try `tryHeuristicStateRecovery()` (silent, no UI notification)
+- [x] T039 [G3.6] If heuristic fails → return null (caller sets `needs_attention`)
+
+### Case 2: Stale Workflow
+
+- [x] T040 [G3.7] Create `handleStaleWorkflow()` function in `packages/dashboard/src/lib/services/claude-helper.ts`
+- [x] T041 [G3.8] Call Claude Helper with `task: 'diagnose_stale_workflow'`
+- [x] T042 [G3.9] Handle response actions: `continue`, `restart_task`, `skip_task`, `abort`
+- [x] T043 [G3.10] If Claude Helper fails → set `needs_attention` (silent, no error toast)
+
+### Case 3: Failed Step
+
+- [x] T044 [G3.11] Create `handleFailedStep()` function in `packages/dashboard/src/lib/services/orchestration-recovery.ts`
+- [x] T045 [G3.12] Pre-check `healAttempts >= maxHealAttempts` → skip Claude Helper, go to `needs_attention`
+- [x] T046 [G3.13] Call Claude Helper with `task: 'diagnose_failed_step'`
+- [x] T047 [G3.14] Handle response actions: `retry`, `skip_tasks`, `run_prerequisite`, `abort`
+- [x] T048 [G3.15] If Claude Helper fails + heal attempts remaining → simple retry (silent)
+- [x] T049 [G3.16] If Claude Helper fails + no attempts remaining → `needs_attention` (silent)
+
+### Verification
+
+- [x] T050 [G3.17] Verify Claude Helper only called for these 3 cases (grep codebase)
+
+**Checkpoint**: Claude Helper restricted to exactly 3 cases
+
+---
+
+## Phase 5: Question Flow (G4)
+
+**Purpose**: Fix data plumbing from watcher to UI
+
+### use-sse.ts
+
+- [x] T051 [G4.2] Add `sessionQuestions` state (type: `Map<string, SessionQuestion[]>`) in `packages/dashboard/src/hooks/use-sse.ts`
+- [x] T052 [G4.3] Add `session:question` case in switch to populate `sessionQuestions` map
+- [x] T053 [G4.4] Return `sessionQuestions` from hook
+
+### unified-data-context.tsx
+
+- [x] T054 [G4.5] Include `sessionQuestions` in context value in `packages/dashboard/src/contexts/unified-data-context.tsx`
+
+### page.tsx
+
+- [x] T055 [G4.6] Remove hardcoded `decisionQuestions = []` in `packages/dashboard/src/app/projects/[id]/page.tsx`
+- [x] T056 [G4.7] Read `decisionQuestions` from `sessionQuestions.get(consoleSessionId)`
+- [x] T057 [G4.8] Clear questions from map after user answers
+
+### Pre-verification
+
+- [x] T058 [G4.1] Manual test confirms watcher.ts detects questions and emits `session:question` SSE event
+
+**Checkpoint**: Question flow fixed - questions display in UI
+
+---
+
+## Phase 6: Race Condition Mitigations (G5)
+
+**Purpose**: Prevent race conditions with atomic operations
+
+### Atomic State Writes
+
+- [x] T059 [G5.1] Implement atomic writes - `writeOrchestrationState()` writes to `.tmp` file first in `packages/dashboard/src/lib/services/orchestration-service.ts`
+- [x] T060 [G5.2] Use `rename()` for atomic swap after writing temp file
+
+### Spawn Intent Pattern
+
+- [x] T061 [G5.3] Create `spawnWorkflowWithIntent()` function in `packages/dashboard/src/lib/services/orchestration-runner.ts`
+- [x] T062 [G5.4] Check for existing spawn intent before spawning
+- [x] T063 [G5.5] Check `hasActiveWorkflow()` before spawning
+- [x] T064 [G5.6] Write spawn intent to file/state BEFORE calling `workflowService.start()`
+- [x] T065 [G5.7] Clear spawn intent in `finally` block (regardless of success/failure)
+
+### Persistent Runner State
+
+- [x] T066 [G5.8] Implement `persistRunnerState()` to write `runner-{orchestrationId}.json` with PID and startedAt
+- [x] T067 [G5.9] Implement `clearRunnerState()` to remove file when loop exits
+- [x] T068 [G5.10] Call `reconcileRunners()` on dashboard startup to detect orphans
+
+### Event Sleep Fix
+
+- [x] T069 [G5.11] Change `eventSignals` to use `Map<string, Set<() => void>>` (not single callback)
+- [x] T070 [G5.12] Update `eventDrivenSleep()` to add callback to Set
+- [x] T071 [G5.13] Update `wakeUp()` to iterate Set and call all callbacks
+
+**Checkpoint**: Race conditions eliminated
+
+---
+
+## Phase 7: Unified Session Tracking (G6)
+
+**Purpose**: Detect sessions from CLI as well as dashboard
+
+### File Watching
+
+- [x] T072 [G6.1] Watch `~/.claude/projects/{hash}/` directory in `packages/dashboard/src/lib/watcher.ts`
+- [x] T073 [G6.2] Detect new `.jsonl` files (new sessions from CLI)
+- [x] T074 [G6.3] Detect modified `.jsonl` files (session activity from CLI)
+- [x] T075 [G6.4] Emit `session:created` SSE event for new files
+- [x] T076 [G6.5] Emit `session:activity` SSE event for modifications
+
+### Orchestration Integration
+
+- [x] T077 [G6.6] External session activity updates `lastActivity` in orchestration
+- [x] T078 [G6.7] Omnibox commands in session viewer update orchestration state
+
+### Pause/Resume UI
+
+- [x] T079 [G6.8] Verify pause button exists and sets `status: 'paused'`
+- [x] T080 [G6.9] When paused, pause button becomes Play button
+- [x] T081 [G6.10] Play button click resumes orchestration
+- [x] T082 [G6.11] Omnibox command while paused resumes orchestration
+
+**Checkpoint**: External CLI sessions detected
+
+---
+
+## Phase 8: State Validation (G7)
+
+**Purpose**: Validate state consistency
+
+- [x] T083 [G7.1] Check `step.index === STEP_INDEX_MAP[step.current]` in `validateState()`
+- [x] T084 [G7.2] Check `step.current` is in `['design', 'analyze', 'implement', 'verify', 'merge']`
+- [x] T085 [G7.3] Check `step.status` is in valid statuses
+- [x] T086 [G7.4] Check `batches.items[i].index === i`
+- [x] T087 [G7.5] Check `batches.current < batches.total` (unless all complete)
+- [x] T088 [G7.6] Check `recoveryContext` exists when `status === 'needs_attention'`
+- [x] T089 [G7.7] Check cross-file consistency (state step vs execution phase)
+
+**Checkpoint**: State validation complete
+
+---
+
+## Phase 9: Decision Log UI (G8)
+
+**Purpose**: Wire decision log to UI
+
+- [x] T090 [G8.1] Implement `logDecision()` to write to `orchestration.decisionLog` array
+- [x] T091 [G8.2] Phase Completion card reads from `decisionLog`
+- [x] T092 [G8.3] New decision matrix decisions appear in UI
+- [x] T093 [G8.4] Log entries include timestamp, action, and reason
+
+**Checkpoint**: Decision log visible in UI
+
+---
+
+## Phase 10: Features Preserved (G9)
+
+**Purpose**: Ensure cost tracking and heal attempts are preserved
+
+### Cost Tracking
+
+- [x] T094 [G9.1] Verify `addCost()` is called after workflow completes
+- [x] T095 [G9.2] Verify `totalCostUsd` accumulates across workflows
+- [x] T096 [G9.3] Verify budget exceeded triggers `fail` action (covered by T005/G1.1)
+
+### Heal Attempts
+
+- [x] T097 [G9.4] Verify `healAttempts` counter exists in execution state
+- [x] T098 [G9.5] Verify `incrementHealAttempts()` is called before retry
+- [x] T099 [G9.6] Verify max heal attempts check prevents infinite loops (covered by T045/G3.12)
+- [x] T100 [G9.7] Track batch-level `healAttempts` separately from step-level
+
+**Checkpoint**: Features preserved
+
+---
+
+## Phase 11: Code Cleanup (G10)
+
+**Purpose**: Remove duplicate/obsolete code
+
+- [x] T101 [G10.1] Remove `isPhaseComplete()` artifact checks (covered by T023)
+- [x] T102 [G10.2] Consolidate duplicate `getNextPhase()` functions
+- [x] T103 [G10.3] Consolidate duplicate `isStepComplete()` functions
+- [x] T104 [G10.4] Ensure `orchestration-service.ts` contains only persistence logic (no decision logic)
+
+**Checkpoint**: Code simplified
+
+---
+
+## Phase 12: Tests (G11)
+
+**Purpose**: Unit and integration tests
+
+### Unit Tests
+
+- [x] T105 [G11.1] Test for `makeDecision()` covers all G1.* conditions in `packages/dashboard/tests/orchestration/decision-matrix.test.ts`
+- [x] T106 [G11.2] Test for `handleImplementBatching()` covers all G2.* conditions
+- [x] T107 [G11.3] Test for `validateState()` covers all G7.* conditions
+- [x] T108 [G11.4] Test for `spawnWorkflowWithIntent()` prevents duplicate spawns
+
+### Integration Tests
+
+- [x] T109 [G11.5] Happy path test: design → analyze → implement → verify → merge (autoMerge=true)
+- [x] T110 [G11.6] Manual merge test: verify → wait_merge (autoMerge=false)
+- [x] T111 [G11.7] USER_GATE test: verify → wait_user_gate → confirm → merge
+- [x] T112 [G11.8] Question flow test: workflow asks → toast appears → answer → resumes
+- [x] T113 [G11.9] Batch test: implement with multiple batches sequentially
+- [x] T114 [G11.10] Pause/resume test: pause button → play button → resume
+- [x] T115 [G11.11] External CLI test: start session from terminal → dashboard detects
+- [x] T116 [G11.12] Race condition test: rapid spawn triggers → only one workflow
+
+**Checkpoint**: Tests pass
+
+---
+
+## Phase 13: Testing Infrastructure (G12)
+
+**Purpose**: Set up test fixtures and harness
+
+### Pure Function DI
+
+- [x] T117 [G12.1] Verify `makeDecision()` is pure function (no direct I/O)
+- [x] T118 [G12.2] Verify `handleImplementBatching()` is pure function
+- [x] T119 [G12.3] Verify `validateState()` is pure function
+- [x] T120 [G12.4] Verify `runOrchestrationLoop()` accepts `OrchestrationDeps` parameter
+
+### Test Fixtures
+
+- [x] T121 [G12.5-9] Create test fixtures in `packages/dashboard/tests/fixtures/orchestration/` including `state/`, `execution/`, `workflows/`, `helpers.ts`
+- [x] T122 [G12.8] Create JSONL fixtures in `packages/dashboard/tests/fixtures/jsonl/`
+
+### E2E Harness (Optional - defer if time-constrained)
+
+- [x] T123 [G12.29-35] Create E2E test harness script and setup
+
+**Checkpoint**: Testing infrastructure ready
+
+---
+
+## Dependencies & Execution Order
+
+### Phase Dependencies
+
+- **Setup (Phase 1)**: No dependencies - can start immediately
+- **Decision Logic (Phase 2)**: Depends on Setup
+- **Batch State Machine (Phase 3)**: Depends on Setup (uses same pure functions)
+- **Claude Helper (Phase 4)**: Can proceed in parallel with Phase 2-3
+- **Question Flow (Phase 5)**: Can proceed in parallel with Phase 2-4
+- **Race Mitigations (Phase 6)**: Depends on Phase 2 (needs decision logic in place)
+- **Session Tracking (Phase 7)**: Depends on Phase 5 (question flow patterns)
+- **State Validation (Phase 8)**: Depends on Setup
+- **Decision Log UI (Phase 9)**: Depends on Phase 2 (needs decision types)
+- **Features Preserved (Phase 10)**: Verification only, can run after Phase 2
+- **Code Cleanup (Phase 11)**: Depends on Phase 2-6 being complete
+- **Tests (Phase 12)**: Depends on all functional phases
+- **Testing Infrastructure (Phase 13)**: Can proceed in parallel with Phase 12
+
+### Parallel Opportunities
+
+Phases 2-5 have significant parallelism opportunity:
+- Decision Logic (Phase 2) + Batch State Machine (Phase 3) share same file
+- Claude Helper (Phase 4) is isolated
+- Question Flow (Phase 5) is isolated
+
+---
+
+## Notes
+
+- [P] tasks = different files, no dependencies
+- [G#.#] = Maps to verifiable goal in plan.md
+- Each phase should be independently completable
+- Commit after each phase or logical group
+- Reference: plan.md for detailed pseudocode and specifications
diff --git a/.specify/history/HISTORY.md b/.specify/history/HISTORY.md
index fdfa96c..75f6a30 100644
--- a/.specify/history/HISTORY.md
+++ b/.specify/history/HISTORY.md
@@ -4,6 +4,691 @@
 
 ---
 
+## 1057 - Orchestration Simplification
+
+**Completed**: 2026-01-24
+
+### 1057 - Orchestration Simplification
+
+**Goal**: Refactor dashboard orchestration to trust state file, fix question flow, add Claude Helper for specific recovery scenarios, eliminate race conditions, unify session tracking across dashboard and CLI.
+
+**Context**: The orchestration-runner (1,412 lines) reimplements /flow.orchestrate logic poorly instead of following the simple state ownership pattern. Questions are broken because data never reaches UI. Race conditions cause duplicate workflows. External CLI sessions are not detected.
+
+**Solution**: Simple decision loop based on `step.status`, complete batch state machine, Claude Helper for exactly 3 recovery scenarios with silent fallbacks, atomic operations to prevent races, unified session watching for dashboard/omnibox/CLI.
+
+---
+
+## Key Alignment Decisions
+
+| Topic | Decision |
+|-------|----------|
+| Auto-merge | Fully automatic when `autoMerge=true` (no confirmation) |
+| Question flow | Needs testing to verify watcher detection works first |
+| Claude Helper failures | Silent fallback (don't clutter UI) |
+| Race fixes | Must-have for this phase |
+| Stale threshold | 10 minutes fixed |
+| Batch pause/resume | Existing pause→play button, also omnibox resume |
+| Code size | Focus on simplicity, not line count |
+| External CLI | Watch `~/.claude/projects/{hash}/` for JSONL creation AND modification |
+| Testing | Both unit tests AND integration tests required |
+| Features | Keep cost tracking, heal attempts - improve, don't neuter |
+
+---
+
+## Problem Summary
+
+### 1. Orchestration runner is overcomplicated
+
+Current `isPhaseComplete()` checks artifact existence:
+```typescript
+case 'design':
+  return status.context?.hasPlan === true && status.context?.hasTasks === true;
+```
+
+Should just check `step.status`:
+```typescript
+if (step.status === 'complete') return true;
+```
+
+### 2. Questions don't display
+
+- Watcher correctly detects questions from JSONL ✓
+- SSE event broadcasts correctly ✓
+- `use-sse.ts` receives event but DROPS IT (does nothing) ✗
+- `page.tsx` has hardcoded `decisionQuestions = []` ✗
+
+### 3. Race conditions
+
+- State file write/read race (no atomic writes)
+- Workflow spawn double-fire (check and spawn not atomic)
+- Event sleep callback replacement bug
+- No persistent runner state (dashboard restart causes duplicates)
+
+### 4. Batch handling incomplete
+
+- Batch state machine scattered across codebase
+- Missing `pauseBetweenBatches` handling
+- No `initialize_batches` action when entering implement
+
+---
+
+## State Ownership Pattern (from flow.orchestrate.md)
+
+| Owner | Fields | Who Sets |
+|-------|--------|----------|
+| **Orchestrate** | `step.current`, `step.index` | Only orchestrate |
+| **Sub-command** | `step.status` | Set to `in_progress` → `complete` or `failed` |
+
+**Valid steps**: `design`, `analyze`, `implement`, `verify`, `merge`
+
+**Merge step**:
+- If `autoMerge=true` → transition to merge step, run `/flow.merge`
+- If `autoMerge=false` → `wait_merge` status, user triggers manually
+
+---
+
+## Goals
+
+1. **Trust step.status** - If sub-command set it to `complete`, step is done
+2. **Complete decision matrix** - Every state combination has explicit action
+3. **Fix question flow** - Wire SSE data to DecisionToast (3 files)
+4. **Claude Helper for 3 cases only** - With explicit fallback chains
+5. **Eliminate race conditions** - Atomic writes, spawn intent pattern
+6. **Reduce code** - Target <600 lines (from 1,412)
+
+---
+
+## Deliverables
+
+### Phase 1: Simplify Decision Logic
+
+**Pre-decision gates** (checked before matrix):
+- [ ] Budget exceeded check → `fail` action
+- [ ] Duration gate (4 hour max) → `needs_attention`
+
+**Decision matrix** (complete, no ambiguity):
+| Condition | Action |
+|-----------|--------|
+| `current === 'implement'` | Check batch state machine first |
+| `workflow.status === 'running'` + recent activity | `wait` |
+| `workflow.status === 'running'` + stale (>10min) | `recover_stale` |
+| `workflow.status === 'waiting_for_input'` | `wait` |
+| Workflow ID exists but lookup fails | `wait_with_backoff` |
+| `step.status === 'complete'` + `current === 'verify'` + USER_GATE pending | `wait_user_gate` |
+| `step.status === 'complete'` + `current === 'verify'` + `autoMerge=false` | `wait_merge` |
+| `step.status === 'complete'` + `current === 'verify'` + `autoMerge=true` | `transition` to merge |
+| `step.status === 'complete'` + `current === 'merge'` | `complete` |
+| `step.status === 'complete'` + next step exists | `transition` |
+| `step.status === 'failed'` or `'blocked'` | `recover_failed` |
+| `step.status === 'in_progress'` + no workflow | `spawn` |
+| `step.status === 'not_started'` or null | `spawn` (init batches if implement) |
+
+### Phase 2: Batch State Machine
+
+- [ ] `initialize_batches` action when entering implement with no batches
+- [ ] `spawn_batch` action for pending batch + no workflow
+- [ ] `advance_batch` action when batch completes
+- [ ] `heal_batch` action when batch fails + heal attempts remaining
+- [ ] `pause` action when `pauseBetweenBatches=true` + batch completes
+- [ ] `force_step_complete` when all batches done but step.status not updated
+
+### Phase 3: Fix Question Flow (Data Plumbing)
+
+- [ ] `use-sse.ts`: Add `sessionQuestions` state, populate on `session:question` event
+- [ ] `unified-data-context.tsx`: Export `sessionQuestions` from context
+- [ ] `page.tsx`: Replace hardcoded `[]` with `sessionQuestions.get(consoleSessionId)`
+- [ ] Clear questions after user answers
+
+### Phase 4: Add Claude Helper (3 Specific Cases)
+
+**Case 1: Recover Corrupt/Missing State File**
+- When: `readOrchestrationState()` throws error
+- Fallback: Claude Helper → heuristic recovery → return null → `needs_attention`
+- Always: Create `.bak` backup BEFORE recovery
+
+**Case 2: Recover Stale Workflow**
+- When: `workflow.status === 'running'` but no file changes for > 10 minutes
+- Fallback: If Claude Helper fails → conservative `needs_attention`
+
+**Case 3: Recover Failed Step**
+- When: `step.status === 'failed'` or `step.status === 'blocked'`
+- Pre-check: If max heal attempts reached, skip Claude Helper → `needs_attention`
+- Fallback: If Claude Helper fails → simple retry if within limits → else `needs_attention`
+
+### Phase 5: Race Condition Mitigations
+
+- [ ] Atomic state file writes (write to `.tmp`, then rename)
+- [ ] Spawn intent pattern (store intent before spawn, check before spawning)
+- [ ] Persistent runner state (`runner-{orchestrationId}.json`)
+- [ ] Reconcile orphaned runners on dashboard startup
+- [ ] Fix event sleep callback overwrite bug (use Set instead of single callback)
+
+### Phase 6: Unified Session Tracking
+
+Terminal is just the manual version of dashboard automation. Both should work identically.
+
+- [ ] Watch `~/.claude/projects/{hash}/` for JSONL creation (new sessions from CLI)
+- [ ] Watch for JSONL modification (session activity from CLI)
+- [ ] Emit `session:created` and `session:activity` SSE events
+- [ ] Orchestration detects external session activity, updates lastActivity
+- [ ] Omnibox commands in session viewer update orchestration state
+- [ ] Pause button → Play button when paused, resume via click OR omnibox
+
+### Phase 7: Consolidate Code
+
+- [ ] `orchestration-service.ts` becomes thin persistence layer
+- [ ] Remove duplicate `getNextPhase()`, `isStepComplete()` functions
+- [ ] Move shared types to @specflow/shared
+- [ ] Focus on simplicity, not line count
+
+### Phase 8: Decision Log UI
+
+- [ ] Verify decision log wires correctly to Phase Completion card
+- [ ] Make UI improvements if needed
+- [ ] Decisions from new matrix appear correctly
+
+---
+
+## State Validation
+
+Validate BOTH state files and their consistency:
+- [ ] `step.index === STEP_INDEX_MAP[step.current]`
+- [ ] `batches.items[i].index === i` (batch index matches position)
+- [ ] `batches.current < batches.total` (unless all complete)
+- [ ] `recoveryContext` exists when `status === 'needs_attention'`
+- [ ] Cross-file: `OrchestrationState.step.current === OrchestrationExecution.currentPhase`
+
+---
+
+## Verification Gate
+
+**USER GATE**: User must verify:
+
+1. Start orchestration on a test phase
+2. Orchestration advances based on `step.status` (not artifacts)
+3. Batch handling: implement with multiple batches → each spawned sequentially
+4. When workflow needs input, question toast appears
+5. Answer question, workflow resumes
+6. If step fails, Claude Helper diagnoses and recovers (silent fallback if Claude fails)
+7. With `autoMerge=false`: verify complete → `wait_merge` → user triggers
+8. With `autoMerge=true`: verify complete → merge runs automatically (no prompt)
+9. Rapid triggers don't spawn duplicate workflows
+10. Pause button → Play button when paused
+11. Omnibox command resumes paused orchestration
+12. Start session from external CLI terminal → dashboard detects it
+13. Decision log appears correctly in Phase Completion card
+14. Orchestration completes successfully
+
+---
+
+## Pre-Implementation Verification
+
+Before assuming question detection works:
+- [ ] Manually test: Start workflow that asks question → verify SSE event fires
+- [ ] Check watcher.ts actually parses questions correctly
+- [ ] If detection broken, add to scope
+
+---
+
+## Files to Modify
+
+| File | Changes |
+|------|---------|
+| `packages/dashboard/src/lib/services/orchestration-runner.ts` | Rewrite with complete decision matrix, atomic spawning, batch state machine |
+| `packages/dashboard/src/lib/services/orchestration-service.ts` | Thin to persistence only |
+| `packages/dashboard/src/lib/watcher.ts` | Add project session watching for external CLI |
+| `packages/dashboard/src/hooks/use-sse.ts` | Add `sessionQuestions` state, handle events |
+| `packages/dashboard/src/contexts/unified-data-context.tsx` | Export `sessionQuestions` |
+| `packages/dashboard/src/app/projects/[id]/page.tsx` | Wire questions to DecisionToast |
+| `packages/dashboard/src/components/projects/session-viewer-drawer.tsx` | Verify omnibox updates orchestration |
+| `packages/dashboard/src/lib/services/claude-helper.ts` | Add silent fallback chains, backup before recovery |
+
+---
+
+## Verifiable Goals Checklist
+
+See `specs/1057-orchestration-simplification/plan.md` for full checklist with 80+ concrete verification items.
+
+### Summary by Category
+
+| Category | Items | Description |
+|----------|-------|-------------|
+| G1. Decision Matrix | 18 | Every condition→action in `makeDecision()` |
+| G2. Batch State Machine | 10 | All batch statuses in `handleImplementBatching()` |
+| G3. Claude Helper | 17 | 3 cases only, silent fallbacks, no other calls |
+| G4. Question Flow | 8 | Data plumbing: use-sse → context → page |
+| G5. Race Mitigations | 13 | Atomic writes, spawn intent, persistent runner, event fix |
+| G6. Session Tracking | 11 | CLI detection, omnibox, pause/play |
+| G7. State Validation | 7 | All invariant checks |
+| G8. Decision Log UI | 4 | Wired to Phase Completion card |
+| G9. Features Preserved | 7 | Cost tracking, heal attempts |
+| G10. Code Cleanup | 4 | Remove artifact checks, consolidate duplicates |
+| G11. Tests | 12 | Unit tests + integration tests |
+| G12. Testing Infrastructure | 35 | Pure functions, DI, fixtures, git tags, E2E harness, JSONL fixtures |
+
+**Total: 146 verifiable items**
+
+### Quick Verification Commands
+
+```bash
+# No hardcoded empty questions array
+grep -n "decisionQuestions = \[\]" packages/dashboard/src/  # Should return nothing
+
+# No artifact existence checks
+grep -n "hasPlan\|hasTasks\|hasSpec" orchestration-runner.ts  # Should return nothing
+
+# Claude Helper only in 3 places
+grep -r "claudeHelper\|claude-helper" packages/dashboard/src/lib/services/ --include="*.ts" -l
+
+# Atomic writes exist
+grep -n "\.tmp\|rename" packages/dashboard/src/lib/services/orchestration-service.ts
+```
+
+---
+
+## Dependencies
+
+- Phase 1056 (JSONL Watcher) - ✅ Complete, close before starting 1057
+- Sub-commands must set step.status correctly (verify each)
+
+---
+
+## 1056 - jsonl-watcher
+
+**Completed**: 2026-01-23
+
+### 1056 - JSONL File Watcher & Polling Elimination
+
+**Goal**: Replace all polling with file-watching. Zero polling loops when complete.
+
+**Context**: Dashboard has 9+ polling mechanisms causing 3-5s delays and ~20 subprocess calls/minute.
+
+**Solution**: File-watch everything via chokidar, including session JSONL files in `~/.claude/projects/`. Delete all polling code.
+
+**Approach**: Clean implementation - no migration code, no fallbacks, no deprecated stubs. Single user, so just build it right.
+
+---
+
+## Phase 0: Discovery (COMPLETE)
+
+See `polling-consolidation-analysis.md` for:
+- [x] All 9+ polling locations with line numbers
+- [x] Polling intervals mapped
+- [x] Race conditions identified
+- [x] Data flow documented
+- [x] Existing SSE infrastructure documented
+- [x] New event types specified
+
+**Deliverable**: `.specify/phases/polling-consolidation-analysis.md`
+
+---
+
+## Phase 0.5: Delete Polling Hooks
+
+Delete these files and fix any imports:
+- [ ] `src/hooks/use-workflow-execution.ts`
+- [ ] `src/hooks/use-workflow-list.ts`
+- [ ] `src/hooks/use-session-history.ts`
+- [ ] `src/hooks/use-session-messages.ts`
+- [ ] `src/lib/session-polling-manager.ts`
+
+Replace with SSE-based hooks (`useProjectData`, `useSessionContent`, `useUnifiedData`).
+
+---
+
+## Phase 1: Orchestration Runner Event-Driven (HIGHEST PRIORITY)
+
+**Why first**: The orchestration runner calls `specflow status --json` subprocess (~1-2s) on EVERY 3-second poll. This is the largest performance bottleneck.
+
+### 1.1 Eliminate Subprocess Calls
+
+Replace `specflow status --json` with file watching:
+
+```typescript
+// BEFORE (orchestration-runner.ts:273-284)
+function getSpecflowStatus(projectPath: string): SpecflowStatus | null {
+  const result = execSync('specflow status --json', { // ~1-2s per call!
+    cwd: projectPath,
+    timeout: 30000,
+  });
+  return JSON.parse(result);
+}
+
+// AFTER: Subscribe to file events
+function subscribeToSpecflowStatus(projectPath: string, callback: (status) => void) {
+  // Watch tasks.md for task counts
+  // Watch spec.md, plan.md for artifact existence
+  // Derive status from file state
+}
+```
+
+### 1.2 Watch Files for Status
+
+| Data | Current Source | File to Watch |
+|------|----------------|---------------|
+| Task progress | `specflow status --json` | `specs/{phase}/tasks.md` |
+| Phase artifacts | `specflow status --json` | `spec.md`, `plan.md`, `tasks.md` existence |
+| Phase number | `specflow status --json` | `ROADMAP.md` or orchestration state |
+
+### 1.3 Event-Driven Decision Loop
+
+```
+BEFORE (polling):
+  while (running):
+    sleep(3 seconds)           ← Wastes time
+    specflow status --json     ← Spawns subprocess (~1-2s)
+    load orchestration state
+    make decision
+    execute decision
+
+AFTER (event-driven):
+  subscribe to file events
+  on event:
+    derive status from files   ← Instant, no subprocess
+    make decision
+    execute decision
+  (no sleep - purely reactive)
+```
+
+### 1.4 Implementation Steps
+- [ ] Add `tasks.md` parsing to derive task counts
+- [ ] Add artifact existence checks (no subprocess)
+- [ ] Create event subscription in orchestration-runner
+- [ ] Replace `while(running) { sleep }` with event listener
+- [ ] Delete `specflow status --json` calls entirely
+
+**Impact**: Latency 3000ms → <500ms. Zero subprocess calls.
+
+---
+
+## Phase 2: Session File Watching
+
+Add session JSONL files to chokidar watcher.
+
+### 2.1 Calculate Session Directory
+
+```typescript
+// project-hash.ts (already exists)
+function calculateProjectHash(projectPath: string): string {
+  return projectPath.replace(/\//g, '-');
+}
+
+// Session directory
+const sessionDir = join(homeDir, '.claude', 'projects', calculateProjectHash(projectPath));
+```
+
+### 2.2 Add to Watcher
+
+```typescript
+// In watcher.ts - extend existing chokidar watcher
+function watchSessionFiles(projectPath: string, projectId: string) {
+  const sessionDir = getSessionDirectory(projectPath);
+
+  // Watch all JSONL files in session directory
+  watcher.add(join(sessionDir, '*.jsonl'));
+
+  watcher.on('change', (filePath) => {
+    if (filePath.endsWith('.jsonl')) {
+      const sessionId = basename(filePath, '.jsonl');
+      handleSessionFileChange(projectId, sessionId, filePath);
+    }
+  });
+}
+```
+
+### 2.3 Parse New Content
+
+```typescript
+async function handleSessionFileChange(projectId: string, sessionId: string, filePath: string) {
+  // Read file, get new lines since last read
+  const content = await readFile(filePath, 'utf-8');
+  const lines = content.trim().split('\n');
+
+  // Parse last N lines (tail behavior)
+  const newMessages = parseSessionLines(lines.slice(-100));
+
+  // Check for questions
+  const questions = extractQuestions(newMessages);
+
+  // Broadcast events
+  if (newMessages.length > 0) {
+    broadcast({ type: 'session:message', projectId, sessionId, data: newMessages });
+  }
+  if (questions.length > 0) {
+    broadcast({ type: 'session:question', projectId, sessionId, data: questions });
+  }
+
+  // Check for session end
+  if (detectSessionEnd(newMessages)) {
+    broadcast({ type: 'session:end', projectId, sessionId });
+  }
+}
+```
+
+### 2.4 Remove Session Polling Manager
+- [ ] Migrate `useSessionContent` to SSE events
+- [ ] Remove `sessionPollingManager` singleton
+- [ ] Delete `src/lib/session-polling-manager.ts`
+
+**Impact**: Session updates from 5s polling to <500ms file-watch. Instant question detection.
+
+---
+
+## Phase 3: SSE Event Type Expansion
+
+Extend existing `/api/events` endpoint with new event types.
+
+### 3.1 New Event Types
+
+```typescript
+// In packages/shared/src/schemas/events.ts
+type SSEEvent =
+  // Existing events
+  | { type: 'connected'; timestamp: string }
+  | { type: 'heartbeat'; timestamp: string }
+  | { type: 'registry'; data: Registry }
+  | { type: 'state'; projectId: string; data: OrchestrationState }
+  | { type: 'tasks'; projectId: string; data: TasksData }
+  | { type: 'workflow'; projectId: string; data: WorkflowData }
+  | { type: 'phases'; projectId: string; data: PhasesData }
+
+  // NEW: Session events
+  | { type: 'session:message'; projectId: string; sessionId: string; data: SessionMessage[] }
+  | { type: 'session:question'; projectId: string; sessionId: string; data: Question }
+  | { type: 'session:end'; projectId: string; sessionId: string }
+
+  // NEW: Orchestration events
+  | { type: 'orchestration:decision'; projectId: string; data: DecisionLogEntry }
+  | { type: 'orchestration:batch'; projectId: string; data: BatchProgress }
+  | { type: 'workflow:complete'; projectId: string; workflowId: string };
+```
+
+### 3.2 Update useSSE Hook
+
+```typescript
+// In use-sse.ts - add handlers for new events
+case 'session:message':
+  // Update session content in context
+  break;
+case 'session:question':
+  // Trigger question notification
+  break;
+case 'orchestration:decision':
+  // Update decision log display
+  break;
+```
+
+---
+
+## Phase 4: Client Hook Consolidation
+
+### 4.1 Update useSessionContent
+
+```typescript
+// BEFORE: Uses sessionPollingManager
+export function useSessionContent(sessionId, projectPath) {
+  useEffect(() => {
+    sessionPollingManager.subscribe(sessionId, projectPath);
+    return () => sessionPollingManager.unsubscribe(sessionId);
+  }, [sessionId, projectPath]);
+}
+
+// AFTER: Uses SSE events from context
+export function useSessionContent(sessionId, projectPath) {
+  const { sessionContent } = useUnifiedData();
+  return sessionContent.get(sessionId) ?? null;
+}
+```
+
+### 4.2 Update useOrchestration
+
+```typescript
+// BEFORE: Polls /api/workflow/orchestrate/status every 3s
+// AFTER: Derives from SSE state events + orchestration:* events
+```
+
+### 4.3 Connection Recovery
+
+SSE auto-reconnects on disconnect (existing behavior). No polling fallback - if SSE is down, UI shows stale data until reconnected.
+
+---
+
+## Technical Notes
+
+### Architecture Diagram
+
+```
+┌──────────────────────────────────────────────────────────────────────┐
+│                         FILE SYSTEM                                   │
+├──────────────────────────────────────────────────────────────────────┤
+│                                                                      │
+│  Project Files                      Session Files (EXTERNAL)         │
+│  ~/dev/myproject/                   ~/.claude/projects/{hash}/       │
+│  ├─ .specflow/orchestration.json    ├─ session1.jsonl                │
+│  ├─ specs/{phase}/tasks.md          ├─ session2.jsonl                │
+│  ├─ specs/{phase}/spec.md           └─ ...                           │
+│  └─ ROADMAP.md                                                       │
+│                                                                      │
+└──────────────────┬─────────────────────────────────┬─────────────────┘
+                   │                                 │
+                   ▼                                 ▼
+          ┌─────────────────────────────────────────────────┐
+          │         chokidar watcher (UNIFIED)              │
+          │  Watches: project files + session JSONL files   │
+          │  Debounce: 200ms                                │
+          └────────────────────┬────────────────────────────┘
+                               │
+                               ▼
+          ┌─────────────────────────────────────────────────┐
+          │              SSE Event Bus                      │
+          │  /api/events (existing endpoint)                │
+          │  Events: state, tasks, workflow, phases,        │
+          │          session:*, orchestration:*             │
+          │  Heartbeat: 30s                                 │
+          └────────────────────┬────────────────────────────┘
+                               │
+           ┌───────────────────┼───────────────────┐
+           ▼                   ▼                   ▼
+   ┌───────────────┐   ┌───────────────┐   ┌───────────────┐
+   │ Dashboard UI  │   │ Orchestration │   │ Session       │
+   │ (useSSE)      │   │ Runner        │   │ Viewer        │
+   │               │   │ (event-driven)│   │               │
+   └───────────────┘   └───────────────┘   └───────────────┘
+```
+
+### macOS File Watcher Limits
+
+**Problem**: macOS default limit is 256 file watchers.
+
+**Mitigation**: Use glob patterns instead of individual file watches:
+
+```typescript
+// GOOD: Single glob pattern covers many files
+watcher.add([
+  `${homeDir}/.specflow/**/*.json`,
+  `${homeDir}/.claude/projects/**/*.jsonl`,
+  ...projects.map(p => `${p.path}/specs/**/tasks.md`),
+]);
+
+// BAD: One watcher per file (hits limits)
+projects.forEach(p => watcher.add(`${p.path}/tasks.md`));
+```
+
+**Cleanup**: Remove watchers when:
+- Project unregistered from registry
+- Session ends (detected from JSONL content)
+- No SSE subscribers for 5 minutes
+
+### Debouncing Strategy
+
+```typescript
+const DEBOUNCE_MS = 200; // Existing value, proven stable
+
+// For session files (high write frequency during active sessions)
+const SESSION_DEBOUNCE_MS = 100; // Slightly faster for responsiveness
+```
+
+---
+
+## Files to Modify
+
+### DELETE (polling code)
+- `src/hooks/use-workflow-execution.ts`
+- `src/hooks/use-workflow-list.ts`
+- `src/hooks/use-session-history.ts`
+- `src/hooks/use-session-messages.ts`
+- `src/lib/session-polling-manager.ts`
+
+### MODIFY (event-driven)
+- `src/lib/services/orchestration-runner.ts` - Event-driven loop, no subprocess
+- `src/lib/watcher.ts` - Add session JSONL + tasks.md watching
+- `src/hooks/use-session-content.ts` - Use SSE events
+- `src/hooks/use-orchestration.ts` - Remove polling
+- `src/hooks/use-sse.ts` - Handle new event types
+- `src/contexts/unified-data-context.tsx` - Session content from SSE
+- `packages/shared/src/schemas/events.ts` - New event types
+- `src/app/api/events/route.ts` - Emit new events
+
+---
+
+## Verification Gate: USER
+
+- [ ] Session messages appear within 500ms
+- [ ] Questions appear instantly
+- [ ] Orchestration updates without polling
+- [ ] No `specflow status --json` subprocess calls
+- [ ] No `setInterval` polling loops remain
+- [ ] Connection recovers on network interruption
+
+---
+
+## Success Metrics
+
+| Metric | Before | After |
+|--------|--------|-------|
+| Session latency | 0-5s | <500ms |
+| Question delay | 0-5s | <200ms |
+| Decision latency | 3-5s | <500ms |
+| Subprocess calls/min | ~20 | 0 |
+| Polling loops | 9+ | 0 |
+
+---
+
+## Dependencies
+
+- Phase 1055 (Smart Batching) - Stable orchestration foundation
+
+## Complexity
+
+**Medium** - Builds on existing infrastructure (SSE endpoint, chokidar watcher, event types all exist).
+
+## Risks
+
+- **File watcher limits**: Use glob patterns, not per-file watchers
+- **Rapid file changes**: 200ms debounce handles this
+
+---
+
 ## 1055 - Smart Batching & Orchestration
 
 **Completed**: 2026-01-22
diff --git a/.specify/phases/1056-jsonl-watcher.md b/.specify/phases/1056-jsonl-watcher.md
deleted file mode 100644
index 206929e..0000000
--- a/.specify/phases/1056-jsonl-watcher.md
+++ /dev/null
@@ -1,229 +0,0 @@
----
-phase: 1056
-name: jsonl-watcher
-status: not_started
-created: 2026-01-22
-updated: 2026-01-22
----
-
-### 1056 - JSONL File Watcher & Polling Consolidation
-
-**Goal**: Replace fragmented polling with unified push-based updates, providing near-instant UI updates and eliminating redundant polling loops across the dashboard.
-
-**Context**: The dashboard has accumulated multiple polling loops:
-- Session content: 3-second polling
-- Workflow status: 3-second polling
-- Orchestration runner: 3-second polling loop
-- Various hooks polling the same data independently
-
-This causes:
-- Up to 3 seconds delay before UI updates
-- Race conditions between multiple pollers
-- Redundant API calls and file reads
-- Each bug fix tends to add another polling mechanism
-
-**Solution**: Unified event-driven architecture with JSONL file watching as the single source of truth.
-
----
-
-## Phase 0: Discovery (REQUIRED FIRST)
-
-Before implementation, map all current polling sources:
-
-### 0.1 Inventory Current Polling
-- [ ] Document all polling locations in dashboard codebase
-- [ ] Identify polling intervals and what data each polls
-- [ ] Map dependencies between pollers
-- [ ] Identify which polls can be consolidated vs need to remain separate
-
-### 0.2 Data Flow Analysis
-- [ ] Map what data changes trigger what UI updates
-- [ ] Identify the authoritative source for each piece of data
-- [ ] Document current race conditions and their symptoms
-- [ ] List all SSE endpoints that already exist
-
-### 0.3 Consolidation Plan
-- [ ] Design unified event taxonomy (what events, what data)
-- [ ] Determine which components subscribe to which events
-- [ ] Plan migration path (parallel run, then cutover)
-- [ ] Define rollback strategy
-
-**Discovery Deliverable**: `polling-consolidation-analysis.md` documenting findings
-
----
-
-## Phase 1: Server-Side File Watcher
-
-Implement file watching on the Next.js server:
-- Watch active session JSONL files using `fs.watch` or `chokidar`
-- Detect changes and parse new content
-- Track which sessions are being watched (cleanup on disconnect)
-- Handle file rotation/truncation gracefully
-
----
-
-## Phase 2: Unified SSE Event Bus
-
-### 2.1 SSE Endpoint
-New API route for streaming ALL dashboard updates:
-- `GET /api/events/stream?projectId=xxx`
-- Single connection per project (not per session)
-- Events cover: session, workflow, orchestration, task progress
-
-### 2.2 Event Types
-```typescript
-type DashboardEvent =
-  | { type: 'session:message'; data: SessionMessage }
-  | { type: 'session:question'; data: Question }
-  | { type: 'session:end'; data: { sessionId: string } }
-  | { type: 'workflow:status'; data: WorkflowExecution }
-  | { type: 'orchestration:progress'; data: OrchestrationProgress }
-  | { type: 'orchestration:decision'; data: DecisionLogEntry }
-  | { type: 'tasks:updated'; data: TaskProgress }
-  | { type: 'heartbeat'; data: null };
-```
-
-### 2.3 Heartbeat & Reconnection
-- Heartbeat every 30s to detect stale connections
-- Client auto-reconnects with exponential backoff
-- Server cleans up watchers on disconnect
-
----
-
-## Phase 3: Orchestration Runner Integration
-
-**Critical**: Migrate orchestration-runner from polling to event-driven:
-
-### 3.1 Current Architecture (Polling)
-```
-orchestration-runner:
-  while (running):
-    load orchestration state
-    load workflow status
-    make decision
-    execute decision
-    sleep(3 seconds)
-```
-
-### 3.2 Target Architecture (Event-Driven)
-```
-orchestration-runner:
-  subscribe to workflow events
-  subscribe to specflow status events
-  on event:
-    make decision
-    execute decision
-  (no polling loop - purely reactive)
-```
-
-### 3.3 Migration Steps
-- [ ] Add event emission when workflow status changes
-- [ ] Add event emission when specflow status changes
-- [ ] Create event handler in orchestration-runner
-- [ ] Run parallel (events + polling) during transition
-- [ ] Remove polling loop once events proven stable
-
----
-
-## Phase 4: Client Hook Migration
-
-### 4.1 Unified Event Hook
-Create `useProjectEvents(projectId)`:
-- Single SSE connection per project
-- Dispatches events to appropriate state stores
-- Handles reconnection transparently
-
-### 4.2 Deprecate Polling Hooks
-Migrate away from:
-- `useWorkflowExecution` polling → SSE events
-- `useSessionMessages` polling → SSE events
-- `useOrchestration` polling → SSE events
-
-### 4.3 Fallback Strategy
-- Detect SSE connection failure
-- Automatically fall back to consolidated polling (single poller, not multiple)
-- Warn in console when in fallback mode
-
----
-
-## Phase 5: Question Detection Enhancement
-
-Improve question detection for instant display:
-- Parse `AskUserQuestion` tool calls from JSONL in real-time
-- Emit `session:question` SSE event immediately when detected
-- Update `DecisionToast` visibility without waiting for workflow status poll
-
----
-
-**Technical Notes:**
-
-Architecture:
-```
-┌─────────────────┐     fs.watch      ┌─────────────────┐
-│  JSONL file     │ ───────────────▶  │  Server (Next)  │
-│  changes        │                   │  Event Bus      │
-└─────────────────┘                   └────────┬────────┘
-                                               │ SSE push
-┌─────────────────┐                           │
-│  specflow CLI   │ ──── status ─────────────▶│
-│  state changes  │                           │
-└─────────────────┘                           ▼
-                                      ┌─────────────────┐
-                                      │  Dashboard UI   │
-                                      │  (single SSE)   │
-                                      └─────────────────┘
-                                               │
-                                               ▼
-                                      ┌─────────────────┐
-                                      │  Orchestration  │
-                                      │  Runner         │
-                                      │  (event-driven) │
-                                      └─────────────────┘
-```
-
-Considerations:
-- File watcher limits on macOS (256 default, can be increased)
-- Cleanup watchers for inactive sessions (5 min timeout)
-- Rate limiting to prevent overwhelming clients (debounce 100ms)
-- Graceful degradation to polling if SSE fails
-- Single SSE connection per browser tab (avoid 6-connection limit)
-
----
-
-**UI Components:**
-- No new visual components - improves responsiveness of existing UI
-
-**API Routes:**
-- GET `/api/events/stream` - Unified SSE endpoint for all dashboard events
-
-**Hooks:**
-- `useProjectEvents.ts` - Single SSE hook per project
-- Deprecate: `useWorkflowExecution`, `useSessionMessages` polling modes
-
-**Services:**
-- `event-bus.ts` - Server-side event aggregation and SSE management
-- `session-watcher.ts` - JSONL file watcher
-- `specflow-watcher.ts` - CLI state file watcher
-
----
-
-**Dependencies:**
-- Phase 1055 (Smart Batching) - Stable orchestration foundation
-
-**Verification Gate: USER**
-- [ ] Session messages appear within 500ms of Claude output
-- [ ] Questions appear instantly (no 3s delay)
-- [ ] Orchestration progress updates without polling
-- [ ] Single SSE connection per project (verified in Network tab)
-- [ ] Connection recovers gracefully after network interruption
-- [ ] No memory leaks from file watchers
-- [ ] Fallback to polling works when SSE unavailable
-- [ ] orchestration-runner uses events, not polling loop
-
-**Estimated Complexity**: Medium-High (due to migration scope)
-
-**Risk Notes:**
-- File watcher resource limits on systems with many concurrent sessions
-- SSE connection limits in browsers (6 per domain in HTTP/1.1)
-- Edge cases with rapid file changes (debouncing needed)
-- Migration period where both polling and events coexist
diff --git a/.specify/phases/polling-consolidation-analysis.md b/.specify/phases/polling-consolidation-analysis.md
new file mode 100644
index 0000000..4ecff5d
--- /dev/null
+++ b/.specify/phases/polling-consolidation-analysis.md
@@ -0,0 +1,286 @@
+# Polling Consolidation Analysis
+
+> **Phase 1056 Discovery Document**
+> Generated: 2026-01-22
+> Purpose: Map all polling sources before migrating to event-driven architecture
+
+---
+
+## Executive Summary
+
+The SpecFlow dashboard has accumulated **9+ polling mechanisms** across client hooks, server services, and the orchestration runner. This document maps each source, its purpose, and the consolidation strategy.
+
+**Key Finding**: The orchestration runner's `specflow status --json` subprocess call (~1-2s per call, every 3s) is the largest bottleneck and should be prioritized.
+
+---
+
+## Polling Inventory
+
+### Critical Polling (High Impact)
+
+| Source | Interval | File | Line | Impact |
+|--------|----------|------|------|--------|
+| Orchestration runner | 3s | `orchestration-runner.ts` | 614-695 | Spawns subprocess every poll |
+| Orchestration status hook | 3s | `use-orchestration.ts` | 379 | Active during orchestration |
+| Session polling manager | 5s | `session-polling-manager.ts` | 201 | **Unnecessary** - can file-watch |
+
+### Deprecated Polling (Should Be Removed)
+
+| Source | Interval | File | Replacement |
+|--------|----------|------|-------------|
+| `useWorkflowExecution` | 3s | `use-workflow-execution.ts:299` | `useProjectData()` + `useWorkflowActions()` |
+| `useWorkflowList` | 3s | `use-workflow-list.ts:132` | `useUnifiedData()` |
+| `useSessionHistory` | 5s | `use-session-history.ts:113` | `useProjectData()` |
+| `useSessionMessages` | 3s | `use-session-messages.ts:195` | `useSessionContent()` |
+
+### UI/Utility Polling (Low Priority)
+
+| Source | Interval | File | Notes |
+|--------|----------|------|-------|
+| Status pill timer | 1s | `status-pill.tsx:75` | UI display only |
+| Status message cycling | ~25s | `use-status-message.ts:82` | Motivational messages |
+| Process spawner | 2s | `process-spawner.ts:182` | Checks workflow completion |
+| SSE heartbeat | 30s | `watcher.ts:725` | Keep-alive (not data polling) |
+
+---
+
+## Data Flow Analysis
+
+### What Data Changes Trigger What UI Updates
+
+```
+┌─────────────────────────────────────────────────────────────────┐
+│                    DATA CHANGE SOURCES                          │
+├─────────────────────────────────────────────────────────────────┤
+│                                                                 │
+│  Project Files (File-Watchable)          External Files         │
+│  ├─ .specflow/orchestration-state.json   ├─ ~/.claude/...jsonl │
+│  ├─ specs/{phase}/tasks.md               │   (CAN be watched!) │
+│  ├─ specs/{phase}/spec.md                │                     │
+│  ├─ specs/{phase}/plan.md                └───────────┬─────────┤
+│  ├─ ROADMAP.md                                       │         │
+│  └─ .specflow/workflows/index.json                   │         │
+│                                                      │         │
+└──────────────────────┬───────────────────────────────┘         │
+                       │                                          │
+                       ▼                                          ▼
+              ┌─────────────────┐                      ┌──────────────────┐
+              │  chokidar       │                      │  NEW: chokidar   │
+              │  watcher.ts     │                      │  session watcher │
+              └────────┬────────┘                      └────────┬─────────┘
+                       │                                        │
+                       ▼                                        ▼
+              ┌─────────────────────────────────────────────────────────┐
+              │              SSE Event Bus (/api/events)                │
+              │  Events: state, tasks, workflow, phases, session:*      │
+              └────────────────────────┬────────────────────────────────┘
+                                       │
+                       ┌───────────────┼───────────────┐
+                       ▼               ▼               ▼
+              ┌─────────────┐  ┌─────────────┐  ┌─────────────────┐
+              │ Dashboard   │  │ Orchestr.   │  │ Session         │
+              │ UI          │  │ Runner      │  │ Viewer          │
+              └─────────────┘  └─────────────┘  └─────────────────┘
+```
+
+### Authoritative Data Sources
+
+| Data | Authoritative Source | Current Access | Target Access |
+|------|---------------------|----------------|---------------|
+| Task progress | `tasks.md` | Subprocess (`specflow status`) | File watch |
+| Phase artifacts | `spec.md`, `plan.md` | Subprocess | File watch |
+| Workflow status | `workflows/index.json` | File watch ✓ | File watch ✓ |
+| Orchestration state | `orchestration-state.json` | File watch ✓ | File watch ✓ |
+| Session messages | `~/.claude/.../session.jsonl` | 5s polling | File watch |
+| Session questions | JSONL tool_use blocks | 5s polling | File watch |
+
+---
+
+## Race Conditions Identified
+
+### 1. Orchestration Runner vs UI Polling
+**Symptom**: UI shows stale state while orchestration advances
+**Cause**: Both poll at 3s intervals, not synchronized
+**Solution**: Single event source triggers both
+
+### 2. Multiple Workflow Status Pollers
+**Symptom**: Inconsistent workflow badges across components
+**Cause**: `useWorkflowExecution`, `useWorkflowList`, `useOrchestration` all poll independently
+**Solution**: Remove deprecated hooks, single SSE stream
+
+### 3. Session End Detection Delay
+**Symptom**: Session shows "running" up to 5s after completion
+**Cause**: Polling interval masks immediate status
+**Solution**: File-watch session JSONL for instant end detection
+
+---
+
+## Existing SSE Infrastructure
+
+### Current SSE Endpoint: `/api/events`
+
+```typescript
+// Existing event types (watcher.ts)
+type SSEEvent =
+  | { type: 'connected'; timestamp: string }
+  | { type: 'heartbeat'; timestamp: string }
+  | { type: 'registry'; data: Registry }
+  | { type: 'state'; projectId: string; data: OrchestrationState }
+  | { type: 'tasks'; projectId: string; data: TasksData }
+  | { type: 'workflow'; projectId: string; data: WorkflowData }
+  | { type: 'phases'; projectId: string; data: PhasesData }
+```
+
+### New Event Types Needed
+
+```typescript
+// Session events (add to watcher.ts)
+| { type: 'session:message'; projectId: string; sessionId: string; data: SessionMessage }
+| { type: 'session:question'; projectId: string; sessionId: string; data: Question }
+| { type: 'session:end'; projectId: string; sessionId: string }
+
+// Orchestration events (add for runner)
+| { type: 'orchestration:decision'; projectId: string; data: DecisionLogEntry }
+| { type: 'orchestration:batch'; projectId: string; data: BatchProgress }
+```
+
+---
+
+## Consolidation Plan
+
+### Phase 0: Remove Deprecated Hooks
+1. Audit component usage of deprecated hooks
+2. Migrate to SSE-based equivalents
+3. Delete deprecated hook files
+4. **Eliminates**: 3 redundant polling loops (9s of polling per cycle)
+
+### Phase 1: Add Session File Watching
+1. Calculate session directory: `~/.claude/projects/{projectHash}/`
+2. Add to chokidar watch list: `${sessionDir}/*.jsonl`
+3. Parse new JSONL lines on file change
+4. Emit `session:message` and `session:question` SSE events
+5. **Eliminates**: sessionPollingManager (5s polling)
+
+### Phase 2: Orchestration Runner Event-Driven
+1. Subscribe runner to SSE events (not polling)
+2. Trigger decision cycle on relevant events only
+3. Remove `specflow status --json` subprocess calls
+4. **Eliminates**: 3s polling + 1-2s subprocess per cycle
+
+### Phase 3: Cleanup & Fallback
+1. Add 30s fallback polling (emergency only)
+2. Log event vs poll discrepancies
+3. Remove fallback after stability period
+
+---
+
+## API Endpoints Being Polled
+
+| Endpoint | Current Interval | Hooks Using It | After Consolidation |
+|----------|------------------|----------------|---------------------|
+| `/api/session/content` | 5s | sessionPollingManager | **Eliminated** (file watch) |
+| `/api/session/active` | 3s | useSessionMessages | **Eliminated** (deprecated) |
+| `/api/session/history` | 5s | useSessionHistory | **Eliminated** (deprecated) |
+| `/api/workflow/list` | 3s | useWorkflowList, useWorkflowExecution | **Eliminated** (deprecated) |
+| `/api/workflow/status` | 3s | useWorkflowExecution | **Eliminated** (deprecated) |
+| `/api/workflow/orchestrate/status` | 3s | useOrchestration | SSE events |
+
+---
+
+## File Watcher Resource Limits
+
+### macOS Limits
+- Default: 256 file watchers
+- With many projects: Could hit limit
+- **Mitigation**: Use glob patterns instead of individual file watches
+
+```typescript
+// BAD: One watcher per file
+projects.forEach(p => watcher.add(`${p.path}/tasks.md`));
+
+// GOOD: Glob pattern from common root
+watcher.add([
+  `${homeDir}/.specflow/**/*.json`,
+  `${homeDir}/.claude/projects/**/*.jsonl`,
+  ...projects.map(p => `${p.path}/specs/**/tasks.md`),
+]);
+```
+
+### Cleanup Strategy
+- Remove watchers when project unregistered
+- 5-minute timeout for inactive session watchers
+- Track active subscriptions to avoid orphan watchers
+
+---
+
+## Migration Safety: Parallel Run Strategy
+
+```
+Week 1: Events + Polling (Both Active)
+├─ Events trigger immediate updates
+├─ Polling runs at 30s (reduced from 3s)
+├─ Log any discrepancies between event and poll data
+└─ Alert if discrepancy rate > 1%
+
+Week 2: Events Primary, Polling Fallback
+├─ Polling only runs if no event in 60s
+├─ Considered "fallback mode"
+└─ Log fallback activations
+
+Week 3+: Events Only
+├─ Remove polling code
+├─ Keep heartbeat for connection health
+└─ Monitor for missed events
+```
+
+---
+
+## Success Metrics
+
+| Metric | Current | Target |
+|--------|---------|--------|
+| Session message latency | 0-5s | <500ms |
+| Question appearance delay | 0-3s | <200ms |
+| Orchestration decision latency | 3s | <500ms |
+| Subprocess calls per minute | ~20 | 0 |
+| Concurrent pollers per project | 4-6 | 0 |
+| SSE connections per project | 1 | 1 (unchanged) |
+
+---
+
+## Files to Modify
+
+### Remove/Deprecate
+- `src/hooks/use-workflow-execution.ts` - Remove
+- `src/hooks/use-workflow-list.ts` - Remove
+- `src/hooks/use-session-history.ts` - Remove
+- `src/hooks/use-session-messages.ts` - Remove
+- `src/lib/session-polling-manager.ts` - Remove after session watching
+
+### Modify
+- `src/lib/watcher.ts` - Add session file watching
+- `src/lib/services/orchestration-runner.ts` - Event-driven loop
+- `src/app/api/events/route.ts` - New event types
+- `packages/shared/src/schemas/events.ts` - New event type definitions
+
+### New
+- None needed (extend existing infrastructure)
+
+---
+
+## Appendix: Polling Code Locations
+
+```
+orchestration-runner.ts:614-695    # Main 3s loop
+orchestration-runner.ts:273-284    # specflow status subprocess
+use-orchestration.ts:379           # 3s orchestration status
+use-workflow-execution.ts:299      # 3s workflow (deprecated)
+use-workflow-list.ts:132           # 3s workflow list (deprecated)
+use-session-history.ts:113         # 5s session history (deprecated)
+use-session-messages.ts:195        # 3s session messages (deprecated)
+session-polling-manager.ts:201     # 5s session content
+process-spawner.ts:182             # 2s process completion
+watcher.ts:725                     # 30s heartbeat (keep)
+status-pill.tsx:75                 # 1s UI timer (keep)
+use-status-message.ts:82           # 25s messages (keep)
+```
diff --git a/BACKLOG.md b/BACKLOG.md
index e5ef854..e57e75d 100644
--- a/BACKLOG.md
+++ b/BACKLOG.md
@@ -4,7 +4,7 @@
 > Review periodically to schedule into upcoming phases.
 
 **Created**: 2026-01-18
-**Last Updated**: 2026-01-18
+**Last Updated**: 2026-01-22
 
 ---
 
@@ -29,6 +29,7 @@
 
 | Item | Source | Reason Deferred | Notes |
 |------|--------|-----------------|-------|
+| [RES001] Research BMAD-METHOD for best practices | Manual | Research | Review https://github.com/bmad-code-org/BMAD-METHOD - scale-adaptive planning (5 levels), 21+ specialized agents, 34 structured workflows. Consider: complexity-based phase sizing, agent specialization patterns, execution track concepts (quick/standard/enterprise). |
 | [OE001] Over-Engineering: 5 error classes for enum-like behavior (errors.ts) | Phase 1049 | Deferred | - |
 | [OE002] Over-Engineering: Global state for output options (output.ts) | Phase 1049 | Deferred | - |
 | [OE003] Over-Engineering: Optional projectPath parameter unused (paths.ts) | Phase 1049 | Deferred | - |
@@ -50,6 +51,7 @@
 | V-064 flow.orchestrate.md exit codes | Phase 0082 | implicit (0=success) | - |
 | V-081 No new linting errors | Phase 0082 | lint unavailable | - |
 | V-083 Commit history | Phase 0082 | changes uncommitted | - |
+| I-004: Orchestration event types (orchestration:decision, orchestration:batch) - not critical for core polling elimination goals | Phase 1056 | Deferred | - |
 
 ### P3 - Low Priority
 
diff --git a/CLAUDE.md b/CLAUDE.md
index 88dcb59..a206cd7 100644
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -12,6 +12,7 @@ SpecFlow v3.0 is a spec-driven development framework for Claude Code. This repos
 
 ```bash
 # Smart Commands (TypeScript CLI)
+specflow init                # Initialize new project (full 3.0 compliance)
 specflow status              # Complete project status
 specflow next                # Next actionable task with context
 specflow mark T007           # Mark task complete
@@ -38,8 +39,10 @@ packages/cli/                → TypeScript CLI implementation
 │   │   ├── next.ts         → Next task command
 │   │   ├── mark.ts         → Mark task command
 │   │   ├── check.ts        → Validation command
+│   │   ├── init.ts         → Initialize project (top-level alias)
 │   │   ├── state/          → State subcommands
-│   │   └── phase/          → Phase lifecycle (open/close/status)
+│   │   ├── phase/          → Phase lifecycle (open/close/status)
+│   │   └── project/        → Project lifecycle (init)
 │   └── lib/                → Shared libraries
 │       ├── tasks.ts        → Parse tasks.md
 │       ├── roadmap.ts      → Parse ROADMAP.md
@@ -60,6 +63,12 @@ commands/flow.*.md          → Claude Code slash commands (/flow.*)
 ## CLI Syntax Notes
 
 ```bash
+# Project initialization
+specflow init                       # Initialize new project with full compliance
+specflow init --name "My App"       # With custom project name
+specflow init --force               # Reinitialize existing project
+specflow project init               # Same as specflow init
+
 # State operations
 specflow state get orchestration.phase.number
 specflow state set orchestration.step.current=verify
diff --git a/PHASE_COMPLETE_TEST_TRACKER.md b/PHASE_COMPLETE_TEST_TRACKER.md
new file mode 100644
index 0000000..8fe2baa
--- /dev/null
+++ b/PHASE_COMPLETE_TEST_TRACKER.md
@@ -0,0 +1,357 @@
+# Phase Complete Test Tracker
+
+Testing comprehensive phase completion across all projects.
+
+## Test Summary
+
+| #   | Project           | State                                     | Tasks     | Expected Action                | Result | Notes |
+| --- | ----------------- | ----------------------------------------- | --------- | ------------------------------ | ------ | ----- |
+| 1   | test-app          | Active: 0010-hello-world                  | 3/3 ✓     | Close phase, archive specs     | ⏳     |       |
+| 2   | level-agency-sdd  | Ready → ask question ui                   | N/A       | Should not close (Ready state) | ⏳     |       |
+| 3   | watson-helper     | Ready                                     | N/A       | Should not close (Ready state) | ⏳     |       |
+| 4   | story-sprout      | Active: 0175-story-flow-redesign          | 44/47     | Warn: 3 incomplete tasks       | ⏳     |       |
+| 5   | inbox-pilot       | Active: 0151-digest-ea-transformation     | 137/142   | Warn: 5 incomplete tasks       | ⏳     |       |
+| 6   | specflow          | Active: 1057-orchestration-simplification | 123/123 ✓ | Close phase, archive specs     | ⏳     |       |
+| 7   | ai-assistant      | Ready → Persistent Cache                  | N/A       | Should not close (Ready state) | ⏳     |       |
+| 8   | overnight-coder   | Ready → UI Plugins                        | N/A       | Should not close (Ready state) | ⏳     |       |
+| 9   | rogue-minesweeper | Ready → rune synergies                    | N/A       | Should not close (Ready state) | ⏳     |       |
+| 10  | cli-bridge        | Ready → OpenTelemetry                     | N/A       | Should not close (Ready state) | ⏳     |       |
+| 11  | CodingBridge      | Ready → UI Redesign                       | N/A       | Should not close (Ready state) | ⏳     |       |
+
+---
+
+## Detailed Project Info
+
+### 1. test-app
+
+- **Path**: `/Users/ppatterson/dev/test-app`
+- **Branch**: `0010-hello-world`
+- **Phase**: 0010 - Hello World
+- **Tasks**: 3/3 complete
+- **Expected**:
+  - `specflow phase close` succeeds
+  - `specs/0010-hello-world/` → `.specify/archive/0010-hello-world/`
+  - ROADMAP.md updated with phase status
+  - HISTORY.md appended
+- **Actual**:
+- **Issues**:
+
+---
+
+### 2. level-agency-sdd
+
+- **Path**: `/Users/ppatterson/dev/level-agency-sdd`
+- **State**: Ready (no active phase)
+- **Pending Phase**: "ask question ui"
+- **Expected**:
+  - Phase Complete should indicate no active phase
+  - Or offer to start the pending phase
+- **Actual**:
+- **Issues**:
+
+---
+
+### 3. watson-helper
+
+- **Path**: `/Users/ppatterson/dev/watson-helper`
+- **State**: Ready (no active phase)
+- **Expected**:
+  - Phase Complete should indicate no active phase
+- **Actual**:
+- **Issues**:
+
+---
+
+### 4. story-sprout
+
+- **Path**: `/Users/ppatterson/dev/story-sprout`
+- **Branch**: `0175-story-flow-redesign`
+- **Phase**: 0175 - story flow redesign
+- **Tasks**: 44/47 (3 incomplete)
+- **Expected**:
+  - Warning about incomplete tasks
+  - Either block close or offer to defer incomplete tasks to BACKLOG
+  - If forced: archive with incomplete task note
+- **Actual**:
+- **Issues**:
+
+---
+
+### 5. inbox-pilot
+
+- **Path**: `/Users/ppatterson/dev/inbox-pilot`
+- **Branch**: `0151-digest-ea-transformation`
+- **Phase**: 0151 - digest ea transformation
+- **Tasks**: 137/142 (5 incomplete)
+- **Expected**:
+  - Warning about incomplete tasks
+  - Either block close or offer to defer incomplete tasks to BACKLOG
+  - If forced: archive with incomplete task note
+- **Actual**:
+- **Issues**:
+
+---
+
+### 6. specflow
+
+- **Path**: `/Users/ppatterson/dev/specflow`
+- **Branch**: `1057-orchestration-simplification`
+- **Phase**: 1057 - Orchestration Simplification
+- **Tasks**: 123/123 complete
+- **Expected**:
+  - `specflow phase close` succeeds
+  - `specs/1057-orchestration-simplification/` → `.specify/archive/1057-orchestration-simplification/`
+  - ROADMAP.md updated
+  - HISTORY.md appended
+- **Actual**:
+- **Issues**:
+
+---
+
+### 7. ai-assistant
+
+- **Path**: `/Users/ppatterson/dev/ai-assistant`
+- **State**: Ready (no active phase)
+- **Pending Phase**: "Persistent Cache"
+- **Expected**:
+  - Phase Complete should indicate no active phase
+- **Actual**:
+- **Issues**:
+
+---
+
+### 8. overnight-coder
+
+- **Path**: `/Users/ppatterson/dev/overnight-coder`
+- **State**: Ready (no active phase)
+- **Pending Phase**: "UI Plugins"
+- **Expected**:
+  - Phase Complete should indicate no active phase
+- **Actual**:
+- **Issues**:
+
+---
+
+### 9. rogue-minesweeper
+
+- **Path**: `/Users/ppatterson/dev/rogue-minesweeper`
+- **State**: Ready (no active phase)
+- **Pending Phase**: "rune synergies"
+- **Expected**:
+  - Phase Complete should indicate no active phase
+- **Actual**:
+- **Issues**:
+
+---
+
+### 10. cli-bridge
+
+- **Path**: `/Users/ppatterson/dev/cli-bridge`
+- **State**: Ready (no active phase)
+- **Pending Phase**: "OpenTelemetry Operational Excellence"
+- **Expected**:
+  - Phase Complete should indicate no active phase
+- **Actual**:
+- **Issues**:
+
+---
+
+### 11. CodingBridge
+
+- **Path**: `/Users/ppatterson/dev/CodingBridge`
+- **State**: Ready (no active phase)
+- **Pending Phase**: "UI Redesign Advanced Features"
+- **Expected**:
+  - Phase Complete should indicate no active phase
+- **Actual**:
+- **Issues**:
+
+---
+
+## Phase Complete Expected Behavior
+
+When "Phase Complete" is triggered, the system should:
+
+1. **For Active Phases (100% complete)**:
+   - Run `specflow check --gate verify` to validate
+   - Archive specs from `specs/NNNN-name/` to `.specify/archive/NNNN-name/`
+   - Update ROADMAP.md phase status to ✓
+   - Append summary to `.specify/history/HISTORY.md`
+   - Clear orchestration state
+   - Optionally: commit, push, merge to main
+
+2. **For Active Phases (incomplete tasks)**:
+   - Warn about incomplete tasks
+   - Offer options:
+     - Defer incomplete to BACKLOG.md
+     - Force close anyway
+     - Cancel and continue work
+
+3. **For Ready State (no active phase)**:
+   - Indicate no phase to close
+   - Optionally show pending phases from dashboard
+
+---
+
+## Files to Check After Each Test
+
+For each active phase close, verify:
+
+- [ ] `specs/NNNN-name/` directory removed
+- [ ] `.specify/archive/NNNN-name/` directory created with contents
+- [ ] `ROADMAP.md` phase row updated
+- [ ] `.specify/history/HISTORY.md` updated
+- [ ] `.specflow/orchestration-state.json` cleared/updated
+- [ ] Git branch status (if merge attempted)
+
+---
+
+## Test Log
+
+### Test 1: test-app (0010-hello-world)
+
+**Started**: 2026-01-24
+**Completed**: In progress
+**Actions Taken**:
+
+- Clicked "Complete Phase" with modal defaults
+
+**Observations**:
+
+- ❌ Session viewer did not show "Current Session"
+- ❌ No new session in dropdown before or after refresh
+- Root cause #1: sessionId is populated async after CLI spawns, but hook queries immediately and caches null
+- **FIX #1 APPLIED**: Added polling for sessionId in use-orchestration.ts (polls for up to 15s after start)
+- Root cause #2: Orchestration started at 'implement' phase with 0 batches (all tasks complete) → immediately went to 'needs_attention'
+- **FIX #2 APPLIED**: Added `skipImplement` flag to config schema. When all tasks complete, orchestration now starts at 'verify' phase.
+- Cancelled stuck orchestration `c41e57f6-a441-4b94-8384-9bf3344bdd5b`
+- Root cause #3 (CORRECTED): Verify WAS genuinely complete - the state is NOT stale. When verify is complete, orchestration should skip to merge, not re-run verify.
+- **FIX #3 APPLIED (CORRECTED)**: Added `skipVerify` flag to config schema. When verify step is complete AND all tasks are complete, orchestration starts at 'merge' phase.
+- Cancelled orchestration `72a0cfaf-71bd-4726-ad37-57a2efee3fef`
+- Ready for retry - should now spawn `/flow.merge` workflow
+
+---
+
+### Test 2: level-agency-sdd (ask question ui)
+
+**Started**: 2026-01-24
+**Completed**: In progress
+**Actions Taken**:
+
+- Started orchestration for "ask question ui" phase
+- flow.design completed successfully (parallel agents worked, agent chips displayed)
+- Orchestration did NOT auto-continue to analyze phase
+
+**Observations**:
+
+- ✅ Agent task chips work correctly - parallel agents visible in session viewer
+- ✅ Orchestration IS continuing after design (user confirmed)
+- ❌ Analyze phase was SKIPPED - went directly from design → implement
+- **Root cause**: `getSmartConfig` in `/api/workflow/orchestrate/route.ts` had bug:
+  ```typescript
+  const smartSkipAnalyze = config.skipAnalyze || smartSkipDesign;
+  ```
+  This incorrectly coupled `skipAnalyze` to `skipDesign`. If design artifacts exist OR design is skipped, analyze gets auto-skipped too.
+
+**Fixes Applied**:
+
+- Fixed `getSmartConfig` to NOT auto-skip analyze based on design status
+- User must explicitly check "Skip analyze" to skip it
+- Also added debug logging and 'stale'/'detached' workflow status handling
+- Dashboard rebuilt - ready for retest with new orchestration
+
+---
+
+### Test 3: watson-helper (Ready)
+
+**Started**:
+**Completed**:
+**Actions Taken**:
+
+**Observations**:
+
+---
+
+### Test 4: story-sprout (0175 - 44/47)
+
+**Started**:
+**Completed**:
+**Actions Taken**:
+
+**Observations**:
+
+---
+
+### Test 5: inbox-pilot (0151 - 137/142)
+
+**Started**:
+**Completed**:
+**Actions Taken**:
+
+**Observations**:
+
+---
+
+### Test 6: specflow (1057 - 123/123)
+
+**Started**:
+**Completed**:
+**Actions Taken**:
+
+**Observations**:
+
+---
+
+### Test 7-11: Ready State Projects
+
+**Started**:
+**Completed**:
+**Observations**:
+
+---
+
+## Issues Found
+
+| #   | Project  | Issue                                                                             | Severity | Fixed?                                                              |
+| --- | -------- | --------------------------------------------------------------------------------- | -------- | ------------------------------------------------------------------- |
+| 1   | test-app | No session shown after Complete Phase - sessionId not available immediately       | High     | ✅ Yes - added polling in use-orchestration.ts                      |
+| 2   | test-app | All tasks complete but orchestration tried to start at 'implement' with 0 batches | High     | ✅ Yes - added skipImplement flag to start at 'verify'              |
+| 3   | test-app | Verify was complete but orchestration started at 'verify' instead of 'merge'      | Medium   | ✅ Yes - added skipVerify flag; when verify complete, skip to merge |
+| 4   | test-app | State file mismatch: step.status='complete' for verify, but orchestration at merge | High     | ✅ Yes - only trust step.status if step.current matches orchestration phase |
+| 5   | test-app | Staleness detection using project file times, not workflow activity time | High     | ✅ Yes - use workflow.lastActivityAt instead of lastFileChangeTime |
+| 6   | test-app | Session not showing in UI without refresh - page.tsx didn't use activeSessionId from useOrchestration | High     | ✅ Yes - extract orchestrationSessionId and use as fallback in consoleSessionId |
+| 7   | test-app | SpecFlow session shown as "CLI Session" instead of proper label | Medium   | ✅ Yes - fixed by session history improvements |
+| 8   | test-app | AskUserQuestion UI not rendering - CLI mode uses structured_output, not tool calls | High     | ✅ Yes - added broadcastWorkflowQuestions() and call from workflow-service |
+| 9   | test-app | Question SSE event had wrong structure - sessionId was nested inside data | High     | ✅ Yes - moved sessionId to root level per schema, added timestamp |
+| 10  | test-app | Session polling timeout too short (15s but workflow takes 30s+) | High     | ✅ Yes - increased polling from 15s to 90s in use-orchestration.ts |
+| 11  | test-app | flow.merge errors on no remote instead of asking user | Critical | ✅ Yes - added LOCAL_ONLY_MODE fallback with AskUserQuestion |
+| 12  | test-app | Polling ran all iterations instantly instead of waiting 1s each | High     | ✅ Yes - await the polling loop so isLoading stays true |
+| 13  | test-app | Questions not shown in session viewer | Medium   | ✅ Yes - parse AskUserQuestion from JSONL, render in session-message.tsx |
+| 14  | test-app | Historical sessions hang on "Loading session..." | High     | ✅ Yes - add API fallback in useSessionContent for non-SSE sessions |
+| 15  | test-app | Structured output not shown in session viewer | Low      | ✅ Yes - parse StructuredOutput from JSONL, display via WorkflowOutputCard |
+| 16  | test-app | Parallel agent tasks not shown in session viewer | Medium   | ✅ Yes - parse Task tool calls, display as AgentTaskChip components |
+| 17  | level-agency-sdd | Orchestration skipping analyze phase after design | High     | ✅ Fixed - `smartSkipAnalyze` was incorrectly coupled to `smartSkipDesign` in getSmartConfig |
+| 18  | level-agency-sdd | Question modal not showing when navigating to waiting session | High     | ✅ Fixed - Added fallback to extract questions from session messages when SSE questions unavailable |
+| 19  | level-agency-sdd | Batches marked complete without verifying actual task completion | Critical | ✅ Fixed - Added verifyBatchTaskCompletion() to check tasks.md before advancing batches |
+| 20  | test-app | Question modal not appearing on page refresh | High     | ✅ Fixed - Added loading state to DecisionToast, show toast while questions load |
+| 21  | test-app | "Waiting" badge not clickable to show question modal | Medium   | ✅ Fixed - Added onStatusClick handler to OmniBox, badge now clickable when waiting |
+| 22  | level-agency-sdd | Batches skipped - spawn_batch called completeBatch BEFORE running workflow | Critical | ✅ Fixed - Removed erroneous completeBatch() call from spawn_batch case. Batches 1,3,5,7 were marked complete without workflows! |
+| 23  | level-agency-sdd | workflowStatus didn't reflect selected session's status | High | ✅ Fixed - workflowStatus now uses selectedConsoleSession.status when a session is selected from dropdown |
+| 24  | level-agency-sdd | Questions not extracted from StructuredOutput (CLI mode) | High | ✅ Fixed - decisionQuestions now also checks sessionWorkflowOutput.questions for needs_input status |
+| 25  | level-agency-sdd | handleDecisionAnswer only checked SSE questions, not fallbacks | High | ✅ Fixed - Now computes fallback questions inline (sessionMessages + sessionWorkflowOutput) |
+| 26  | level-agency-sdd | Real-time updates not showing for resumed sessions after answering questions | High | ⏳ Pending - debug logs added, waiting for reproduction |
+| 27  | level-agency-sdd | Orchestration jumped back to Analyze when restarting after Verify was complete | Critical | ✅ Fixed - getSmartConfig now uses better heuristics: if all tasks complete, skip analyze; isPastPhase() checks current phase index |
+
+---
+
+## Final Summary
+
+**Total Projects**: 11
+**Active Phases**: 4 (test-app, story-sprout, inbox-pilot, specflow)
+**Ready State**: 7
+**100% Complete**: 2 (test-app, specflow)
+**Incomplete Tasks**: 2 (story-sprout: 3, inbox-pilot: 5)
+
+**Pass Rate**: \_/11
+**Issues Found**:
+**Issues Fixed**:
diff --git a/README.md b/README.md
index a0441c9..34d7eec 100644
--- a/README.md
+++ b/README.md
@@ -65,22 +65,22 @@ specflow status
 
 ## Quick Start
 
-**1. Initialize your project in Claude Code:**
+**1. Create project structure:**
 
-```
-/flow.init
+```bash
+specflow init                    # Creates .specflow/, .specify/, ROADMAP.md, etc.
 ```
 
-**2. Create your roadmap:**
+**2. Run discovery interview in Claude Code:**
 
 ```
-/flow.roadmap
+/flow.init                       # AI-guided requirements gathering
 ```
 
 **3. Start development:**
 
 ```
-/flow.orchestrate
+/flow.orchestrate                # Full automated workflow
 ```
 
 SpecFlow guides you through design → analyze → implement → verify.
@@ -91,7 +91,7 @@ SpecFlow guides you through design → analyze → implement → verify.
 
 ```mermaid
 flowchart TD
-    A["/flow.init"] --> B["/flow.roadmap"]
+    A["specflow init"] --> B["/flow.init"]
     B --> C["/flow.orchestrate"]
     C --> D["design → analyze → implement → verify"]
     D --> E["/flow.merge"]
@@ -103,8 +103,8 @@ SpecFlow manages the full development lifecycle:
 
 | Stage | What Happens |
 |-------|--------------|
-| **Init** | Discovery interview captures requirements and decisions |
-| **Roadmap** | Break work into phased milestones |
+| **Scaffold** | `specflow init` creates project structure (.specflow/, .specify/, ROADMAP.md) |
+| **Discovery** | `/flow.init` runs AI-guided interview to capture requirements |
 | **Orchestrate** | Automated workflow: design → analyze → implement → verify |
 | **Merge** | Push, create PR, merge, cleanup branches |
 
@@ -122,6 +122,7 @@ SpecFlow has two interfaces:
 ### CLI Commands
 
 ```bash
+specflow init                # Initialize new project (full 3.0 compliance)
 specflow status              # Complete project status
 specflow next                # Next actionable task
 specflow mark T007           # Mark task complete
diff --git a/ROADMAP.md b/ROADMAP.md
index 079a5a7..38a679d 100644
--- a/ROADMAP.md
+++ b/ROADMAP.md
@@ -60,7 +60,8 @@ This allows inserting urgent work without renumbering existing phases.
 | 1053 | Workflow-Session Unification | ✅ Complete | **USER GATE**: Session detected immediately on workflow start |
 | 1054 | Project Details Redesign | ✅ Complete | **USER GATE**: New UI matches v3 mockup, all states work |
 | 1055 | Smart Batching & Orchestration | ✅ Complete | **USER GATE**: Auto-batch tasks, state machine, auto-healing |
-| 1056 | JSONL Watcher (Push Updates) | ⬜ Not Started | **USER GATE**: SSE-based instant updates, no polling delay |
+| 1056 | JSONL Watcher (Push Updates) | ✅ Complete | **USER GATE**: SSE-based instant updates, no polling delay |
+| 1057 | Orchestration Simplification | ✅ Complete | **USER GATE**: State-driven orchestration, questions work, Claude Helper |
 | 1060  | Stats & Operations                | ⬜ Not Started | **USER GATE**: Costs on cards, operations page, basic chart        |
 | 1070  | Cost Analytics                    | ⬜ Not Started | **USER GATE**: Advanced charts, projections, export                |
 
@@ -110,6 +111,7 @@ specflow phase list --complete
 | **Gate 6.7** | 1054  | New project details UI matches v3 mockup, all workflow states work    |
 | **Gate 7**   | 1055  | Auto-batching works, state machine transitions, auto-healing attempts |
 | **Gate 7.5** | 1056  | Session updates within 500ms, questions appear instantly, SSE works   |
+| **Gate 7.6** | 1057  | Orchestration trusts step.status, questions display, Claude Helper works |
 | **Gate 8**   | 1060  | Costs on cards, session history, basic chart, operations page         |
 | **Gate 9**   | 1070  | Advanced charts, projections, CSV/JSON export                         |
 
diff --git a/bin/specflow b/bin/specflow
index 56e21e6..c614d82 100755
--- a/bin/specflow
+++ b/bin/specflow
@@ -9,8 +9,10 @@
 #   next        Get next actionable task
 #   mark        Mark task(s) complete/incomplete
 #   check       Deep validation with auto-fix
+#   init        Initialize a new SpecFlow project
 #   state       Manage orchestration state
 #   phase       Manage phase lifecycle (open/close/status)
+#   project     Manage project lifecycle (init)
 #   workflow    Execute SpecFlow skills via Claude CLI
 #   templates   Manage project templates
 #   help        Show this help message
@@ -65,6 +67,15 @@ COMMANDS:
                   [--fix]             Auto-fix fixable issues
                   [--gate <gate>]     Check specific gate: design, implement, verify
 
+    init        Initialize a new SpecFlow project (alias for "project init")
+                  [--force]           Reinitialize existing project
+                  [--name <name>]     Project name (default: directory name)
+
+    project     Manage project lifecycle
+                  init                Initialize a new SpecFlow project
+                  [--force]           Reinitialize existing project
+                  [--name <name>]     Project name (default: directory name)
+
     state       Manage orchestration state
                   get [key]           Get state value (dot notation)
                   set <key>=<value>   Set state value
@@ -92,12 +103,19 @@ COMMANDS:
     version     Show version
 
 EXAMPLES:
+    specflow init                            # Initialize new project
+    specflow init --name "My App"            # With custom name
     specflow status --json
     specflow next
     specflow mark T007
     specflow check --fix
     specflow state get orchestration.phase.number
 
+INITIALIZATION SEQUENCE:
+    1. specflow init                         # Create project structure (CLI)
+    2. /flow.init                            # Run discovery interview (Claude Code)
+    3. /flow.orchestrate                     # Start development workflow (Claude Code)
+
 For Claude Code slash commands, use: /flow.orchestrate, /flow.design, etc.
 EOF
 }
@@ -163,6 +181,12 @@ main() {
     check)
       run_ts_cli "check" "$@"
       ;;
+    init)
+      run_ts_cli "init" "$@"
+      ;;
+    project)
+      run_ts_cli "project" "$@"
+      ;;
     state)
       run_ts_cli "state" "$@"
       ;;
@@ -193,7 +217,7 @@ main() {
       deprecated_command "${command}"
       ;;
     # Slash commands - these are Claude Code prompts, not CLI commands
-    analyze|specify|clarify|plan|implement|verify|orchestrate|init|constitution|start|design)
+    analyze|specify|clarify|plan|implement|verify|orchestrate|constitution|start|design)
       log_error "Unknown command: ${command}"
       echo ""
       echo "'${command}' is a Claude Code slash command, not a CLI command."
diff --git a/commands/flow.init.md b/commands/flow.init.md
index efe9b34..4609262 100644
--- a/commands/flow.init.md
+++ b/commands/flow.init.md
@@ -69,13 +69,30 @@ Options:
 2. Run /flow.init --force to reinitialize anyway
 ```
 
-**Create project structure** if `.specify/` doesn't exist:
+**If project structure doesn't exist** (no `.specflow/` or `.specify/`):
+
+Recommend the CLI initialization first:
+```
+Project Not Initialized
+
+Run `specflow init` first to create the project structure, then run `/flow.init` for discovery.
+
+Or continue and /flow.init will create the structure for you.
+```
+
+**Create project structure** if `.specify/` doesn't exist (fallback if `specflow init` wasn't run):
 - `.specify/discovery/` - context.md, state.md, decisions.md
 - `.specify/memory/`
 - `.specify/templates/`
 - `.specify/phases/`
 - `specs/`
 
+Note: `specflow init` is the preferred way to create this structure as it also creates:
+- `.specflow/orchestration-state.json` with proper state
+- `.specflow/manifest.json` for version tracking
+- `ROADMAP.md` and `BACKLOG.md` templates
+- Registers the project in the global registry
+
 **Copy templates** from installed location to `.specify/templates/`:
 ```bash
 cp ~/.specflow/templates/*.md .specify/templates/
diff --git a/commands/flow.merge.md b/commands/flow.merge.md
index dfaaab5..33d743a 100644
--- a/commands/flow.merge.md
+++ b/commands/flow.merge.md
@@ -69,7 +69,37 @@ if [[ "$CURRENT_BRANCH" == "main" || "$CURRENT_BRANCH" == "master" ]]; then
 fi
 ```
 
-**Check for merge conflicts with main:**
+**Check for git remote (critical for push/PR/merge):**
+
+```bash
+REMOTE_URL=$(git remote get-url origin 2>/dev/null || echo "")
+```
+
+If `REMOTE_URL` is empty, use `AskUserQuestion` to offer local-only fallback:
+
+```json
+{
+  "questions": [{
+    "question": "No git remote is configured. The merge workflow normally pushes to a remote and creates a PR.\n\nWould you like to proceed with a local-only merge instead? This will:\n- Close the phase and update ROADMAP.md\n- Commit all changes locally\n- Skip push, PR, and remote merge\n\nYou can push manually later or configure a remote.",
+    "header": "No Remote",
+    "options": [
+      {"label": "Local merge (Recommended)", "description": "Close phase locally - commit changes but skip push/PR/merge"},
+      {"label": "Cancel", "description": "Stop and configure git remote first"}
+    ],
+    "multiSelect": false
+  }]
+}
+```
+
+**Handle response:**
+- **Local merge**: Set `LOCAL_ONLY_MODE=true` and continue. Skip steps 5-9 (push/PR/merge), but still do steps 1-4 and 10-11.
+- **Cancel**: Return with `status: "cancelled"` and message about configuring remote.
+
+**If remote is configured**, proceed normally with `LOCAL_ONLY_MODE=false`.
+
+**Check for merge conflicts with main (skip if LOCAL_ONLY_MODE):**
+
+If `LOCAL_ONLY_MODE=false`:
 
 ```bash
 # Fetch latest main to ensure we have current state
@@ -279,13 +309,17 @@ Co-Authored-By: Claude Opus 4.5 <noreply@anthropic.com>"
 
 Use TodoWrite: mark [MERGE] COMMIT complete, mark [MERGE] PUSH in_progress.
 
-### 5. Push Branch
+### 5. Push Branch (Skip if LOCAL_ONLY_MODE)
+
+**If LOCAL_ONLY_MODE=true**: Skip to step 10 (Memory Integration). Mark [MERGE] PUSH, [MERGE] MERGE as skipped.
+
+**If LOCAL_ONLY_MODE=false**:
 
 ```bash
 git push -u origin "$CURRENT_BRANCH"
 ```
 
-### 6. Create Pull Request
+### 6. Create Pull Request (Skip if LOCAL_ONLY_MODE)
 
 **Check for existing PR:**
 
@@ -307,7 +341,7 @@ if [[ -z "$PR_URL" ]]; then
 fi
 ```
 
-### 7. Handle --pr-only
+### 7. Handle --pr-only (Skip if LOCAL_ONLY_MODE)
 
 ```bash
 if [[ "$ARGUMENTS" == *"--pr-only"* ]]; then
@@ -321,13 +355,17 @@ fi
 
 Use TodoWrite: mark [MERGE] PUSH complete, mark [MERGE] MERGE in_progress.
 
-### 8. Merge PR
+### 8. Merge PR (Skip if LOCAL_ONLY_MODE)
 
 ```bash
 gh pr merge --squash --delete-branch
 ```
 
-### 9. Switch to Main
+### 9. Switch to Main (Skip if LOCAL_ONLY_MODE)
+
+**If LOCAL_ONLY_MODE=true**: Stay on feature branch. Phase is closed and committed locally.
+
+**If LOCAL_ONLY_MODE=false**:
 
 ```bash
 git checkout main
@@ -397,6 +435,19 @@ Use TodoWrite: mark [MERGE] MEMORY complete, mark [MERGE] DONE in_progress.
 
 ### 11. Done
 
+**If LOCAL_ONLY_MODE=true**:
+```text
+✓ Closed phase $PHASE_NUMBER (local only)
+✓ Committed changes locally
+⊘ Skipped push/PR/merge (no remote configured)
+✓ Integrated archive into memory
+
+Phase is complete locally. To push later:
+1. Configure remote: git remote add origin <url>
+2. Push: git push -u origin $CURRENT_BRANCH
+```
+
+**If LOCAL_ONLY_MODE=false**:
 ```text
 ✓ Closed phase $PHASE_NUMBER
 ✓ Committed changes
@@ -414,6 +465,7 @@ Use TodoWrite: mark [MERGE] DONE complete.
 | Error | Response |
 |-------|----------|
 | Not on feature branch | "Switch to a feature branch first" |
+| No git remote | **Ask user** - offer local-only merge or cancel |
 | Uncommitted changes | **Ask user** - show changes, offer: commit with phase, stash, review, or abort |
 | Phase close fails | Show CLI error message |
 | Merge fails | "Check for merge conflicts or required reviews" |
diff --git a/docs/cli-reference.md b/docs/cli-reference.md
index 808837c..efb857d 100644
--- a/docs/cli-reference.md
+++ b/docs/cli-reference.md
@@ -16,6 +16,30 @@ All commands support `--help` for detailed usage and `--json` for machine-readab
 
 These are the primary commands for SpecFlow v3.0. They provide rich, contextual output designed for efficient Claude Code integration.
 
+### init - Initialize New Project
+
+Create a new SpecFlow project with full 3.0 compliance.
+
+```bash
+specflow init                         # Initialize in current directory
+specflow init --name "My Project"     # With custom project name
+specflow init --force                 # Reinitialize existing project
+specflow project init                 # Same as specflow init
+```
+
+**Creates:**
+- `.specflow/` - Operational state (orchestration-state.json, manifest.json, workflows/)
+- `.specify/` - Repository knowledge (memory/, templates/, phases/, archive/, history/)
+- `ROADMAP.md` - Phase overview template
+- `BACKLOG.md` - Deferred items template
+- `specs/` - Active phase artifacts directory
+
+**Output includes:**
+- Created directories and files
+- Synced templates
+- Registry status
+- Next steps
+
 ### status - Complete Project Status
 
 Get comprehensive project status in a single call.
@@ -201,9 +225,9 @@ The following bash commands are deprecated in v3.0. They will display an error w
 | `specflow tasks mark` | `specflow mark` |
 | `specflow gate` | `specflow check --gate` |
 | `specflow reconcile` | `specflow check --fix` |
-| `specflow scaffold` | Use `/flow.init` slash command |
+| `specflow scaffold` | `specflow init` (CLI) then `/flow.init` (AI discovery) |
 | `specflow memory` | Use `/flow.memory` slash command |
-| `specflow templates` | Use `/flow.init` slash command |
+| `specflow templates` | `specflow init` syncs templates automatically |
 | `specflow dashboard` | (Removed in v3.0) |
 | `specflow git` | Use git directly |
 | `specflow roadmap` | Use `/flow.roadmap` slash command |
@@ -213,7 +237,8 @@ Running a deprecated command shows:
 ```
 ERROR: Command 'doctor' is deprecated in SpecFlow v3.0
 
-The TypeScript CLI replaces bash scripts with 6 smart commands:
+The TypeScript CLI replaces bash scripts with 7 smart commands:
+  specflow init     - Initialize new project (creates structure)
   specflow status   - Complete project status (replaces: context, doctor, detect)
   specflow next     - Next task with context (replaces: tasks incomplete)
   specflow mark     - Mark tasks done (replaces: tasks mark)
@@ -221,3 +246,44 @@ The TypeScript CLI replaces bash scripts with 6 smart commands:
   specflow state    - State operations (same as before)
   specflow phase    - Phase lifecycle (open/close/status/defer/add)
 ```
+
+---
+
+## Initialization Paths
+
+### New Projects
+
+For greenfield projects, the recommended initialization sequence is:
+
+```bash
+# Step 1: Create project structure (CLI)
+specflow init
+
+# Step 2: Run discovery interview (Claude Code)
+/flow.init
+
+# Step 3: Start development (Claude Code)
+/flow.orchestrate
+```
+
+- `specflow init` creates the directory structure, templates, and state files
+- `/flow.init` runs an AI-guided discovery interview and generates memory documents
+- `/flow.orchestrate` begins the development workflow
+
+### Existing v1.0/v2.0 Projects
+
+For projects migrating from older SpecFlow versions:
+
+```bash
+# Step 1: Detect and migrate (CLI)
+specflow upgrade
+
+# Step 2: Intelligent analysis (Claude Code)
+/flow.doctor migrate
+
+# Step 3: Validate and repair (CLI)
+specflow check --fix
+
+# Step 4: Resume development (Claude Code)
+/flow.orchestrate
+```
diff --git a/packages/cli/src/commands/check.ts b/packages/cli/src/commands/check.ts
index 52d60ea..da079dc 100644
--- a/packages/cli/src/commands/check.ts
+++ b/packages/cli/src/commands/check.ts
@@ -1,17 +1,22 @@
 import { Command } from 'commander';
-import { readFile, readdir, copyFile, mkdir } from 'node:fs/promises';
+import { readFile, readdir, copyFile, mkdir, writeFile, unlink } from 'node:fs/promises';
 import { join } from 'node:path';
 import { output } from '../lib/output.js';
-import { readState, writeState, setStateValue } from '../lib/state.js';
+import { readState, writeState, setStateValue, readRawState, writeRawState } from '../lib/state.js';
 import { readTasks, detectCircularDependencies } from '../lib/tasks.js';
 import { readRoadmap, getPhaseByNumber } from '../lib/roadmap.js';
 import { readFeatureChecklists, areAllChecklistsComplete } from '../lib/checklist.js';
 import { getProjectContext, resolveFeatureDir, getMissingArtifacts } from '../lib/context.js';
 import { runHealthCheck, type HealthIssue } from '../lib/health.js';
-import { findProjectRoot, pathExists, getStatePath, getMemoryDir, getTemplatesDir, getSystemTemplatesDir } from '../lib/paths.js';
+import { findProjectRoot, pathExists, getStatePath, getMemoryDir, getTemplatesDir, getSystemTemplatesDir, getHistoryDir, getSpecifyDir } from '../lib/paths.js';
 import { handleError, NotFoundError } from '../lib/errors.js';
 import type { OrchestrationState } from '@specflow/shared';
 
+/**
+ * Step index mapping for validation
+ */
+const STEP_INDEX_MAP: Record<string, number> = { design: 0, analyze: 1, implement: 2, verify: 3 };
+
 /**
  * Gate types
  */
@@ -392,8 +397,208 @@ async function applyFixes(
   const fixed: FixResult[] = [];
   const autoFixable = issues.filter(i => i.autoFixable);
 
+  // First pass: Fix STATE_SCHEMA_ERROR issues that prevent normal reads
+  const schemaErrors = autoFixable.filter(i => i.code === 'STATE_SCHEMA_ERROR');
+  if (schemaErrors.length > 0) {
+    try {
+      const rawResult = await readRawState(projectRoot);
+      if (rawResult.data && rawResult.zodErrors) {
+        const data = rawResult.data as Record<string, unknown>;
+        let fixCount = 0;
+
+        // Fix common schema issues in raw data
+        const orchestration = data.orchestration as Record<string, unknown> | undefined;
+        if (orchestration) {
+          const step = orchestration.step as Record<string, unknown> | undefined;
+          const phase = orchestration.phase as Record<string, unknown> | undefined;
+
+          // Fix step.index if it's a string
+          if (step && typeof step.index === 'string') {
+            const stepCurrent = step.current as string | undefined;
+            const correctIndex = stepCurrent && STEP_INDEX_MAP[stepCurrent] !== undefined
+              ? STEP_INDEX_MAP[stepCurrent]
+              : null;
+            step.index = correctIndex;
+            fixCount++;
+          }
+
+          // Fix step.current if invalid
+          const validSteps = ['design', 'analyze', 'implement', 'verify'];
+          if (step && step.current && !validSteps.includes(step.current as string)) {
+            step.current = null;
+            fixCount++;
+          }
+
+          // Fix step.status if invalid
+          const validStepStatuses = ['not_started', 'pending', 'in_progress', 'complete', 'failed', 'blocked', 'skipped'];
+          if (step && step.status && !validStepStatuses.includes(step.status as string)) {
+            step.status = 'not_started';
+            fixCount++;
+          }
+
+          // Fix phase.status if invalid
+          const validPhaseStatuses = ['not_started', 'in_progress', 'complete'];
+          if (phase && phase.status && !validPhaseStatuses.includes(phase.status as string)) {
+            phase.status = 'not_started';
+            fixCount++;
+          }
+        }
+
+        // Fix schema_version
+        if (data.schema_version !== '3.0') {
+          data.schema_version = '3.0';
+          fixCount++;
+        }
+
+        if (fixCount > 0) {
+          await writeRawState(data, projectRoot);
+          fixed.push({
+            code: 'STATE_SCHEMA_ERROR',
+            action: `Repaired ${fixCount} schema validation issue(s) in state file`,
+          });
+        }
+      }
+    } catch {
+      // Raw repair failed, continue with other fixes
+    }
+  }
+
   for (const issue of autoFixable) {
     try {
+      // Skip STATE_SCHEMA_ERROR - already handled above
+      if (issue.code === 'STATE_SCHEMA_ERROR') continue;
+
+      // === Schema validation fixes ===
+
+      if (issue.code === 'SCHEMA_VERSION_OUTDATED') {
+        const state = await readState(projectRoot);
+        const updated = { ...state, schema_version: '3.0' };
+        await writeState(updated as OrchestrationState, projectRoot);
+        fixed.push({
+          code: issue.code,
+          action: 'Updated schema_version to "3.0"',
+        });
+      }
+
+      if (issue.code === 'STEP_INDEX_TYPE_ERROR') {
+        const state = await readState(projectRoot);
+        const currentStep = state.orchestration?.step?.current;
+        // Convert to correct number based on step name, or 0 if unknown
+        const correctIndex = currentStep && STEP_INDEX_MAP[currentStep] !== undefined
+          ? STEP_INDEX_MAP[currentStep]
+          : 0;
+        const updated = setStateValue(state, 'orchestration.step.index', correctIndex);
+        await writeState(updated, projectRoot);
+        fixed.push({
+          code: issue.code,
+          action: `Converted step.index to number: ${correctIndex}`,
+        });
+      }
+
+      if (issue.code === 'STEP_CURRENT_INVALID') {
+        const state = await readState(projectRoot);
+        // Reset to null for invalid values like "idle"
+        const updated = setStateValue(state, 'orchestration.step.current', null);
+        await writeState(updated, projectRoot);
+        fixed.push({
+          code: issue.code,
+          action: 'Reset step.current to null',
+        });
+      }
+
+      if (issue.code === 'STEP_STATUS_INVALID') {
+        const state = await readState(projectRoot);
+        // Reset to not_started for invalid values like "idle"
+        const updated = setStateValue(state, 'orchestration.step.status', 'not_started');
+        await writeState(updated, projectRoot);
+        fixed.push({
+          code: issue.code,
+          action: 'Reset step.status to "not_started"',
+        });
+      }
+
+      if (issue.code === 'PHASE_STATUS_INVALID') {
+        const state = await readState(projectRoot);
+        // Reset to not_started for invalid values like "idle"
+        const updated = setStateValue(state, 'orchestration.phase.status', 'not_started');
+        await writeState(updated, projectRoot);
+        fixed.push({
+          code: issue.code,
+          action: 'Reset phase.status to "not_started"',
+        });
+      }
+
+      if (issue.code === 'STEP_INDEX_MISMATCH') {
+        const state = await readState(projectRoot);
+        const currentStep = state.orchestration?.step?.current;
+        if (currentStep && STEP_INDEX_MAP[currentStep] !== undefined) {
+          const correctIndex = STEP_INDEX_MAP[currentStep];
+          const updated = setStateValue(state, 'orchestration.step.index', correctIndex);
+          await writeState(updated, projectRoot);
+          fixed.push({
+            code: issue.code,
+            action: `Corrected step.index to ${correctIndex} (for "${currentStep}")`,
+          });
+        }
+      }
+
+      // === File structure fixes ===
+
+      if (issue.code === 'STATE_WRONG_LOCATION') {
+        const wrongPath = join(getSpecifyDir(projectRoot), 'orchestration-state.json');
+        await unlink(wrongPath);
+        fixed.push({
+          code: issue.code,
+          action: 'Removed duplicate state file from .specify/',
+        });
+      }
+
+      if (issue.code === 'NO_BACKLOG') {
+        const backlogPath = join(projectRoot, 'BACKLOG.md');
+        const backlogContent = `# Backlog
+
+> Items deferred for future consideration. Add items during \`/flow.verify\` or with \`specflow phase defer "item"\`.
+
+## Deferred Items
+
+<!-- Add deferred items here -->
+
+## Technical Debt
+
+<!-- Add tech debt items here -->
+
+## Future Considerations
+
+<!-- Add future ideas here -->
+`;
+        await writeFile(backlogPath, backlogContent, 'utf-8');
+        fixed.push({
+          code: issue.code,
+          action: 'Created BACKLOG.md template',
+        });
+      }
+
+      if (issue.code === 'NO_HISTORY') {
+        const historyDir = getHistoryDir(projectRoot);
+        await mkdir(historyDir, { recursive: true });
+        const historyPath = join(historyDir, 'HISTORY.md');
+        const historyContent = `# Phase History
+
+> Summaries of completed phases. Updated automatically by \`specflow phase close\`.
+
+---
+
+<!-- Completed phase summaries will be added here -->
+`;
+        await writeFile(historyPath, historyContent, 'utf-8');
+        fixed.push({
+          code: issue.code,
+          action: 'Created .specify/history/HISTORY.md template',
+        });
+      }
+
+      // === Existing fixes ===
+
       if (issue.code === 'TASKS_COMPLETE_STEP_IMPLEMENT') {
         const state = await readState(projectRoot);
         const updated = setStateValue(state, 'orchestration.step.current', 'verify');
diff --git a/packages/cli/src/commands/init.ts b/packages/cli/src/commands/init.ts
new file mode 100644
index 0000000..6f78bb2
--- /dev/null
+++ b/packages/cli/src/commands/init.ts
@@ -0,0 +1,15 @@
+import { Command } from 'commander';
+import { runProjectInit, type InitOptions } from './project/init.js';
+
+/**
+ * Top-level init command - alias for `specflow project init`
+ *
+ * This provides a convenient shorthand:
+ *   specflow init         → specflow project init
+ *   specflow init --force → specflow project init --force
+ */
+export const initCommand = new Command('init')
+  .description('Initialize a new SpecFlow project (alias for "project init")')
+  .option('--force', 'Reinitialize even if already initialized')
+  .option('--name <name>', 'Project name (defaults to directory name)')
+  .action(runProjectInit);
diff --git a/packages/cli/src/commands/project/index.ts b/packages/cli/src/commands/project/index.ts
new file mode 100644
index 0000000..f54a495
--- /dev/null
+++ b/packages/cli/src/commands/project/index.ts
@@ -0,0 +1,12 @@
+import { Command } from 'commander';
+import { init } from './init.js';
+
+/**
+ * Project command - manage SpecFlow project lifecycle
+ *
+ * Subcommands:
+ *   specflow project init        Initialize a new SpecFlow project
+ */
+export const projectCommand = new Command('project')
+  .description('Manage SpecFlow project lifecycle')
+  .addCommand(init);
diff --git a/packages/cli/src/commands/project/init.ts b/packages/cli/src/commands/project/init.ts
new file mode 100644
index 0000000..3074619
--- /dev/null
+++ b/packages/cli/src/commands/project/init.ts
@@ -0,0 +1,553 @@
+import { Command } from 'commander';
+import { mkdir, writeFile } from 'node:fs/promises';
+import { basename, join, resolve } from 'node:path';
+import chalk from 'chalk';
+import { createInitialState, writeState } from '../../lib/state.js';
+import {
+  getStatePath,
+  getManifestPath,
+  getSpecflowDir,
+  getSpecsDir,
+  getRoadmapPath,
+  pathExists,
+} from '../../lib/paths.js';
+import { registerProject } from '../../lib/registry.js';
+import {
+  setupFullScaffolding,
+  createScaffolding,
+  syncTemplates,
+  ensureHistoryFile,
+  ensureConstitution,
+} from '../../lib/scaffold.js';
+import { createV3Manifest } from '../../lib/migrate.js';
+import { output, success, info, warn, header } from '../../lib/output.js';
+import { handleError } from '../../lib/errors.js';
+
+/**
+ * Output structure for project init command with --json flag
+ */
+export interface ProjectInitOutput {
+  status: 'success' | 'error';
+  command: 'project init';
+  project: {
+    id: string;
+    name: string;
+    path: string;
+  };
+  created: {
+    specflowDir: boolean;
+    stateFile: boolean;
+    manifestFile: boolean;
+    workflowsDir: boolean;
+    specifyDirs: string[];
+    specsDir: boolean;
+    roadmap: boolean;
+    backlog: boolean;
+    history: boolean;
+    constitution: boolean;
+  };
+  templates: {
+    copied: string[];
+    skipped: string[];
+  };
+  registered: boolean;
+  alreadyInitialized: boolean;
+  error?: { message: string; hint: string };
+}
+
+/**
+ * Get current date in YYYY-MM-DD format
+ */
+function getCurrentDate(): string {
+  return new Date().toISOString().split('T')[0];
+}
+
+/**
+ * Create ROADMAP.md from template with project name substituted
+ */
+async function createRoadmap(projectPath: string, projectName: string): Promise<boolean> {
+  const roadmapPath = getRoadmapPath(projectPath);
+
+  if (pathExists(roadmapPath)) {
+    return false;
+  }
+
+  const content = `# ${projectName} Development Roadmap
+
+> **Source of Truth**: This document defines all feature phases, their order, and completion status.
+> Work proceeds through phases sequentially. Each phase produces a deployable increment.
+
+**Project**: ${projectName}
+**Created**: ${getCurrentDate()}
+**Schema Version**: 3.0 (ABBC numbering)
+**Status**: Active Development
+
+---
+
+## Phase Numbering
+
+Phases use **ABBC** format:
+
+- **A** = Milestone (0-9) - Major version or project stage
+- **BB** = Phase (01-99) - Sequential work within milestone
+- **C** = Hotfix (0-9) - Insert slot (0 = main phase, 1-9 = hotfixes/inserts)
+
+**Examples**:
+
+- \`0010\` = Milestone 0, Phase 01, no hotfix
+- \`0021\` = Hotfix 1 inserted after Phase 02
+- \`1010\` = Milestone 1, Phase 01, no hotfix
+
+This allows inserting urgent work without renumbering existing phases.
+
+---
+
+## Phase Overview
+
+| Phase | Name | Status | Verification Gate |
+| ----- | ---- | ------ | ----------------- |
+| 0010  | Initial Setup | ⬜ Not Started | Project scaffolding complete |
+
+**Legend**: ⬜ Not Started | 🔄 In Progress | ✅ Complete | **USER GATE** = Requires user verification
+
+---
+
+## Phase Details
+
+Phase details are stored in modular files:
+
+| Location                      | Content                      |
+| ----------------------------- | ---------------------------- |
+| \`.specify/phases/*.md\`        | Active/pending phase details |
+| \`.specify/history/HISTORY.md\` | Archived completed phases    |
+
+To view a specific phase:
+
+\`\`\`bash
+specflow phase show 0010
+\`\`\`
+
+To list all phases:
+
+\`\`\`bash
+specflow phase list
+specflow phase list --active
+specflow phase list --complete
+\`\`\`
+
+---
+
+## Phase Sizing Guidelines
+
+Each phase is designed to be:
+
+- **Completable** in a single agentic coding session (~200k tokens)
+- **Independently deployable** (no half-finished features)
+- **Verifiable** with clear success criteria
+- **Building** on previous phases
+
+If a phase is running long:
+
+1. Cut scope to MVP for that phase
+2. Document deferred items in \`specs/[phase]/checklists/deferred.md\`
+3. Prioritize verification gate requirements
+
+---
+
+## How to Use This Document
+
+### Starting a Phase
+
+\`\`\`
+/flow.orchestrate
+\`\`\`
+
+Or manually:
+
+\`\`\`
+/flow.design "Phase NNNN - [Phase Name]"
+\`\`\`
+
+### After Completing a Phase
+
+1. Run \`/flow.verify\` to verify the phase is complete
+2. Run \`/flow.merge\` to close, push, and merge (updates ROADMAP automatically)
+3. If USER GATE: get explicit user verification before proceeding
+
+### Adding New Phases
+
+Use SpecFlow commands:
+
+\`\`\`bash
+specflow phase add 0025 "new-phase-name"
+specflow phase add 0025 "new-phase-name" --user-gate --gate "Description"
+specflow phase open --hotfix "Urgent Fix"
+\`\`\`
+`;
+
+  try {
+    await writeFile(roadmapPath, content);
+    return true;
+  } catch {
+    return false;
+  }
+}
+
+/**
+ * Create BACKLOG.md from template
+ */
+async function createBacklog(projectPath: string, projectName: string): Promise<boolean> {
+  const backlogPath = join(resolve(projectPath), 'BACKLOG.md');
+
+  if (pathExists(backlogPath)) {
+    return false;
+  }
+
+  const currentDate = getCurrentDate();
+  const content = `# ${projectName} Backlog
+
+> Items deferred from phases without a specific target phase assignment.
+> Review periodically to schedule into upcoming phases.
+
+**Created**: ${currentDate}
+**Last Updated**: ${currentDate}
+
+---
+
+## Priority Legend
+
+| Priority | Meaning | Criteria |
+|----------|---------|----------|
+| **P1** | High | Core functionality, significant user value |
+| **P2** | Medium | Nice-to-have, quality of life improvements |
+| **P3** | Low | Future considerations, can wait indefinitely |
+
+---
+
+## Backlog Items
+
+### P1 - High Priority
+
+| Item | Source | Reason Deferred | Notes |
+|------|--------|-----------------|-------|
+| (none) | - | - | - |
+
+### P2 - Medium Priority
+
+| Item | Source | Reason Deferred | Notes |
+|------|--------|-----------------|-------|
+| (none) | - | - | - |
+
+### P3 - Low Priority
+
+| Item | Source | Reason Deferred | Notes |
+|------|--------|-----------------|-------|
+| (none) | - | - | - |
+
+---
+
+## Scheduling Guidelines
+
+When planning a new phase, review this backlog:
+
+1. **Check P1 items** - Should any be scheduled for the next phase?
+2. **Look for synergies** - Do any backlog items align with planned work?
+3. **Update target phases** - Move items from Backlog to specific phases as appropriate
+4. **Clean up** - Remove completed items, update priorities as project evolves
+
+---
+
+## History
+
+| Date | Action | Items Affected |
+|------|--------|----------------|
+| ${currentDate} | Created backlog | Initial setup |
+`;
+
+  try {
+    await writeFile(backlogPath, content);
+    return true;
+  } catch {
+    return false;
+  }
+}
+
+/**
+ * Create manifest.json
+ */
+async function createManifest(projectPath: string, projectName: string): Promise<boolean> {
+  const manifestPath = getManifestPath(projectPath);
+
+  if (pathExists(manifestPath)) {
+    return false;
+  }
+
+  const manifest = createV3Manifest(projectName);
+  await writeFile(manifestPath, JSON.stringify(manifest, null, 2) + '\n');
+  return true;
+}
+
+/**
+ * Create workflows directory
+ */
+async function createWorkflowsDir(projectPath: string): Promise<boolean> {
+  const workflowsPath = join(getSpecflowDir(projectPath), 'workflows');
+
+  if (pathExists(workflowsPath)) {
+    return false;
+  }
+
+  await mkdir(workflowsPath, { recursive: true });
+  return true;
+}
+
+/**
+ * Create specs directory
+ */
+async function createSpecsDir(projectPath: string): Promise<boolean> {
+  const specsPath = getSpecsDir(projectPath);
+
+  if (pathExists(specsPath)) {
+    return false;
+  }
+
+  await mkdir(specsPath, { recursive: true });
+
+  // Create a .gitkeep file to ensure the directory is tracked
+  await writeFile(join(specsPath, '.gitkeep'), '');
+  return true;
+}
+
+/**
+ * Format human-readable output for project init command
+ */
+function formatHumanReadable(result: ProjectInitOutput): string {
+  if (result.status === 'error' && result.error) {
+    return `Error: ${result.error.message}\nHint: ${result.error.hint}`;
+  }
+
+  const lines: string[] = [];
+
+  lines.push(chalk.bold.green('✓ Initialized SpecFlow project'));
+  lines.push('');
+  lines.push(chalk.bold('Project'));
+  lines.push(`  Name: ${result.project.name}`);
+  lines.push(`  Path: ${result.project.path}`);
+  lines.push('');
+
+  lines.push(chalk.bold('Created'));
+
+  // .specflow/ items
+  if (result.created.specflowDir) {
+    lines.push(`  ${chalk.green('✓')} .specflow/`);
+  }
+  if (result.created.stateFile) {
+    lines.push(`  ${chalk.green('✓')} .specflow/orchestration-state.json`);
+  }
+  if (result.created.manifestFile) {
+    lines.push(`  ${chalk.green('✓')} .specflow/manifest.json`);
+  }
+  if (result.created.workflowsDir) {
+    lines.push(`  ${chalk.green('✓')} .specflow/workflows/`);
+  }
+
+  // .specify/ items
+  if (result.created.specifyDirs.length > 0) {
+    for (const dir of result.created.specifyDirs) {
+      lines.push(`  ${chalk.green('✓')} ${dir}`);
+    }
+  }
+
+  // Core files
+  if (result.created.history) {
+    lines.push(`  ${chalk.green('✓')} .specify/history/HISTORY.md`);
+  }
+  if (result.created.constitution) {
+    lines.push(`  ${chalk.green('✓')} .specify/memory/constitution.md`);
+  }
+  if (result.created.roadmap) {
+    lines.push(`  ${chalk.green('✓')} ROADMAP.md`);
+  }
+  if (result.created.backlog) {
+    lines.push(`  ${chalk.green('✓')} BACKLOG.md`);
+  }
+  if (result.created.specsDir) {
+    lines.push(`  ${chalk.green('✓')} specs/`);
+  }
+
+  // Templates
+  if (result.templates.copied.length > 0) {
+    lines.push('');
+    lines.push(chalk.bold('Templates Synced'));
+    for (const template of result.templates.copied) {
+      lines.push(`  ${chalk.green('✓')} ${template}`);
+    }
+  }
+
+  // Registration
+  if (result.registered) {
+    lines.push('');
+    lines.push(`${chalk.green('✓')} Registered in global project registry`);
+  }
+
+  lines.push('');
+  lines.push(chalk.bold('Next Steps'));
+  lines.push('  1. Edit ROADMAP.md to define your phases');
+  lines.push('  2. Edit .specify/memory/constitution.md with project principles');
+  lines.push('  3. Run /flow.orchestrate to start your first phase');
+
+  return lines.join('\n');
+}
+
+/**
+ * Options for the init action
+ */
+export interface InitOptions {
+  force?: boolean;
+  name?: string;
+}
+
+/**
+ * Shared action handler for project initialization
+ * Used by both `specflow project init` and `specflow init`
+ */
+export async function runProjectInit(options: InitOptions): Promise<void> {
+  const projectPath = resolve(process.cwd());
+  const projectName = options.name ?? basename(projectPath);
+    const statePath = getStatePath(projectPath);
+
+    // Initialize result
+    const result: ProjectInitOutput = {
+      status: 'error',
+      command: 'project init',
+      project: {
+        id: '',
+        name: projectName,
+        path: projectPath,
+      },
+      created: {
+        specflowDir: false,
+        stateFile: false,
+        manifestFile: false,
+        workflowsDir: false,
+        specifyDirs: [],
+        specsDir: false,
+        roadmap: false,
+        backlog: false,
+        history: false,
+        constitution: false,
+      },
+      templates: {
+        copied: [],
+        skipped: [],
+      },
+      registered: false,
+      alreadyInitialized: false,
+    };
+
+    try {
+      // Check if already initialized
+      const alreadyHasState = pathExists(statePath);
+      if (alreadyHasState && !options.force) {
+        result.alreadyInitialized = true;
+        result.error = {
+          message: 'Project already initialized',
+          hint: 'Use --force to reinitialize',
+        };
+        output(result, `${chalk.yellow('⚠')} Project already initialized. Use --force to reinitialize.`);
+        process.exitCode = 1;
+        return;
+      }
+
+      // 1. Create .specflow/ directory
+      const specflowDir = getSpecflowDir(projectPath);
+      if (!pathExists(specflowDir)) {
+        await mkdir(specflowDir, { recursive: true });
+        result.created.specflowDir = true;
+      }
+
+      // 2. Create orchestration-state.json
+      const state = createInitialState(projectName, projectPath);
+      result.project.id = state.project.id;
+      await writeState(state, projectPath);
+      result.created.stateFile = true;
+
+      // 3. Create manifest.json
+      result.created.manifestFile = await createManifest(projectPath, projectName);
+
+      // 4. Create workflows/ directory
+      result.created.workflowsDir = await createWorkflowsDir(projectPath);
+
+      // 5. Create .specify/ scaffolding
+      const scaffoldResult = await createScaffolding(projectPath);
+      result.created.specifyDirs = scaffoldResult.created;
+
+      // 6. Sync templates
+      const templatesResult = await syncTemplates(projectPath);
+      result.templates.copied = templatesResult.copied;
+      result.templates.skipped = templatesResult.skipped;
+
+      // 7. Create HISTORY.md
+      result.created.history = await ensureHistoryFile(projectPath);
+
+      // 8. Create constitution.md
+      result.created.constitution = await ensureConstitution(projectPath);
+
+      // 9. Create ROADMAP.md
+      result.created.roadmap = await createRoadmap(projectPath, projectName);
+
+      // 10. Create BACKLOG.md
+      result.created.backlog = await createBacklog(projectPath, projectName);
+
+      // 11. Create specs/ directory
+      result.created.specsDir = await createSpecsDir(projectPath);
+
+      // 12. Register in global registry
+      registerProject(state.project.id, projectName, projectPath);
+      result.registered = true;
+
+      // Success
+      result.status = 'success';
+
+      output(result, formatHumanReadable(result));
+    } catch (err) {
+      result.error = {
+        message: err instanceof Error ? err.message : 'Unknown error',
+        hint: 'Check the error message for details',
+      };
+      output(result, `Error: ${result.error.message}\nHint: ${result.error.hint}`);
+      process.exitCode = 1;
+    }
+}
+
+/**
+ * Initialize a new SpecFlow project with full compliance
+ *
+ * Creates:
+ *   .specflow/
+ *     orchestration-state.json
+ *     manifest.json
+ *     workflows/
+ *   .specify/
+ *     memory/
+ *       constitution.md
+ *     templates/
+ *     phases/
+ *     archive/
+ *     history/
+ *       HISTORY.md
+ *     discovery/
+ *   ROADMAP.md
+ *   BACKLOG.md
+ *   specs/
+ *
+ * Examples:
+ *   specflow project init
+ *   specflow project init --force
+ *   specflow project init --name "My Project"
+ */
+export const init = new Command('init')
+  .description('Initialize a new SpecFlow project with full 3.0 compliance')
+  .option('--force', 'Reinitialize even if already initialized')
+  .option('--name <name>', 'Project name (defaults to directory name)')
+  .action(runProjectInit);
diff --git a/packages/cli/src/commands/upgrade.ts b/packages/cli/src/commands/upgrade.ts
index a4548b9..945a7f6 100644
--- a/packages/cli/src/commands/upgrade.ts
+++ b/packages/cli/src/commands/upgrade.ts
@@ -218,8 +218,11 @@ async function runUpgrade(options: {
 
   // Handle uninitialized repos
   if (detection.version === 'uninitialized') {
-    result.errors.push('No SDD artifacts found. Run /flow.init to initialize a new project.');
-    result.nextSteps = ['Run /flow.init to initialize this project'];
+    result.errors.push('No SpecFlow artifacts found. Run "specflow init" to create project structure.');
+    result.nextSteps = [
+      'Run "specflow init" to create project structure',
+      'Then run /flow.init for AI-guided discovery (optional)',
+    ];
     return result;
   }
 
@@ -407,8 +410,8 @@ function formatHumanReadable(result: UpgradeOutput): string {
 
   // Handle special cases
   if (result.detection.version === 'uninitialized') {
-    lines.push(chalk.yellow('No SDD artifacts found.'));
-    lines.push('Run /flow.init to initialize a new project.');
+    lines.push(chalk.yellow('No SpecFlow artifacts found.'));
+    lines.push('Run "specflow init" to create project structure.');
     return lines.join('\n');
   }
 
diff --git a/packages/cli/src/index.ts b/packages/cli/src/index.ts
index e716636..a86c946 100644
--- a/packages/cli/src/index.ts
+++ b/packages/cli/src/index.ts
@@ -5,7 +5,9 @@ import { statusCommand } from './commands/status.js';
 import { nextCommand } from './commands/next.js';
 import { markCommand } from './commands/mark.js';
 import { checkCommand } from './commands/check.js';
+import { initCommand } from './commands/init.js';
 import { phaseCommand } from './commands/phase/index.js';
+import { projectCommand } from './commands/project/index.js';
 import { upgradeCommand } from './commands/upgrade.js';
 import { workflowCommand } from './commands/workflow/index.js';
 import { templatesCommand } from './commands/templates.js';
@@ -31,7 +33,9 @@ program.addCommand(statusCommand);
 program.addCommand(nextCommand);
 program.addCommand(markCommand);
 program.addCommand(checkCommand);
+program.addCommand(initCommand);
 program.addCommand(phaseCommand);
+program.addCommand(projectCommand);
 program.addCommand(upgradeCommand);
 program.addCommand(workflowCommand);
 program.addCommand(templatesCommand);
diff --git a/packages/cli/src/lib/health.ts b/packages/cli/src/lib/health.ts
index 15f1e4c..ae4a3ac 100644
--- a/packages/cli/src/lib/health.ts
+++ b/packages/cli/src/lib/health.ts
@@ -1,7 +1,7 @@
 import { exec } from 'node:child_process';
 import { promisify } from 'node:util';
 import { join } from 'node:path';
-import { readFile } from 'node:fs/promises';
+import { readFile, readdir } from 'node:fs/promises';
 import { z } from 'zod';
 import {
   findProjectRoot,
@@ -11,14 +11,32 @@ import {
   getMemoryDir,
   getTemplatesDir,
   getSystemTemplatesDir,
+  getSpecsDir,
+  getArchiveDir,
+  getHistoryDir,
+  getPhasesDir,
+  getSpecifyDir,
   pathExists,
 } from './paths.js';
-import { readState } from './state.js';
+import { readState, readRawState } from './state.js';
 import { readRoadmap, getPhaseByNumber } from './roadmap.js';
 import { getProjectContext, getMissingArtifacts, resolveFeatureDir } from './context.js';
 import { readTasks } from './tasks.js';
 import type { OrchestrationState } from '@specflow/shared';
 
+/**
+ * Valid enum values for schema validation
+ */
+const VALID_STEP_NAMES = ['design', 'analyze', 'implement', 'verify'] as const;
+const VALID_STEP_STATUSES = ['not_started', 'pending', 'in_progress', 'complete', 'failed', 'blocked', 'skipped'] as const;
+const VALID_PHASE_STATUSES = ['not_started', 'in_progress', 'complete'] as const;
+const STEP_INDEX_MAP: Record<string, number> = { design: 0, analyze: 1, implement: 2, verify: 3 };
+
+/**
+ * ABBC naming pattern - 4 digits (e.g., 0010, 0020, 1015)
+ */
+const ABBC_PATTERN = /^\d{4}-/;
+
 /**
  * Zod schema for manifest.json validation
  */
@@ -115,8 +133,8 @@ async function collectIssues(projectPath?: string): Promise<HealthIssue[]> {
       code: 'NO_STATE',
       severity: 'error',
       message: 'No state file found',
-      fix: 'Run "specflow phase open <number>" to start a phase, or "specflow state set" to initialize',
-      autoFixable: true,
+      fix: 'Run "specflow init" to initialize the project',
+      autoFixable: false, // Requires full project setup, not just state file
     });
     return issues; // Can't check further without state
   }
@@ -126,14 +144,218 @@ async function collectIssues(projectPath?: string): Promise<HealthIssue[]> {
   try {
     state = await readState(root);
   } catch (err) {
+    // Try to read raw state for better diagnostics
+    const rawResult = await readRawState(root);
+    if (rawResult.zodErrors && rawResult.zodErrors.length > 0) {
+      // Provide specific error messages for each Zod validation issue
+      for (const zodIssue of rawResult.zodErrors.slice(0, 5)) {
+        const path = zodIssue.path.join('.');
+        issues.push({
+          code: 'STATE_SCHEMA_ERROR',
+          severity: 'error',
+          message: `${path}: ${zodIssue.message}`,
+          fix: 'Run "specflow check --fix" to attempt auto-repair',
+          autoFixable: true,
+        });
+      }
+      if (rawResult.zodErrors.length > 5) {
+        issues.push({
+          code: 'STATE_SCHEMA_ERROR',
+          severity: 'error',
+          message: `... and ${rawResult.zodErrors.length - 5} more validation errors`,
+          autoFixable: false,
+        });
+      }
+    } else {
+      issues.push({
+        code: 'STATE_INVALID',
+        severity: 'error',
+        message: rawResult.error || 'State file is corrupted or invalid',
+        fix: 'Run "specflow state reset" to reset state, or manually repair .specflow/orchestration-state.json',
+        autoFixable: false,
+      });
+    }
+    return issues;
+  }
+
+  // === NEW: Schema validation checks ===
+
+  // Check schema_version
+  if (state.schema_version !== '3.0') {
     issues.push({
-      code: 'STATE_INVALID',
+      code: 'SCHEMA_VERSION_OUTDATED',
       severity: 'error',
-      message: 'State file is corrupted or invalid',
-      fix: 'Run "specflow state reset" to reset state, or manually repair .specflow/orchestration-state.json',
-      autoFixable: false, // Requires manual intervention to preserve data
+      message: `schema_version is "${state.schema_version}", expected "3.0"`,
+      fix: 'Run "specflow check --fix" to update schema version',
+      autoFixable: true,
     });
-    return issues;
+  }
+
+  // Check step.index is a number (not string)
+  const stepIndex = state.orchestration?.step?.index;
+  if (stepIndex !== null && stepIndex !== undefined && typeof stepIndex !== 'number') {
+    issues.push({
+      code: 'STEP_INDEX_TYPE_ERROR',
+      severity: 'error',
+      message: `step.index is "${typeof stepIndex}" ("${stepIndex}"), must be a number`,
+      fix: 'Run "specflow check --fix" to convert to correct type',
+      autoFixable: true,
+    });
+  }
+
+  // Check step.current is valid enum or null
+  const stepCurrent = state.orchestration?.step?.current;
+  if (stepCurrent !== null && stepCurrent !== undefined) {
+    if (!VALID_STEP_NAMES.includes(stepCurrent as typeof VALID_STEP_NAMES[number])) {
+      issues.push({
+        code: 'STEP_CURRENT_INVALID',
+        severity: 'error',
+        message: `step.current is "${stepCurrent}", must be one of: ${VALID_STEP_NAMES.join(', ')} (or null)`,
+        fix: 'Run "specflow check --fix" to reset to valid value',
+        autoFixable: true,
+      });
+    }
+  }
+
+  // Check step.status is valid enum
+  const stepStatus = state.orchestration?.step?.status;
+  if (stepStatus !== null && stepStatus !== undefined) {
+    if (!VALID_STEP_STATUSES.includes(stepStatus as typeof VALID_STEP_STATUSES[number])) {
+      issues.push({
+        code: 'STEP_STATUS_INVALID',
+        severity: 'error',
+        message: `step.status is "${stepStatus}", must be one of: ${VALID_STEP_STATUSES.join(', ')}`,
+        fix: 'Run "specflow check --fix" to reset to valid value',
+        autoFixable: true,
+      });
+    }
+  }
+
+  // Check phase.status is valid enum
+  const phaseStatus = state.orchestration?.phase?.status;
+  if (phaseStatus !== null && phaseStatus !== undefined) {
+    if (!VALID_PHASE_STATUSES.includes(phaseStatus as typeof VALID_PHASE_STATUSES[number])) {
+      issues.push({
+        code: 'PHASE_STATUS_INVALID',
+        severity: 'error',
+        message: `phase.status is "${phaseStatus}", must be one of: ${VALID_PHASE_STATUSES.join(', ')}`,
+        fix: 'Run "specflow check --fix" to reset to valid value',
+        autoFixable: true,
+      });
+    }
+  }
+
+  // Check step.index matches step.current (if both set)
+  if (stepCurrent && typeof stepIndex === 'number') {
+    const expectedIndex = STEP_INDEX_MAP[stepCurrent];
+    if (expectedIndex !== undefined && stepIndex !== expectedIndex) {
+      issues.push({
+        code: 'STEP_INDEX_MISMATCH',
+        severity: 'warning',
+        message: `step.index is ${stepIndex} but step.current is "${stepCurrent}" (expected index ${expectedIndex})`,
+        fix: 'Run "specflow check --fix" to correct index',
+        autoFixable: true,
+      });
+    }
+  }
+
+  // === NEW: File structure checks ===
+
+  // Check for state file in wrong location (.specify/)
+  const wrongStatePath = join(getSpecifyDir(root), 'orchestration-state.json');
+  if (pathExists(wrongStatePath)) {
+    issues.push({
+      code: 'STATE_WRONG_LOCATION',
+      severity: 'warning',
+      message: 'State file found in .specify/ (should only be in .specflow/)',
+      fix: 'Run "specflow check --fix" to remove duplicate, or manually delete .specify/orchestration-state.json',
+      autoFixable: true,
+    });
+  }
+
+  // Check BACKLOG.md exists
+  const backlogPath = join(root, 'BACKLOG.md');
+  if (!pathExists(backlogPath)) {
+    issues.push({
+      code: 'NO_BACKLOG',
+      severity: 'info',
+      message: 'No BACKLOG.md found',
+      fix: 'Run "specflow check --fix" to create BACKLOG.md template',
+      autoFixable: true,
+    });
+  }
+
+  // Check HISTORY.md exists
+  const historyDir = getHistoryDir(root);
+  const historyPath = join(historyDir, 'HISTORY.md');
+  if (!pathExists(historyPath)) {
+    issues.push({
+      code: 'NO_HISTORY',
+      severity: 'info',
+      message: 'No .specify/history/HISTORY.md found',
+      fix: 'Run "specflow check --fix" to create HISTORY.md template',
+      autoFixable: true,
+    });
+  }
+
+  // Check specs/ folder for ABC naming (should be ABBC)
+  const specsDir = getSpecsDir(root);
+  if (pathExists(specsDir)) {
+    try {
+      const specFolders = await readdir(specsDir, { withFileTypes: true });
+      const abcFolders = specFolders
+        .filter(d => d.isDirectory())
+        .filter(d => /^\d{3}-/.test(d.name) && !ABBC_PATTERN.test(d.name))
+        .map(d => d.name);
+
+      if (abcFolders.length > 0) {
+        issues.push({
+          code: 'ABC_NAMING_FOUND',
+          severity: 'warning',
+          message: `Found ${abcFolders.length} phase folder(s) with old ABC naming: ${abcFolders.slice(0, 3).join(', ')}${abcFolders.length > 3 ? '...' : ''}`,
+          fix: 'Rename folders from ABC (001-name) to ABBC (0010-name) format',
+          autoFixable: false, // Requires careful migration
+        });
+      }
+    } catch {
+      // Can't read specs dir
+    }
+  }
+
+  // Check for completed phases still in specs/ (should be archived)
+  if (pathExists(specsDir) && state.actions?.history) {
+    try {
+      const specFolders = await readdir(specsDir, { withFileTypes: true });
+      const specFolderNames = specFolders.filter(d => d.isDirectory()).map(d => d.name);
+
+      const completedPhases = state.actions.history
+        .filter(h => h.type === 'phase_completed' && h.phase_number)
+        .map(h => h.phase_number);
+
+      const unarchived: string[] = [];
+      for (const folder of specFolderNames) {
+        // Extract phase number from folder name (e.g., "0010-name" -> "0010")
+        const match = folder.match(/^(\d{3,4})-/);
+        if (match) {
+          const phaseNum = match[1].padStart(4, '0'); // Normalize to 4 digits
+          if (completedPhases.includes(phaseNum) || completedPhases.includes(match[1])) {
+            unarchived.push(folder);
+          }
+        }
+      }
+
+      if (unarchived.length > 0) {
+        issues.push({
+          code: 'COMPLETED_PHASE_NOT_ARCHIVED',
+          severity: 'warning',
+          message: `Found ${unarchived.length} completed phase(s) still in specs/: ${unarchived.slice(0, 3).join(', ')}${unarchived.length > 3 ? '...' : ''}`,
+          fix: 'Move completed phases to .specify/archive/ with "specflow phase archive <number>"',
+          autoFixable: false, // Requires careful migration
+        });
+      }
+    } catch {
+      // Can't check
+    }
   }
 
   // Check ROADMAP.md
@@ -310,7 +532,7 @@ async function collectIssues(projectPath?: string): Promise<HealthIssue[]> {
             severity: 'warning',
             message: `Current branch "${currentBranch}" doesn't match state "${expectedBranch}"`,
             fix: `Run "git checkout ${expectedBranch}" to switch branches`,
-            autoFixable: true,
+            autoFixable: false, // Don't auto-switch branches - could lose uncommitted work
           });
         }
       }
@@ -365,13 +587,13 @@ async function collectIssues(projectPath?: string): Promise<HealthIssue[]> {
     }
   }
 
-  // Check step status consistency
-  const stepStatus = state.orchestration?.step?.status;
-  if (stepStatus === 'blocked' || stepStatus === 'failed') {
+  // Check step status consistency (blocked/failed)
+  const currentStepStatus = state.orchestration?.step?.status;
+  if (currentStepStatus === 'blocked' || currentStepStatus === 'failed') {
     issues.push({
       code: 'STEP_BLOCKED',
       severity: 'warning',
-      message: `Current step is ${stepStatus}`,
+      message: `Current step is ${currentStepStatus}`,
       fix: 'Review blockers and retry, or skip with "specflow state set orchestration.step.status=in_progress"',
       autoFixable: false,
     });
diff --git a/packages/cli/src/lib/state.ts b/packages/cli/src/lib/state.ts
index 6741f76..8a857d3 100644
--- a/packages/cli/src/lib/state.ts
+++ b/packages/cli/src/lib/state.ts
@@ -1,6 +1,7 @@
 import { readFile, writeFile, mkdir, rename, unlink } from 'node:fs/promises';
 import { dirname, join } from 'node:path';
 import { randomUUID } from 'node:crypto';
+import { z } from 'zod';
 import type { OrchestrationState } from '@specflow/shared';
 import { OrchestrationStateSchema } from '@specflow/shared';
 import { getStatePath, pathExists } from './paths.js';
@@ -10,6 +11,20 @@ import { NotFoundError, StateError, ValidationError } from './errors.js';
  * State file operations for SpecFlow
  */
 
+/**
+ * Format Zod error for human-readable output
+ */
+function formatZodError(error: z.ZodError): string {
+  const issues = error.issues.slice(0, 3).map(issue => {
+    const path = issue.path.join('.');
+    return `  - ${path}: ${issue.message}`;
+  });
+  if (error.issues.length > 3) {
+    issues.push(`  ... and ${error.issues.length - 3} more issues`);
+  }
+  return issues.join('\n');
+}
+
 /** Read and parse the state file */
 export async function readState(projectPath?: string): Promise<OrchestrationState> {
   const statePath = getStatePath(projectPath);
@@ -29,10 +44,71 @@ export async function readState(projectPath?: string): Promise<OrchestrationStat
     if (err instanceof SyntaxError) {
       throw new StateError('State file contains invalid JSON');
     }
+    if (err instanceof z.ZodError) {
+      throw new StateError(
+        `State file schema validation failed:\n${formatZodError(err)}\n\nRun "specflow check --fix" to attempt auto-repair.`
+      );
+    }
     throw err;
   }
 }
 
+/**
+ * Result of reading raw state (for diagnostics)
+ */
+export interface RawStateResult {
+  success: boolean;
+  data?: Record<string, unknown>;
+  error?: string;
+  zodErrors?: z.ZodIssue[];
+}
+
+/**
+ * Read state file without validation (for diagnostics and repair)
+ * Returns parsed JSON data even if it fails Zod validation
+ */
+export async function readRawState(projectPath?: string): Promise<RawStateResult> {
+  const statePath = getStatePath(projectPath);
+
+  if (!pathExists(statePath)) {
+    return { success: false, error: 'State file not found' };
+  }
+
+  try {
+    const content = await readFile(statePath, 'utf-8');
+    const data = JSON.parse(content);
+
+    // Try to validate but capture errors instead of throwing
+    const result = OrchestrationStateSchema.safeParse(data);
+    if (result.success) {
+      return { success: true, data };
+    } else {
+      return {
+        success: false,
+        data, // Return the raw data anyway for repair
+        error: 'Schema validation failed',
+        zodErrors: result.error.issues,
+      };
+    }
+  } catch (err) {
+    if (err instanceof SyntaxError) {
+      return { success: false, error: 'Invalid JSON' };
+    }
+    return { success: false, error: String(err) };
+  }
+}
+
+/**
+ * Write raw data to state file (bypasses validation, use with caution)
+ * Used for auto-repair scenarios
+ */
+export async function writeRawState(data: Record<string, unknown>, projectPath?: string): Promise<void> {
+  const statePath = getStatePath(projectPath);
+  const dir = dirname(statePath);
+  await mkdir(dir, { recursive: true });
+  await atomicWriteFile(statePath, JSON.stringify(data, null, 2));
+}
+
 /**
  * Atomically write content to a file (write to temp, then rename).
  * This prevents partial writes from corrupting the file.
diff --git a/packages/cli/tests/commands/project/init.test.ts b/packages/cli/tests/commands/project/init.test.ts
new file mode 100644
index 0000000..f9dd25b
--- /dev/null
+++ b/packages/cli/tests/commands/project/init.test.ts
@@ -0,0 +1,126 @@
+import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
+import { mkdir, writeFile, rm } from 'node:fs/promises';
+import { join } from 'node:path';
+import { tmpdir } from 'node:os';
+import { randomUUID } from 'node:crypto';
+
+// Store original process.cwd
+const originalCwd = process.cwd;
+
+describe('project init command', () => {
+  let testDir: string;
+
+  beforeEach(async () => {
+    // Create a unique temp directory for each test
+    testDir = join(tmpdir(), `specflow-init-test-${randomUUID()}`);
+    await mkdir(testDir, { recursive: true });
+    // Change to test directory
+    process.cwd = () => testDir;
+  });
+
+  afterEach(async () => {
+    // Restore original cwd
+    process.cwd = originalCwd;
+    // Clean up test directory
+    try {
+      await rm(testDir, { recursive: true, force: true });
+    } catch {
+      // Ignore cleanup errors
+    }
+  });
+
+  describe('runProjectInit', () => {
+    it('should create all required directories and files', async () => {
+      // Dynamically import to get mocked cwd
+      const { runProjectInit } = await import('../../../src/commands/project/init.js');
+      const { pathExists } = await import('../../../src/lib/paths.js');
+
+      await runProjectInit({ name: 'test-project' });
+
+      // Verify .specflow/ structure
+      expect(pathExists(join(testDir, '.specflow'))).toBe(true);
+      expect(pathExists(join(testDir, '.specflow', 'orchestration-state.json'))).toBe(true);
+      expect(pathExists(join(testDir, '.specflow', 'manifest.json'))).toBe(true);
+      expect(pathExists(join(testDir, '.specflow', 'workflows'))).toBe(true);
+
+      // Verify .specify/ structure
+      expect(pathExists(join(testDir, '.specify'))).toBe(true);
+      expect(pathExists(join(testDir, '.specify', 'memory'))).toBe(true);
+      expect(pathExists(join(testDir, '.specify', 'templates'))).toBe(true);
+      expect(pathExists(join(testDir, '.specify', 'phases'))).toBe(true);
+      expect(pathExists(join(testDir, '.specify', 'archive'))).toBe(true);
+      expect(pathExists(join(testDir, '.specify', 'history'))).toBe(true);
+      expect(pathExists(join(testDir, '.specify', 'discovery'))).toBe(true);
+
+      // Verify core files
+      expect(pathExists(join(testDir, '.specify', 'history', 'HISTORY.md'))).toBe(true);
+      expect(pathExists(join(testDir, '.specify', 'memory', 'constitution.md'))).toBe(true);
+      expect(pathExists(join(testDir, 'ROADMAP.md'))).toBe(true);
+      expect(pathExists(join(testDir, 'BACKLOG.md'))).toBe(true);
+      expect(pathExists(join(testDir, 'specs'))).toBe(true);
+    });
+
+    it('should create valid state file', async () => {
+      const { runProjectInit } = await import('../../../src/commands/project/init.js');
+      const { readFile } = await import('node:fs/promises');
+
+      await runProjectInit({ name: 'my-project' });
+
+      const stateContent = await readFile(join(testDir, '.specflow', 'orchestration-state.json'), 'utf-8');
+      const state = JSON.parse(stateContent);
+
+      expect(state.schema_version).toBe('3.0');
+      expect(state.project.name).toBe('my-project');
+      expect(state.project.path).toBe(testDir);
+      expect(state.orchestration.phase.status).toBe('not_started');
+      expect(state.orchestration.step.current).toBe('design');
+      expect(state.orchestration.step.index).toBe(0);
+    });
+
+    it('should fail if already initialized without --force', async () => {
+      const { runProjectInit } = await import('../../../src/commands/project/init.js');
+
+      // First init should succeed
+      await runProjectInit({ name: 'test-project' });
+
+      // Second init should fail (check exit code was set)
+      const originalExitCode = process.exitCode;
+      await runProjectInit({ name: 'test-project' });
+      expect(process.exitCode).toBe(1);
+
+      // Reset
+      process.exitCode = originalExitCode;
+    });
+
+    it('should succeed with --force on existing project', async () => {
+      const { runProjectInit } = await import('../../../src/commands/project/init.js');
+      const { pathExists } = await import('../../../src/lib/paths.js');
+
+      // First init
+      await runProjectInit({ name: 'test-project' });
+
+      // Clear exit code
+      process.exitCode = undefined;
+
+      // Second init with force should succeed
+      await runProjectInit({ name: 'updated-project', force: true });
+
+      // Verify still valid
+      expect(pathExists(join(testDir, '.specflow', 'orchestration-state.json'))).toBe(true);
+    });
+
+    it('should use directory name as project name when not specified', async () => {
+      const { runProjectInit } = await import('../../../src/commands/project/init.js');
+      const { readFile } = await import('node:fs/promises');
+      const { basename } = await import('node:path');
+
+      await runProjectInit({});
+
+      const stateContent = await readFile(join(testDir, '.specflow', 'orchestration-state.json'), 'utf-8');
+      const state = JSON.parse(stateContent);
+
+      // Should use the test directory name
+      expect(state.project.name).toBe(basename(testDir));
+    });
+  });
+});
diff --git a/packages/dashboard/eslint.config.mjs b/packages/dashboard/eslint.config.mjs
index 05e726d..b74e188 100644
--- a/packages/dashboard/eslint.config.mjs
+++ b/packages/dashboard/eslint.config.mjs
@@ -13,6 +13,20 @@ const eslintConfig = defineConfig([
     "build/**",
     "next-env.d.ts",
   ]),
+  // T030: Prevent setInterval in hooks for data polling
+  // Use SSE/file watching instead of polling
+  {
+    files: ["src/hooks/**/*.ts", "src/hooks/**/*.tsx"],
+    rules: {
+      "no-restricted-globals": [
+        "warn",
+        {
+          name: "setInterval",
+          message: "Avoid setInterval in hooks for data polling. Use SSE events from useUnifiedData instead.",
+        },
+      ],
+    },
+  },
 ]);
 
 export default eslintConfig;
diff --git a/packages/dashboard/package.json b/packages/dashboard/package.json
index ae0a1ef..9fd8f01 100644
--- a/packages/dashboard/package.json
+++ b/packages/dashboard/package.json
@@ -30,6 +30,7 @@
     "remark-gfm": "^4.0.1",
     "sonner": "^1.7.0",
     "tailwind-merge": "^3.4.0",
+    "uuid": "^13.0.0",
     "zod": "^3.25.76",
     "zod-to-json-schema": "^3.25.1"
   },
@@ -38,6 +39,7 @@
     "@types/react": "^19",
     "@types/react-dom": "^19",
     "@types/react-syntax-highlighter": "^15.5.13",
+    "@types/uuid": "^11.0.0",
     "autoprefixer": "^10.4.23",
     "eslint": "^9",
     "eslint-config-next": "16.1.3",
diff --git a/packages/dashboard/src/app/api/events/route.ts b/packages/dashboard/src/app/api/events/route.ts
index 3a8679c..977cc1c 100644
--- a/packages/dashboard/src/app/api/events/route.ts
+++ b/packages/dashboard/src/app/api/events/route.ts
@@ -1,4 +1,4 @@
-import { initWatcher, addListener, getCurrentRegistry, getAllStates, getAllTasks, getAllWorkflows, getAllPhases, startHeartbeat } from '@/lib/watcher';
+import { initWatcher, addListener, getCurrentRegistry, getAllStates, getAllTasks, getAllWorkflows, getAllPhases, getAllSessions, startHeartbeat } from '@/lib/watcher';
 import type { SSEEvent } from '@specflow/shared';
 
 // Initialize watcher on first request
@@ -95,6 +95,18 @@ export async function GET(): Promise<Response> {
         });
       }
 
+      // Send current session content for active sessions
+      const sessions = await getAllSessions();
+      for (const { projectId, sessionId, content } of sessions) {
+        send({
+          type: 'session:message',
+          timestamp: new Date().toISOString(),
+          projectId,
+          sessionId,
+          data: content,
+        });
+      }
+
       // Add listener for future events
       const removeListener = addListener(send);
 
diff --git a/packages/dashboard/src/app/api/session/content/route.ts b/packages/dashboard/src/app/api/session/content/route.ts
index b43ff1d..da8e12f 100644
--- a/packages/dashboard/src/app/api/session/content/route.ts
+++ b/packages/dashboard/src/app/api/session/content/route.ts
@@ -105,6 +105,8 @@ export async function GET(request: Request) {
       sessionId,
       toolCalls,
       currentTodos: sessionData.currentTodos,
+      workflowOutput: sessionData.workflowOutput,
+      agentTasks: sessionData.agentTasks,
     });
   } catch (error) {
     const message = error instanceof Error ? error.message : 'Unknown error';
diff --git a/packages/dashboard/src/app/api/workflow/orchestrate/route.ts b/packages/dashboard/src/app/api/workflow/orchestrate/route.ts
index fb79a35..7f78d16 100644
--- a/packages/dashboard/src/app/api/workflow/orchestrate/route.ts
+++ b/packages/dashboard/src/app/api/workflow/orchestrate/route.ts
@@ -58,6 +58,10 @@ interface SpecflowStatus {
     tasksTotal?: number;
     tasksCompleted?: number;
   };
+  step?: {
+    current?: string;
+    status?: string;
+  };
   nextAction?: string;
 }
 
@@ -96,7 +100,9 @@ function needsDesign(status: SpecflowStatus | null): boolean {
 
 /**
  * Determine smart starting phase based on project state
- * Returns config overrides for skipDesign/skipAnalyze
+ * Returns config overrides for skipDesign/skipAnalyze/skipImplement/skipVerify
+ *
+ * Phase ordering: design → analyze → implement → verify → merge
  */
 function getSmartConfig(
   status: SpecflowStatus | null,
@@ -111,16 +117,57 @@ function getSmartConfig(
   const tasksCompleted = status.progress?.tasksCompleted ?? 0;
   const allTasksComplete = tasksTotal > 0 && tasksCompleted >= tasksTotal;
 
-  // Smart defaults based on actual state:
-  // - If design artifacts exist, skip design (unless user explicitly unchecked)
-  // - If all tasks complete, we'll start at implement but immediately transition to verify
-  const smartSkipDesign = config.skipDesign || (hasSpec && hasPlan && hasTasks);
-  const smartSkipAnalyze = config.skipAnalyze || smartSkipDesign;
+  // Check step.current to determine what phase we're at (state file may be stale)
+  const stepCurrent = status.step?.current;
+  const stepStatus = status.step?.status;
+
+  // Phase ordering for determining "past" phases
+  const phaseOrder = ['design', 'analyze', 'implement', 'verify', 'merge'];
+  const currentPhaseIndex = stepCurrent ? phaseOrder.indexOf(stepCurrent) : -1;
+
+  // Helper: is current phase at or past a given phase?
+  const isPastPhase = (phase: string) => {
+    const phaseIndex = phaseOrder.indexOf(phase);
+    return currentPhaseIndex >= 0 && currentPhaseIndex > phaseIndex;
+  };
+
+  // Helper: is current phase at a given phase and complete?
+  const isPhaseComplete = (phase: string) => {
+    return stepCurrent === phase && stepStatus === 'complete';
+  };
+
+  // Design is complete if:
+  // - Artifacts exist (spec, plan, tasks)
+  // - OR we're past design phase
+  const designComplete = (hasSpec && hasPlan && hasTasks) || isPastPhase('design');
+
+  // Analyze is complete if:
+  // - User explicitly skips it
+  // - OR we're past analyze phase (at implement, verify, or merge)
+  // - OR step.current is 'analyze' and status is 'complete'
+  // - OR all tasks are complete (implies we're past analyze - analyze happens before implement)
+  const analyzeComplete = config.skipAnalyze || isPastPhase('analyze') || isPhaseComplete('analyze') || allTasksComplete;
+
+  // Implement is complete if:
+  // - All tasks are complete
+  // - OR we're past implement phase (at verify or merge)
+  const implementComplete = allTasksComplete || isPastPhase('implement');
+
+  // Verify is complete if:
+  // - step.current is 'verify' and status is 'complete'
+  // - OR we're past verify phase (at merge)
+  // Note: verify completion also requires all tasks to be complete
+  const verifyComplete = (isPhaseComplete('verify') || isPastPhase('verify')) && allTasksComplete;
+
+  console.log(`[getSmartConfig] stepCurrent=${stepCurrent}, stepStatus=${stepStatus}, phaseIndex=${currentPhaseIndex}`);
+  console.log(`[getSmartConfig] designComplete=${designComplete}, analyzeComplete=${analyzeComplete}, implementComplete=${implementComplete}, verifyComplete=${verifyComplete}`);
 
   return {
     ...config,
-    skipDesign: smartSkipDesign,
-    skipAnalyze: smartSkipAnalyze,
+    skipDesign: config.skipDesign || designComplete,
+    skipAnalyze: config.skipAnalyze || analyzeComplete,
+    skipImplement: implementComplete,
+    skipVerify: verifyComplete,
   };
 }
 
diff --git a/packages/dashboard/src/app/api/workflow/orchestrate/status/route.ts b/packages/dashboard/src/app/api/workflow/orchestrate/status/route.ts
index c6538fd..041b68d 100644
--- a/packages/dashboard/src/app/api/workflow/orchestrate/status/route.ts
+++ b/packages/dashboard/src/app/api/workflow/orchestrate/status/route.ts
@@ -1,9 +1,11 @@
 import { NextResponse } from 'next/server';
+import { existsSync, readFileSync, writeFileSync } from 'fs';
+import { join } from 'path';
 import { execSync } from 'child_process';
 import { orchestrationService } from '@/lib/services/orchestration-service';
 import { parseBatchesFromProject } from '@/lib/services/batch-parser';
 import { workflowService } from '@/lib/services/workflow-service';
-import type { OrchestrationExecution } from '@specflow/shared';
+import type { OrchestrationExecution, OrchestrationPhase } from '@specflow/shared';
 
 // =============================================================================
 // Types
@@ -48,6 +50,34 @@ interface PreflightStatus {
 // Registry Lookup
 // =============================================================================
 
+/**
+ * Sync current phase to orchestration-state.json for UI consistency
+ */
+function syncPhaseToStateFile(projectPath: string, phase: OrchestrationPhase): void {
+  try {
+    let statePath = join(projectPath, '.specflow', 'orchestration-state.json');
+    if (!existsSync(statePath)) {
+      statePath = join(projectPath, '.specify', 'orchestration-state.json');
+    }
+    if (!existsSync(statePath)) return;
+
+    const content = readFileSync(statePath, 'utf-8');
+    const state = JSON.parse(content);
+
+    // Only update if phase differs (avoid unnecessary writes)
+    if (state.orchestration?.step?.current !== phase) {
+      state.orchestration = state.orchestration || {};
+      state.orchestration.step = state.orchestration.step || {};
+      state.orchestration.step.current = phase;
+      state.orchestration.step.status = 'in_progress';
+      state.last_updated = new Date().toISOString();
+      writeFileSync(statePath, JSON.stringify(state, null, 2));
+    }
+  } catch {
+    // Non-critical
+  }
+}
+
 function getProjectPath(projectId: string): string | null {
   const { existsSync, readFileSync } = require('fs');
   const { join } = require('path');
@@ -223,6 +253,9 @@ export async function GET(request: Request) {
       return NextResponse.json({ orchestration: null, workflow: null }, { status: 200 });
     }
 
+    // Sync current phase to state file (ensures UI consistency for project list)
+    syncPhaseToStateFile(projectPath, orchestration.currentPhase);
+
     // Look up the current workflow to get its sessionId
     let workflowInfo: { id: string; sessionId?: string; status?: string } | null = null;
     const currentWorkflowId = getCurrentWorkflowId(orchestration);
diff --git a/packages/dashboard/src/app/projects/[id]/page.tsx b/packages/dashboard/src/app/projects/[id]/page.tsx
index 02875f1..58e6f6e 100644
--- a/packages/dashboard/src/app/projects/[id]/page.tsx
+++ b/packages/dashboard/src/app/projects/[id]/page.tsx
@@ -15,12 +15,13 @@ import { FailedToast } from "@/components/input/failed-toast"
 import { DetachedBanner } from "@/components/input/detached-banner"
 import type { WorkflowStatus } from "@/components/design-system"
 import { useConnection } from "@/contexts/connection-context"
+import { useUnifiedData } from "@/contexts/unified-data-context"
 import { useProjects } from "@/hooks/use-projects"
-import { useWorkflowExecution } from "@/hooks/use-workflow-execution"
+import { useProjectData } from "@/hooks/use-project-data"
+import { useWorkflowActions } from "@/hooks/use-workflow-actions"
+import { useSessionContentExtended } from "@/hooks/use-session-content"
 import { AlertCircle } from "lucide-react"
 import { SessionViewerDrawer } from "@/components/projects/session-viewer-drawer"
-import { useSessionHistory } from "@/hooks/use-session-history"
-import { useSessionMessages } from "@/hooks/use-session-messages"
 import { usePhaseHistory } from "@/hooks/use-phase-history"
 import { usePhaseDetail } from "@/hooks/use-phase-detail"
 import { useGitChanges } from "@/hooks/use-git-changes"
@@ -74,7 +75,7 @@ export default function ProjectDetailPage() {
   const router = useRouter()
   const projectId = params.id as string
 
-  const { states, tasks, setSelectedProject } = useConnection()
+  const { setSelectedProject } = useConnection()
   const { projects, loading: projectsLoading } = useProjects()
   const [activeView, setActiveView] = useState<ViewType>('dashboard')
   const [historySelectedPhase, setHistorySelectedPhase] = useState<string | null>(null)
@@ -85,23 +86,55 @@ export default function ProjectDetailPage() {
   // Find project in list
   const project = projects.find((p) => p.id === projectId)
 
-  // Workflow execution state
+  // G4.7: Session questions from SSE (AskUserQuestion tool calls)
+  const { sessionQuestions, clearSessionQuestions } = useUnifiedData()
+
+  // Project data from SSE (real-time)
   const {
-    execution: workflowExecution,
-    start: startWorkflow,
-    cancel: cancelWorkflow,
-    submitAnswers,
-  } = useWorkflowExecution(projectId, { projectName: project?.name })
+    state,
+    tasks: projectTasks,
+    workflow,
+    currentExecution,
+    sessions: sessionHistory,
+    isLoading: projectDataLoading,
+  } = useProjectData(projectId)
+
+  // Workflow execution state (derived from SSE data)
+  const workflowExecution = currentExecution
+
+  // Workflow actions (mutations)
+  const {
+    start: startWorkflowAction,
+    cancel: cancelWorkflowAction,
+    submitAnswers: submitAnswersAction,
+    isSubmitting: isSubmittingWorkflow,
+  } = useWorkflowActions(projectId)
   const [isStartingWorkflow, setIsStartingWorkflow] = useState(false)
   const [isCancellingWorkflow, setIsCancellingWorkflow] = useState(false)
 
+  // Wrapper functions for workflow actions
+  const startWorkflow = useCallback(async (skill: string, options?: { resumeSessionId?: string }) => {
+    await startWorkflowAction(skill, options)
+  }, [startWorkflowAction])
+
+  const cancelWorkflow = useCallback(async () => {
+    await cancelWorkflowAction(workflowExecution?.executionId, workflowExecution?.sessionId)
+  }, [cancelWorkflowAction, workflowExecution])
+
+  const submitAnswers = useCallback(async (answers: Record<string, string>) => {
+    if (!workflowExecution?.executionId) throw new Error('No active workflow')
+    await submitAnswersAction(workflowExecution.executionId, answers)
+  }, [submitAnswersAction, workflowExecution])
+
   // Workflow skills for autocomplete
   const { skills: workflowSkills } = useWorkflowSkills()
 
   // Orchestration state (for pause functionality in session console)
   const {
     orchestration,
+    activeSessionId: orchestrationSessionId,  // Session ID from orchestration polling
     pause: pauseOrchestration,
+    resume: resumeOrchestration,
   } = useOrchestration({ projectId })
 
   // Check if there's an active orchestration that can be paused
@@ -118,7 +151,8 @@ export default function ProjectDetailPage() {
   const [currentQuestionIndex, setCurrentQuestionIndex] = useState(0)
 
   // Reset question tracking when workflow questions change (new question set)
-  const questionsKey = workflowExecution?.output?.questions?.map(q => q.question).join('|') ?? ''
+  // TODO: T010 - Questions will come via session:question SSE events
+  const questionsKey = ''
   useEffect(() => {
     setPartialAnswers({})
     setCurrentQuestionIndex(0)
@@ -131,13 +165,13 @@ export default function ProjectDetailPage() {
   // Track which session is selected in the Session console view (separate from drawer)
   const [selectedConsoleSession, setSelectedConsoleSession] = useState<WorkflowIndexEntry | null>(null)
 
-  // Session history for this project
-  const {
-    sessions: sessionHistory,
-    isLoading: sessionHistoryLoading,
-    error: sessionHistoryError,
-    refresh: refreshSessionHistory,
-  } = useSessionHistory(project?.path ?? null)
+  // Session history is now from useProjectData (SSE-pushed)
+  // No need for separate hook - sessionHistory comes from projectData above
+
+  // Refresh function no longer needed - SSE handles real-time updates
+  const refreshSessionHistory = useCallback(() => {
+    // No-op: SSE provides real-time updates
+  }, [])
 
   // Session messages for live console view
   // Include detached sessions - they may still be receiving writes
@@ -146,20 +180,31 @@ export default function ProjectDetailPage() {
     workflowExecution?.status === 'detached'
 
   // Determine which session to show in console: selected historical or current workflow
-  const consoleSessionId = selectedConsoleSession?.sessionId ?? workflowExecution?.sessionId ?? null
+  // Use orchestrationSessionId as fallback - it's populated by polling and available faster than SSE
+  const consoleSessionId = selectedConsoleSession?.sessionId ?? workflowExecution?.sessionId ?? orchestrationSessionId ?? null
+
+  // Debug: log consoleSessionId changes
+  useEffect(() => {
+    console.log(`[Page] consoleSessionId changed:`, {
+      consoleSessionId,
+      selectedSessionId: selectedConsoleSession?.sessionId,
+      workflowSessionId: workflowExecution?.sessionId,
+      orchestrationSessionId,
+    });
+  }, [consoleSessionId, selectedConsoleSession?.sessionId, workflowExecution?.sessionId, orchestrationSessionId]);
+
   const isConsoleSessionActive = selectedConsoleSession
     ? (selectedConsoleSession.status === 'running' || selectedConsoleSession.status === 'waiting_for_input' || selectedConsoleSession.status === 'detached')
     : isWorkflowActive
 
+  // Session content from SSE (no polling)
   const {
     messages: sessionMessages,
     isLoading: sessionMessagesLoading,
     currentTodos: sessionTodos,
-  } = useSessionMessages(
-    project?.path ?? null,
-    consoleSessionId,
-    isConsoleSessionActive
-  )
+    workflowOutput: sessionWorkflowOutput,
+    hasEnded: sessionHasEnded,
+  } = useSessionContentExtended(consoleSessionId, project?.path ?? null)
 
   // Phase history from ROADMAP.md (SSE for real-time updates)
   const {
@@ -184,12 +229,20 @@ export default function ProjectDetailPage() {
     focusPhase?.name
   )
 
-  // Git changes (touched files) - refresh when session messages change
+  // Git changes (touched files) - refresh when session messages, tasks, or state change
+  // Combine triggers: session messages, task count, and state timestamp
+  const gitRefreshTrigger = useMemo(() => {
+    const taskCount = projectTasks?.totalCount ?? 0
+    const completedCount = projectTasks?.completedCount ?? 0
+    const stateTimestamp = state?.orchestration?.phase?.number ?? ''
+    return `${sessionMessages.length}-${taskCount}-${completedCount}-${stateTimestamp}`
+  }, [sessionMessages.length, projectTasks, state])
+
   const {
     files: touchedFiles,
     totalAdditions,
     totalDeletions,
-  } = useGitChanges(project?.path ?? null, sessionMessages.length)
+  } = useGitChanges(project?.path ?? null, gitRefreshTrigger)
 
   // Set selected project for command palette context
   useEffect(() => {
@@ -199,11 +252,7 @@ export default function ProjectDetailPage() {
     return () => setSelectedProject(null)
   }, [project, setSelectedProject])
 
-  // Get orchestration state for this project
-  const state = states.get(projectId)
-
-  // Get tasks for this project
-  const projectTasks = tasks.get(projectId)
+  // state and projectTasks now come from useProjectData above
 
   // Derive project status for actions menu (must be before early returns)
   const projectStatus = useMemo(() => getProjectStatus(state), [state])
@@ -305,14 +354,26 @@ export default function ProjectDetailPage() {
   , [sessionMessages])
 
   // Derive effective workflow status - override to idle if session has ended
+  // Also consider the selected console session (user may have selected a waiting session from dropdown)
   const workflowStatus: WorkflowStatus = useMemo(() => {
+    // If user selected a specific session from dropdown, use that session's status
+    if (selectedConsoleSession) {
+      // Map the session status to WorkflowStatus
+      switch (selectedConsoleSession.status) {
+        case 'running': return 'running'
+        case 'waiting_for_input': return 'waiting'
+        case 'failed': return 'failed'
+        default: return 'idle'
+      }
+    }
+
     const polledStatus = getWorkflowStatus(workflowExecution)
     // If messages show session ended but polling still says running, trust the messages
     if (hasSessionEnded && (polledStatus === 'running' || polledStatus === 'waiting')) {
       return 'idle'
     }
     return polledStatus
-  }, [workflowExecution, hasSessionEnded])
+  }, [workflowExecution, hasSessionEnded, selectedConsoleSession])
 
   // Proactively update workflow metadata when session ends externally
   // This ensures the workflow index reflects reality even if user ends session via CLI
@@ -346,9 +407,40 @@ export default function ProjectDetailPage() {
 
   // Handle decision toast answer - supports multi-question flows
   // Defined before handleOmniBoxSubmit since it's called from there
+  // G4.7/G4.8: Questions come via session:question SSE events OR fallback sources
   const handleDecisionAnswer = useCallback(async (answer: string) => {
-    const questions = workflowExecution?.output?.questions
-    if (!questions?.length) return
+    // Get questions from SSE map first
+    const sseQuestions = consoleSessionId ? sessionQuestions.get(consoleSessionId) : undefined
+
+    // Fallback: compute questions from session messages (same logic as decisionQuestions memo)
+    let fallbackQuestions: Array<{ question: string; options: Array<{ label: string; description?: string }> }> = []
+    if (!sseQuestions?.length && sessionMessages.length > 0) {
+      for (let i = sessionMessages.length - 1; i >= 0; i--) {
+        const msg = sessionMessages[i]
+        if (msg.role === 'assistant' && msg.questions && msg.questions.length > 0) {
+          fallbackQuestions = msg.questions.map((q) => ({
+            question: q.question,
+            options: q.options.map((opt) => ({ label: opt.label, description: opt.description })),
+          }))
+          break
+        }
+      }
+    }
+    // Second fallback: StructuredOutput questions
+    if (!sseQuestions?.length && fallbackQuestions.length === 0 &&
+        sessionWorkflowOutput?.status === 'needs_input' && sessionWorkflowOutput.questions) {
+      fallbackQuestions = sessionWorkflowOutput.questions.map((q) => ({
+        question: q.question,
+        options: (q.options || []).map((opt) => ({ label: opt.label, description: opt.description })),
+      }))
+    }
+
+    const questions = sseQuestions?.length ? sseQuestions : fallbackQuestions
+
+    if (!questions?.length) {
+      console.warn('[handleDecisionAnswer] No questions available to answer')
+      return
+    }
 
     const totalQuestions = questions.length
 
@@ -361,28 +453,47 @@ export default function ProjectDetailPage() {
 
     if (answeredCount >= totalQuestions) {
       // All questions answered - submit all answers together
+      // For fallback questions (no active execution), resume the session with the answer
+      const sessionId = selectedConsoleSession?.sessionId ?? workflowExecution?.sessionId ?? consoleSessionId
+
       try {
+        // Try submitAnswers first (works for active workflow executions)
         await submitAnswers(newAnswers)
+        // G4.8: Clear questions from map after user answers
+        if (consoleSessionId) {
+          clearSessionQuestions(consoleSessionId)
+        }
         // Reset state after successful submission
         setPartialAnswers({})
         setCurrentQuestionIndex(0)
       } catch (error) {
         const errorMessage = error instanceof Error ? error.message : 'Unknown error'
-        // If execution tracking was lost, resume the session with the answers
-        if (errorMessage.includes('expired') || errorMessage.includes('not found')) {
-          const sessionId = workflowExecution?.sessionId
-          if (sessionId) {
+        // If execution tracking was lost OR this is a historical session, resume with the answer
+        const shouldFallbackToResume = errorMessage.includes('expired') ||
+          errorMessage.includes('not found') ||
+          errorMessage.includes('No active workflow')
+
+        if (sessionId && shouldFallbackToResume) {
+          console.log('[handleDecisionAnswer] Falling back to session resume with answer:', sessionId)
+          try {
             // Format answers for resumption prompt
             const answerSummary = Object.entries(newAnswers)
               .map(([idx, ans]) => `${idx}: ${ans}`)
               .join(', ')
             await startWorkflow(`My answers: ${answerSummary}`, { resumeSessionId: sessionId })
-          } else {
-            toastWorkflowError('Unable to resume session - session ID not found')
+          } catch (resumeError) {
+            const resumeErrorMessage = resumeError instanceof Error ? resumeError.message : 'Unknown error'
+            toastWorkflowError(`Failed to resume session: ${resumeErrorMessage}`)
           }
+        } else if (!sessionId && shouldFallbackToResume) {
+          toastWorkflowError('Unable to resume session - session ID not found')
         } else {
           toastWorkflowError(errorMessage)
         }
+        // G4.8: Clear questions on error too
+        if (consoleSessionId) {
+          clearSessionQuestions(consoleSessionId)
+        }
         // Reset state on error too
         setPartialAnswers({})
         setCurrentQuestionIndex(0)
@@ -391,12 +502,23 @@ export default function ProjectDetailPage() {
       // More questions to answer - advance to next question
       setCurrentQuestionIndex(currentQuestionIndex + 1)
     }
-  }, [workflowExecution, submitAnswers, startWorkflow, partialAnswers, currentQuestionIndex])
+  }, [consoleSessionId, sessionQuestions, clearSessionQuestions, workflowExecution, submitAnswers, startWorkflow, partialAnswers, currentQuestionIndex, sessionMessages, sessionWorkflowOutput, selectedConsoleSession])
 
   // Handle OmniBox submit
   const handleOmniBoxSubmit = useCallback(async (message: string) => {
-    // If waiting for input, use the same multi-question handler as DecisionToast
-    if (workflowStatus === 'waiting' && workflowExecution?.output?.questions?.length) {
+    // G6.11: If orchestration is paused, auto-resume when user sends a command
+    if (orchestration?.status === 'paused') {
+      try {
+        await resumeOrchestration()
+        console.log('[page] Auto-resumed orchestration on user input')
+      } catch (error) {
+        console.error('[page] Failed to auto-resume orchestration:', error)
+      }
+    }
+
+    // G4.7: If waiting for input and we have questions, use the decision handler
+    const hasQuestions = consoleSessionId && (sessionQuestions.get(consoleSessionId)?.length ?? 0) > 0
+    if (workflowStatus === 'waiting' && hasQuestions) {
       await handleDecisionAnswer(message)
       return
     }
@@ -468,7 +590,7 @@ export default function ProjectDetailPage() {
 
     // Start a new workflow (slash command)
     handleWorkflowStart(message)
-  }, [workflowStatus, workflowExecution, handleDecisionAnswer, startWorkflow, handleWorkflowStart, hasSessionEnded, cancelWorkflow, consoleSessionId, selectedConsoleSession, setActiveView])
+  }, [workflowStatus, workflowExecution, handleDecisionAnswer, startWorkflow, handleWorkflowStart, hasSessionEnded, cancelWorkflow, consoleSessionId, selectedConsoleSession, setActiveView, orchestration, resumeOrchestration])
 
   // Handle failed toast retry
   const handleRetry = useCallback(() => {
@@ -511,17 +633,72 @@ export default function ProjectDetailPage() {
     }
   }, [hasActiveOrchestration, pauseOrchestration, refreshSessionHistory])
 
-  // Build questions for decision toast
+  // G4.6/G4.7: Build questions for decision toast from SSE sessionQuestions
+  // Fall back to extracting questions from session messages if SSE questions not available
   const decisionQuestions = useMemo(() => {
-    if (!workflowExecution?.output?.questions) return []
-    return workflowExecution.output.questions.map((q) => ({
-      question: q.question,
-      options: q.options?.map((opt) => ({
-        label: opt.label,
-        description: opt.description,
-      })) ?? [],
-    }))
-  }, [workflowExecution?.output?.questions])
+    if (!consoleSessionId) return []
+
+    // First, try SSE questions (real-time)
+    const sseQuestions = sessionQuestions.get(consoleSessionId)
+    if (sseQuestions && sseQuestions.length > 0) {
+      return sseQuestions.map((q) => ({
+        question: q.question,
+        options: q.options.map((opt) => ({
+          label: opt.label,
+          description: opt.description,
+        })),
+      }))
+    }
+
+    // Fallback: Extract questions from session messages
+    // This handles the case where user navigates to a waiting session
+    // after the SSE event was already processed
+    if (sessionMessages.length > 0) {
+      // Find the last assistant message with questions
+      for (let i = sessionMessages.length - 1; i >= 0; i--) {
+        const msg = sessionMessages[i]
+        // Check for AskUserQuestion tool call questions
+        if (msg.role === 'assistant' && msg.questions && msg.questions.length > 0) {
+          return msg.questions.map((q) => ({
+            question: q.question,
+            options: q.options.map((opt) => ({
+              label: opt.label,
+              description: opt.description,
+            })),
+          }))
+        }
+      }
+    }
+
+    // Second fallback: Check sessionWorkflowOutput for StructuredOutput questions
+    // In CLI mode, Claude uses StructuredOutput with status: 'needs_input'
+    if (sessionWorkflowOutput?.status === 'needs_input' && sessionWorkflowOutput.questions) {
+      return sessionWorkflowOutput.questions.map((q) => ({
+        question: q.question,
+        options: (q.options || []).map((opt) => ({
+          label: opt.label,
+          description: opt.description,
+        })),
+      }))
+    }
+
+    return []
+  }, [consoleSessionId, sessionQuestions, sessionMessages, sessionWorkflowOutput])
+
+  // Show question loading state when status is waiting but questions haven't loaded yet
+  const isQuestionsLoading = workflowStatus === 'waiting' && decisionQuestions.length === 0 && sessionMessagesLoading
+
+  // Handle clicking the "Waiting" badge - navigate to session view to show questions
+  const handleStatusClick = useCallback(() => {
+    if (workflowStatus === 'waiting') {
+      // Ensure we're on the session view so the toast is visible
+      if (activeView !== 'session') {
+        setActiveView('session')
+      }
+      // Focus the OmniBox for easy response input
+      omniBoxRef.current?.focus()
+    }
+  }, [workflowStatus, activeView, setActiveView])
 
   // Loading state
   if (projectsLoading) {
@@ -618,9 +795,13 @@ export default function ProjectDetailPage() {
             onSelectSession={handleConsoleSessionSelect}
             onEndSession={handleEndSession}
             onPauseSession={handlePauseSession}
+            onResumeSession={resumeOrchestration}
             canPause={hasActiveOrchestration}
+            isPaused={orchestration?.status === 'paused'}
             projectId={projectId}
             currentTodos={sessionTodos}
+            workflowOutput={sessionWorkflowOutput}
+            sessionEnded={sessionHasEnded}
           />
         )
       case 'tasks':
@@ -689,6 +870,7 @@ export default function ProjectDetailPage() {
           ref={omniBoxRef}
           status={workflowStatus}
           onSubmit={handleOmniBoxSubmit}
+          onStatusClick={handleStatusClick}
           disabled={isStartingWorkflow}
           skills={workflowSkills.map(s => ({
             id: s.id,
@@ -699,21 +881,23 @@ export default function ProjectDetailPage() {
         />
       </div>
 
-      {/* Decision Toast - shown when waiting for input */}
-      {workflowStatus === 'waiting' && decisionQuestions.length > 0 && (
+      {/* Decision Toast - shown when waiting for input (or loading questions) */}
+      {workflowStatus === 'waiting' && (decisionQuestions.length > 0 || isQuestionsLoading) && (
         <DecisionToast
           questions={decisionQuestions}
           currentIndex={currentQuestionIndex}
           onAnswer={handleDecisionAnswer}
           onCustomAnswer={handleOmniBoxSubmit}
           onDismiss={handleDismiss}
+          isLoading={isQuestionsLoading}
         />
       )}
 
       {/* Failed Toast - shown when workflow failed (not detached) */}
+      {/* TODO: T010 - Error details will come via SSE events */}
       {workflowStatus === 'failed' && !isWorkflowDetached(workflowExecution) && (
         <FailedToast
-          error={workflowExecution?.error ?? 'An unexpected error occurred'}
+          error={'An unexpected error occurred'}
           onRetry={handleRetry}
           onDismiss={handleDismiss}
         />
diff --git a/packages/dashboard/src/components/input/decision-toast.tsx b/packages/dashboard/src/components/input/decision-toast.tsx
index a70a6b3..2bcd389 100644
--- a/packages/dashboard/src/components/input/decision-toast.tsx
+++ b/packages/dashboard/src/components/input/decision-toast.tsx
@@ -19,6 +19,8 @@ interface DecisionToastProps {
   onCustomAnswer?: (answer: string) => void
   /** Dismiss the question without answering */
   onDismiss?: () => void
+  /** Whether the questions are still loading */
+  isLoading?: boolean
   className?: string
 }
 
@@ -28,12 +30,49 @@ export function DecisionToast({
   onAnswer,
   onCustomAnswer,
   onDismiss,
+  isLoading = false,
   className,
 }: DecisionToastProps) {
   const [showCustomInput, setShowCustomInput] = useState(false)
   const [customValue, setCustomValue] = useState('')
 
   const currentQuestion = questions[currentIndex]
+
+  // Show loading state when waiting for questions
+  if (isLoading && !currentQuestion) {
+    return (
+      <div
+        className={cn(
+          'fixed bottom-24 left-1/2 -translate-x-1/2 w-full max-w-lg z-50 animate-slide-up',
+          className
+        )}
+      >
+        {/* Beam progress indicator */}
+        <div className="h-1 w-full rounded-t-lg bg-surface-300 overflow-hidden">
+          <div className="h-full w-1/3 bg-gradient-to-r from-transparent via-accent to-transparent animate-beam" />
+        </div>
+
+        {/* Toast content - loading state */}
+        <div className="glass rounded-b-lg p-4">
+          <div className="flex items-center gap-2 mb-3">
+            <HelpCircle className="w-5 h-5 text-warning animate-pulse" />
+            <span className="font-medium text-white">Loading question...</span>
+            {onDismiss && (
+              <button
+                onClick={onDismiss}
+                className="ml-auto p-1 rounded hover:bg-surface-300 text-surface-500 hover:text-white transition-colors"
+                title="Dismiss"
+              >
+                <X className="w-4 h-4" />
+              </button>
+            )}
+          </div>
+          <p className="text-sm text-zinc-400">Retrieving the question from the session...</p>
+        </div>
+      </div>
+    )
+  }
+
   if (!currentQuestion) return null
 
   const handleCustomSubmit = () => {
diff --git a/packages/dashboard/src/components/input/omni-box.tsx b/packages/dashboard/src/components/input/omni-box.tsx
index b1323e1..378d361 100644
--- a/packages/dashboard/src/components/input/omni-box.tsx
+++ b/packages/dashboard/src/components/input/omni-box.tsx
@@ -15,6 +15,7 @@ export interface SkillOption {
 interface OmniBoxProps {
   status?: WorkflowStatus
   onSubmit?: (message: string) => void
+  onStatusClick?: () => void
   disabled?: boolean
   className?: string
   skills?: SkillOption[]
@@ -56,7 +57,7 @@ const statusConfig = {
 }
 
 export const OmniBox = forwardRef<OmniBoxHandle, OmniBoxProps>(
-  ({ status = 'idle', onSubmit, disabled = false, className, skills = [] }, ref) => {
+  ({ status = 'idle', onSubmit, onStatusClick, disabled = false, className, skills = [] }, ref) => {
     const [value, setValue] = useState('')
     const [isFocused, setIsFocused] = useState(false)
     const [showAutocomplete, setShowAutocomplete] = useState(false)
@@ -164,18 +165,22 @@ export const OmniBox = forwardRef<OmniBoxHandle, OmniBoxProps>(
                 : 'border-surface-300 group-hover:border-surface-400'
             )}
           >
-            {/* State badge */}
-            <div
+            {/* State badge - clickable when waiting */}
+            <button
+              type="button"
+              onClick={status === 'waiting' && onStatusClick ? onStatusClick : undefined}
+              disabled={status !== 'waiting' || !onStatusClick}
               className={cn(
                 'flex items-center gap-2 px-3 py-1.5 rounded-lg transition-colors mr-2',
-                config.badgeClass
+                config.badgeClass,
+                status === 'waiting' && onStatusClick && 'cursor-pointer hover:opacity-80'
               )}
             >
               <span className={cn('w-2 h-2 rounded-full', config.dotClass)} />
               <span className={cn('text-xs font-medium', config.textClass)}>
                 {config.badge}
               </span>
-            </div>
+            </button>
 
             {/* Input */}
             <input
diff --git a/packages/dashboard/src/components/orchestration/decision-log-panel.tsx b/packages/dashboard/src/components/orchestration/decision-log-panel.tsx
index d7b416a..0f7201c 100644
--- a/packages/dashboard/src/components/orchestration/decision-log-panel.tsx
+++ b/packages/dashboard/src/components/orchestration/decision-log-panel.tsx
@@ -18,24 +18,49 @@ import type { DecisionLogEntry } from '@specflow/shared';
 export interface DecisionLogPanelProps {
   /** Decision log entries */
   entries: DecisionLogEntry[];
-  /** Maximum entries to show */
+  /** Maximum entries to show when expanded */
   maxEntries?: number;
   /** Initially collapsed */
   defaultCollapsed?: boolean;
+  /** Number of entries to show as preview when collapsed (0 to hide) */
+  previewCount?: number;
 }
 
 // =============================================================================
 // Helper Functions
 // =============================================================================
 
-function formatTimestamp(iso: string): string {
+/**
+ * Format timestamp as relative time (e.g., "2m ago", "1h ago")
+ */
+function formatRelativeTime(iso: string): string {
   try {
     const date = new Date(iso);
-    return date.toLocaleTimeString('en-US', {
-      hour: '2-digit',
-      minute: '2-digit',
-      second: '2-digit',
-      hour12: false,
+    const now = Date.now();
+    const diffMs = now - date.getTime();
+
+    // Handle future dates or invalid dates
+    if (diffMs < 0 || isNaN(diffMs)) {
+      return 'now';
+    }
+
+    const diffSeconds = Math.floor(diffMs / 1000);
+    const diffMinutes = Math.floor(diffSeconds / 60);
+    const diffHours = Math.floor(diffMinutes / 60);
+
+    if (diffSeconds < 60) {
+      return diffSeconds <= 5 ? 'now' : `${diffSeconds}s ago`;
+    }
+    if (diffMinutes < 60) {
+      return `${diffMinutes}m ago`;
+    }
+    if (diffHours < 24) {
+      return `${diffHours}h ago`;
+    }
+    // For older entries, show the date
+    return date.toLocaleDateString('en-US', {
+      month: 'short',
+      day: 'numeric',
     });
   } catch {
     return iso;
@@ -50,6 +75,7 @@ export function DecisionLogPanel({
   entries,
   maxEntries = 10,
   defaultCollapsed = true,
+  previewCount = 3,
 }: DecisionLogPanelProps) {
   const [isCollapsed, setIsCollapsed] = React.useState(defaultCollapsed);
 
@@ -59,10 +85,41 @@ export function DecisionLogPanel({
     [entries, maxEntries]
   );
 
+  // Preview entries shown when collapsed
+  const previewEntries = React.useMemo(
+    () => displayEntries.slice(0, previewCount),
+    [displayEntries, previewCount]
+  );
+
   if (entries.length === 0) {
     return null;
   }
 
+  // Render a single entry row
+  const renderEntry = (entry: DecisionLogEntry, index: number) => (
+    <div
+      key={`${entry.timestamp}-${index}`}
+      className="px-3 py-2 text-xs"
+    >
+      <div className="flex items-start gap-2">
+        <Clock className="h-3 w-3 text-neutral-400 mt-0.5 shrink-0" />
+        <div className="flex-1 min-w-0">
+          <div className="flex items-center gap-2">
+            <span className="text-neutral-400 font-mono">
+              {formatRelativeTime(entry.timestamp)}
+            </span>
+            <span className="font-medium text-neutral-700 dark:text-neutral-300 truncate">
+              {entry.decision}
+            </span>
+          </div>
+          <p className="text-neutral-500 dark:text-neutral-400 mt-0.5">
+            {entry.reason}
+          </p>
+        </div>
+      </div>
+    </div>
+  );
+
   return (
     <div className="border border-neutral-200 dark:border-neutral-700 rounded-lg overflow-hidden">
       {/* Header */}
@@ -86,32 +143,26 @@ export function DecisionLogPanel({
         </span>
       </button>
 
-      {/* Entries */}
+      {/* Preview entries (shown when collapsed) */}
+      {isCollapsed && previewCount > 0 && previewEntries.length > 0 && (
+        <div className="divide-y divide-neutral-100 dark:divide-neutral-800 bg-neutral-50/50 dark:bg-neutral-900/30">
+          {previewEntries.map(renderEntry)}
+          {entries.length > previewCount && (
+            <button
+              type="button"
+              onClick={() => setIsCollapsed(false)}
+              className="w-full px-3 py-1.5 text-xs text-neutral-500 hover:text-neutral-700 dark:hover:text-neutral-300 text-center hover:bg-neutral-100 dark:hover:bg-neutral-800 transition-colors"
+            >
+              Show {Math.min(entries.length, maxEntries) - previewCount} more...
+            </button>
+          )}
+        </div>
+      )}
+
+      {/* Full entries (shown when expanded) */}
       {!isCollapsed && (
         <div className="divide-y divide-neutral-100 dark:divide-neutral-800 max-h-48 overflow-y-auto">
-          {displayEntries.map((entry, index) => (
-            <div
-              key={`${entry.timestamp}-${index}`}
-              className="px-3 py-2 text-xs"
-            >
-              <div className="flex items-start gap-2">
-                <Clock className="h-3 w-3 text-neutral-400 mt-0.5 shrink-0" />
-                <div className="flex-1 min-w-0">
-                  <div className="flex items-center gap-2">
-                    <span className="text-neutral-400 font-mono">
-                      {formatTimestamp(entry.timestamp)}
-                    </span>
-                    <span className="font-medium text-neutral-700 dark:text-neutral-300 truncate">
-                      {entry.decision}
-                    </span>
-                  </div>
-                  <p className="text-neutral-500 dark:text-neutral-400 mt-0.5">
-                    {entry.reason}
-                  </p>
-                </div>
-              </div>
-            </div>
-          ))}
+          {displayEntries.map(renderEntry)}
           {entries.length > maxEntries && (
             <div className="px-3 py-2 text-xs text-neutral-400 text-center">
               Showing {maxEntries} of {entries.length} entries
diff --git a/packages/dashboard/src/components/orchestration/index.ts b/packages/dashboard/src/components/orchestration/index.ts
index ddf808f..afe97b3 100644
--- a/packages/dashboard/src/components/orchestration/index.ts
+++ b/packages/dashboard/src/components/orchestration/index.ts
@@ -8,7 +8,7 @@ export { StartOrchestrationModal, type BatchPlanInfo } from './start-orchestrati
 export { OrchestrationConfigForm } from './orchestration-config-form';
 export { PhaseProgressBar } from './phase-progress-bar';
 export { BatchProgress } from './batch-progress';
-export { DecisionLogPanel } from './decision-log-panel';
+export { DecisionLogPanel, DecisionLogPanel as DecisionLogViewer } from './decision-log-panel';
 export { OrchestrationProgress } from './orchestration-progress';
 export { OrchestrationControls } from './orchestration-controls';
 export { MergeReadyPanel } from './merge-ready-panel';
diff --git a/packages/dashboard/src/components/projects/empty-state.tsx b/packages/dashboard/src/components/projects/empty-state.tsx
index 22f5bce..de46c0d 100644
--- a/packages/dashboard/src/components/projects/empty-state.tsx
+++ b/packages/dashboard/src/components/projects/empty-state.tsx
@@ -8,7 +8,7 @@ export function EmptyState() {
         No projects registered
       </h3>
       <p className="mt-2 text-sm text-neutral-500 dark:text-neutral-400 max-w-sm">
-        Run <code className="px-1.5 py-0.5 bg-neutral-100 dark:bg-neutral-800 rounded text-xs font-mono">specflow state init</code> in a project directory to register it with SpecFlow.
+        Run <code className="px-1.5 py-0.5 bg-neutral-100 dark:bg-neutral-800 rounded text-xs font-mono">specflow init</code> in a project directory to register it with SpecFlow.
       </p>
     </div>
   )
diff --git a/packages/dashboard/src/components/projects/project-card.tsx b/packages/dashboard/src/components/projects/project-card.tsx
index 0749447..6671ecc 100644
--- a/packages/dashboard/src/components/projects/project-card.tsx
+++ b/packages/dashboard/src/components/projects/project-card.tsx
@@ -23,9 +23,8 @@ import type { WorkflowStatus } from '@/components/design-system/status-pill'
 import { StatusButton } from '@/components/projects/action-button'
 import { ActionsMenu } from '@/components/projects/actions-menu'
 import { cn } from '@/lib/utils'
-import type { OrchestrationState, TasksData } from '@specflow/shared'
+import type { OrchestrationState, TasksData, WorkflowIndexEntry } from '@specflow/shared'
 import type { ProjectStatus as ActionProjectStatus } from '@/lib/action-definitions'
-import type { WorkflowExecution } from '@/lib/services/workflow-service'
 import type { OrchestrationExecution } from '@specflow/shared'
 
 /**
@@ -53,8 +52,8 @@ interface ProjectCardProps {
   tasks?: TasksData | null
   isUnavailable?: boolean
   isDiscovered?: boolean
-  /** Active workflow execution for this project */
-  workflowExecution?: WorkflowExecution | null
+  /** Active workflow execution for this project (from SSE) */
+  workflowExecution?: WorkflowIndexEntry | null
   /** Active orchestration execution for this project */
   activeOrchestration?: OrchestrationExecution | null
   /** Callback to start a workflow */
@@ -84,14 +83,74 @@ function formatRelativeTime(isoString: string | null | undefined): string {
 }
 
 /**
- * Check if activity is recent (within last 15 minutes)
+ * Activity indicator state based on workflow/orchestration status
  */
-function isRecentActivity(isoString: string | null | undefined): boolean {
-  if (!isoString) return false
-  const date = new Date(isoString)
-  const now = new Date()
-  const diffMs = now.getTime() - date.getTime()
-  return diffMs < 15 * 60 * 1000 // 15 minutes
+type ActivityIndicator = 'running' | 'waiting' | 'merge' | 'error' | 'stale' | null
+
+/**
+ * Determine activity indicator based on workflow and orchestration state
+ */
+function getActivityIndicator(
+  workflowExecution: WorkflowIndexEntry | null | undefined,
+  activeOrchestration: OrchestrationExecution | null | undefined
+): ActivityIndicator {
+  const workflowStatus = workflowExecution?.status
+  const orchestrationStatus = activeOrchestration?.status
+
+  // Error state (workflow or orchestration failed)
+  if (workflowStatus === 'failed' || orchestrationStatus === 'failed') {
+    return 'error'
+  }
+
+  // Running state (actively executing)
+  if (workflowStatus === 'running' || orchestrationStatus === 'running') {
+    return 'running'
+  }
+
+  // Waiting for user input
+  if (
+    workflowStatus === 'waiting_for_input' ||
+    orchestrationStatus === 'paused' ||
+    orchestrationStatus === 'needs_attention'
+  ) {
+    return 'waiting'
+  }
+
+  // Ready to merge
+  if (orchestrationStatus === 'waiting_merge') {
+    return 'merge'
+  }
+
+  // Stale/detached (lost tracking)
+  if (workflowStatus === 'stale' || workflowStatus === 'detached') {
+    return 'stale'
+  }
+
+  // Idle (completed, cancelled, or no activity)
+  return null
+}
+
+/**
+ * Get activity indicator styles
+ */
+function getActivityIndicatorStyles(indicator: ActivityIndicator): {
+  className: string
+  animate: boolean
+} | null {
+  switch (indicator) {
+    case 'running':
+      return { className: 'bg-success', animate: true }
+    case 'waiting':
+      return { className: 'bg-amber-500', animate: false }
+    case 'merge':
+      return { className: 'bg-purple-500', animate: false }
+    case 'error':
+      return { className: 'bg-danger', animate: false }
+    case 'stale':
+      return { className: 'bg-zinc-500', animate: false }
+    default:
+      return null
+  }
 }
 
 /**
@@ -110,6 +169,35 @@ function getMostRecentTimestamp(...timestamps: (string | null | undefined)[]): s
   ).ts
 }
 
+/**
+ * Get step badge styling based on step name
+ * Steps: design → analyze → implement → verify → complete
+ */
+function getStepBadge(step: string | null | undefined): {
+  label: string
+  className: string
+} | null {
+  if (!step) return null
+
+  const normalizedStep = step.toLowerCase()
+
+  switch (normalizedStep) {
+    case 'design':
+      return { label: 'Design', className: 'bg-purple-500/15 text-purple-400' }
+    case 'analyze':
+      return { label: 'Analyze', className: 'bg-blue-500/15 text-blue-400' }
+    case 'implement':
+      return { label: 'Implement', className: 'bg-amber-500/15 text-amber-400' }
+    case 'verify':
+      return { label: 'Verify', className: 'bg-cyan-500/15 text-cyan-400' }
+    case 'complete':
+    case 'completed':
+      return { label: 'Complete', className: 'bg-success/15 text-success' }
+    default:
+      return { label: step, className: 'bg-zinc-500/15 text-zinc-400' }
+  }
+}
+
 /**
  * Check if phase is complete
  */
@@ -135,6 +223,12 @@ function getProjectStatus(state: OrchestrationState | null | undefined): Project
     return 'warning'
   }
 
+  // If there's active orchestration data, treat as ready even if health.status is "initializing"
+  // (health.status can be stale while orchestration is actively in progress)
+  if (state.orchestration?.phase?.number || state.orchestration?.step?.current) {
+    return 'ready'
+  }
+
   if (state.health?.status === 'initializing') {
     return 'initializing'
   }
@@ -199,7 +293,7 @@ function getStatusBadge(status: ProjectStatus): {
  * Map workflow execution status to StatusPill status
  */
 function getWorkflowPillStatus(
-  execution: WorkflowExecution | null | undefined
+  execution: WorkflowIndexEntry | null | undefined
 ): WorkflowStatus {
   if (!execution?.status) return 'idle'
   switch (execution.status) {
@@ -266,13 +360,25 @@ export function ProjectCard({
   nextPhase,
 }: ProjectCardProps) {
   const phase = state?.orchestration?.phase
-  const step = state?.orchestration?.step
   const health = state?.health
 
-  const lastUpdated = getMostRecentTimestamp(state?.last_updated, state?._fileMtime)
-  const isActive = isRecentActivity(lastUpdated)
+  // Current step: prefer live orchestration data over stale state file
+  const currentStep = activeOrchestration?.currentPhase ?? state?.orchestration?.step?.current
+
+  // Last updated: prioritize workflow activity, then tasks, then state file
+  const lastUpdated = getMostRecentTimestamp(
+    workflowExecution?.updatedAt,
+    workflowExecution?.startedAt,
+    tasks?.lastUpdated,
+    state?.last_updated,
+    state?._fileMtime
+  )
   const phaseComplete = isPhaseComplete(phase?.status)
 
+  // Activity indicator based on workflow/orchestration state
+  const activityIndicator = getActivityIndicator(workflowExecution, activeOrchestration)
+  const activityStyles = getActivityIndicatorStyles(activityIndicator)
+
   // Workflow status handling
   const workflowPillStatus = getWorkflowPillStatus(workflowExecution)
   const hasActiveWorkflow =
@@ -298,10 +404,11 @@ export function ProjectCard({
   const hasTasks = totalTasks > 0
   const allTasksComplete = hasTasks && completedTasks === totalTasks
 
-  // Ready to merge - phase is complete AND verify step is done
+  // Ready to merge - orchestration says so, or phase complete, or all tasks done in verify
   const isReadyToMerge =
+    activeOrchestration?.status === 'waiting_merge' ||
     phase?.status === 'complete' ||
-    (allTasksComplete && step?.status === 'complete' && step?.current === 'verify')
+    (allTasksComplete && currentStep === 'verify')
 
   // Branch name
   const branchName = phase?.branch ?? 'main'
@@ -335,8 +442,14 @@ export function ProjectCard({
               )}
             />
           </div>
-          {isActive && (
-            <span className="absolute -top-0.5 -right-0.5 h-2.5 w-2.5 rounded-full bg-success ring-2 ring-surface-100 animate-pulse" />
+          {activityStyles && (
+            <span
+              className={cn(
+                'absolute -top-0.5 -right-0.5 h-2.5 w-2.5 rounded-full ring-2 ring-surface-100',
+                activityStyles.className,
+                activityStyles.animate && 'animate-pulse'
+              )}
+            />
           )}
         </div>
 
@@ -354,11 +467,13 @@ export function ProjectCard({
               </span>
             )}
             {workflowPillStatus !== 'idle' && !hasActiveOrchestration && (
-              <StatusPill status={workflowPillStatus} size="sm" />
+              <span className="hidden sm:block">
+                <StatusPill status={workflowPillStatus} size="sm" />
+              </span>
             )}
             {orchestrationBadge && (
               <span className={cn(
-                'inline-flex items-center gap-1 px-1.5 py-0.5 text-[10px] font-medium rounded',
+                'hidden sm:inline-flex items-center gap-1 px-1.5 py-0.5 text-[10px] font-medium rounded',
                 orchestrationBadge.className
               )}>
                 <orchestrationBadge.icon className={cn(
@@ -391,9 +506,21 @@ export function ProjectCard({
                   >
                     {phase?.number || '—'}
                   </span>
-                  <span className="text-xs text-zinc-500 truncate">
+                  <span className="hidden sm:inline text-xs text-zinc-500 truncate">
                     {phase?.name?.replace(/-/g, ' ') || 'Unknown phase'}
                   </span>
+                  {/* Step indicator */}
+                  {!phaseComplete && !isReadyToMerge && currentStep && (() => {
+                    const stepBadge = getStepBadge(currentStep)
+                    return stepBadge ? (
+                      <span className={cn(
+                        'text-[10px] font-medium px-1.5 py-0.5 rounded uppercase tracking-wide',
+                        stepBadge.className
+                      )}>
+                        {stepBadge.label}
+                      </span>
+                    ) : null
+                  })()}
                   {phaseComplete && (
                     <CheckCircle2 className="h-3 w-3 text-success flex-shrink-0" />
                   )}
@@ -411,12 +538,12 @@ export function ProjectCard({
                     Ready
                   </span>
                   {nextPhase && (
-                    <>
+                    <span className="hidden sm:flex items-center gap-2">
                       <span className="text-zinc-600">→</span>
                       <span className="text-xs text-zinc-500 truncate">
                         {nextPhase.name.replace(/-/g, ' ')}
                       </span>
-                    </>
+                    </span>
                   )}
                 </>
               )
@@ -464,12 +591,14 @@ export function ProjectCard({
 
           {/* Actions */}
           <div className="flex items-center gap-1" onClick={(e) => e.preventDefault()}>
-            <StatusButton
-              projectId={project.id}
-              projectPath={project.path}
-              projectStatus={projectStatus as ActionProjectStatus}
-              isAvailable={!isUnavailable}
-            />
+            <span className="hidden sm:block">
+              <StatusButton
+                projectId={project.id}
+                projectPath={project.path}
+                projectStatus={projectStatus as ActionProjectStatus}
+                isAvailable={!isUnavailable}
+              />
+            </span>
             <ActionsMenu
               projectId={project.id}
               projectName={project.name}
@@ -483,7 +612,7 @@ export function ProjectCard({
             />
           </div>
 
-          <ChevronRight className="h-4 w-4 text-zinc-600 group-hover:text-zinc-400 transition-colors" />
+          <ChevronRight className="hidden sm:block h-4 w-4 text-zinc-600 group-hover:text-zinc-400 transition-colors" />
         </div>
       </div>
     </Link>
diff --git a/packages/dashboard/src/components/projects/project-detail-header.tsx b/packages/dashboard/src/components/projects/project-detail-header.tsx
index d108a4d..e2eedb0 100644
--- a/packages/dashboard/src/components/projects/project-detail-header.tsx
+++ b/packages/dashboard/src/components/projects/project-detail-header.tsx
@@ -18,7 +18,7 @@ import {
 } from "@/components/ui/dropdown-menu"
 import { useWorkflowSkills, type WorkflowSkill } from "@/hooks/use-workflow-skills"
 import type { ProjectStatus } from "@/lib/action-definitions"
-import type { WorkflowExecution } from "@/lib/services/workflow-service"
+import type { WorkflowIndexEntry } from "@specflow/shared"
 import {
   toastWorkflowStarted,
   toastWorkflowError,
@@ -36,8 +36,8 @@ interface ProjectDetailHeaderProps {
   projectStatus?: ProjectStatus
   schemaVersion?: string
   isAvailable?: boolean
-  /** Active workflow execution */
-  workflowExecution?: WorkflowExecution | null
+  /** Active workflow execution (from SSE) */
+  workflowExecution?: WorkflowIndexEntry | null
   /** Whether a workflow is starting */
   isStartingWorkflow?: boolean
   /** Callback to start a workflow */
@@ -76,7 +76,8 @@ export function ProjectDetailHeader({
   const hasActiveWorkflow = workflowStatus === 'running' || workflowStatus === 'waiting_for_input' || workflowStatus === 'detached'
 
   // Question badge for waiting workflows
-  const pendingQuestions = workflowExecution?.output?.questions ?? []
+  // TODO: T010 - Questions will come via session:question SSE events
+  const pendingQuestions: Array<{ question: string }> = [] // Temporarily empty
   const showQuestionBadge = workflowStatus === 'waiting_for_input' && pendingQuestions.length > 0
 
   // Session button visibility - show when there's an active workflow (even without session ID yet)
diff --git a/packages/dashboard/src/components/projects/project-list.tsx b/packages/dashboard/src/components/projects/project-list.tsx
index c41fb3b..0646995 100644
--- a/packages/dashboard/src/components/projects/project-list.tsx
+++ b/packages/dashboard/src/components/projects/project-list.tsx
@@ -3,7 +3,6 @@
 import { useMemo, useCallback } from 'react'
 import { useProjects } from '@/hooks/use-projects'
 import { useConnection } from '@/contexts/connection-context'
-import { useWorkflowList } from '@/hooks/use-workflow-list'
 import { useProjectPhases } from '@/hooks/use-project-phases'
 import { ProjectCard } from './project-card'
 import { EmptyState } from './empty-state'
@@ -44,14 +43,7 @@ function getMostRecentTimestamp(...timestamps: (string | null | undefined)[]): D
 
 export function ProjectList() {
   const { projects, loading, error, refetch } = useProjects()
-  const { states, tasks } = useConnection()
-
-  // Get project IDs for workflow list filtering
-  const projectIds = useMemo(() => projects.map((p) => p.id), [projects])
-
-  // Fetch active workflows for all projects (with polling)
-  const { executions: workflowExecutions, refresh: refreshWorkflows } =
-    useWorkflowList(projectIds)
+  const { states, tasks, workflows, refetch: refreshWorkflows } = useConnection()
 
   // Fetch phase info for all projects (next phase from roadmap)
   const { phases: projectPhases } = useProjectPhases(projects)
@@ -191,7 +183,7 @@ export function ProjectList() {
             tasks={tasks.get(project.id)}
             isUnavailable={project.isUnavailable}
             isDiscovered={project.isDiscovered}
-            workflowExecution={workflowExecutions.get(project.id)}
+            workflowExecution={workflows.get(project.id)?.currentExecution}
             onWorkflowStart={createWorkflowStartHandler(project.id)}
             nextPhase={phaseInfo?.nextPhase}
           />
diff --git a/packages/dashboard/src/components/projects/session-viewer-drawer.tsx b/packages/dashboard/src/components/projects/session-viewer-drawer.tsx
index 1d21edb..0f87697 100644
--- a/packages/dashboard/src/components/projects/session-viewer-drawer.tsx
+++ b/packages/dashboard/src/components/projects/session-viewer-drawer.tsx
@@ -20,7 +20,7 @@ import { ScrollArea } from '@/components/ui/scroll-area';
 import { Input } from '@/components/ui/input';
 import { Button } from '@/components/ui/button';
 import { cn } from '@/lib/utils';
-import { useSessionMessages } from '@/hooks/use-session-messages';
+import { useSessionContentExtended } from '@/hooks/use-session-content';
 import { SessionMessageDisplay } from '../session/session-message';
 import { SessionPendingState } from './session-pending-state';
 import { TodoPanel } from '../session/todo-panel';
@@ -122,15 +122,18 @@ export function SessionViewerDrawer({
   onResumeSession,
   isResuming = false,
 }: SessionViewerDrawerProps) {
+  // Session content from SSE (no polling)
   const {
     messages,
     filesModified,
     elapsed,
     isLoading,
-    error,
-    activeSessionId,
     currentTodos,
-  } = useSessionMessages(projectPath, sessionId, isActive && open);
+  } = useSessionContentExtended(sessionId, projectPath);
+
+  // SSE provides real-time data - no separate error/activeSessionId needed
+  const error = null;
+  const activeSessionId = sessionId;
 
   const scrollAreaRef = React.useRef<HTMLDivElement>(null);
   const [autoScroll, setAutoScroll] = React.useState(true);
@@ -226,7 +229,7 @@ export function SessionViewerDrawer({
             </div>
             <div className="flex items-center gap-1.5 text-xs text-neutral-400">
               <FileCode className="h-3.5 w-3.5" />
-              <span>{filesModified} file{filesModified !== 1 ? 's' : ''} modified</span>
+              <span>{filesModified.length} file{filesModified.length !== 1 ? 's' : ''} modified</span>
             </div>
             {isActive && (
               <div className="flex items-center gap-1.5 text-xs">
diff --git a/packages/dashboard/src/components/projects/status-view.tsx b/packages/dashboard/src/components/projects/status-view.tsx
index 1e9a226..7b07f7e 100644
--- a/packages/dashboard/src/components/projects/status-view.tsx
+++ b/packages/dashboard/src/components/projects/status-view.tsx
@@ -83,7 +83,7 @@ export function StatusView({
         </h3>
         <p className="text-sm text-neutral-500 dark:text-neutral-400 max-w-md">
           This project doesn&apos;t have an orchestration state file yet.
-          Run <code className="px-1 py-0.5 bg-neutral-100 dark:bg-neutral-800 rounded">specflow state init</code> in the project directory.
+          Run <code className="px-1 py-0.5 bg-neutral-100 dark:bg-neutral-800 rounded">specflow init</code> in the project directory.
         </p>
       </div>
     )
diff --git a/packages/dashboard/src/components/session/agent-task-chip.tsx b/packages/dashboard/src/components/session/agent-task-chip.tsx
new file mode 100644
index 0000000..db063b1
--- /dev/null
+++ b/packages/dashboard/src/components/session/agent-task-chip.tsx
@@ -0,0 +1,100 @@
+'use client'
+
+import { cn } from '@/lib/utils'
+import { Loader2, CheckCircle, Search, FileCode, Terminal, Bot } from 'lucide-react'
+import type { AgentTaskInfo } from '@/lib/session-parser'
+
+interface AgentTaskChipProps {
+  task: AgentTaskInfo
+  className?: string
+}
+
+/**
+ * Get icon for agent type
+ */
+function getAgentIcon(subagentType: string) {
+  switch (subagentType.toLowerCase()) {
+    case 'explore':
+      return Search
+    case 'plan':
+      return FileCode
+    case 'bash':
+      return Terminal
+    default:
+      return Bot
+  }
+}
+
+/**
+ * Get color class for agent type
+ */
+function getAgentColor(subagentType: string): string {
+  switch (subagentType.toLowerCase()) {
+    case 'explore':
+      return 'border-blue-500/30 bg-blue-500/10 text-blue-400'
+    case 'plan':
+      return 'border-purple-500/30 bg-purple-500/10 text-purple-400'
+    case 'bash':
+      return 'border-orange-500/30 bg-orange-500/10 text-orange-400'
+    default:
+      return 'border-zinc-500/30 bg-zinc-500/10 text-zinc-400'
+  }
+}
+
+export function AgentTaskChip({ task, className }: AgentTaskChipProps) {
+  const Icon = getAgentIcon(task.subagentType)
+  const colorClass = getAgentColor(task.subagentType)
+  const isRunning = task.status === 'running'
+
+  return (
+    <div
+      className={cn(
+        'inline-flex items-center gap-2 px-3 py-1.5 rounded-lg border text-sm',
+        colorClass,
+        className
+      )}
+    >
+      {isRunning ? (
+        <Loader2 className="w-3.5 h-3.5 animate-spin" />
+      ) : (
+        <CheckCircle className="w-3.5 h-3.5 text-green-400" />
+      )}
+      <Icon className="w-3.5 h-3.5" />
+      <span className="truncate max-w-[200px]">{task.description}</span>
+    </div>
+  )
+}
+
+interface AgentTaskGroupProps {
+  tasks: AgentTaskInfo[]
+  className?: string
+}
+
+export function AgentTaskGroup({ tasks, className }: AgentTaskGroupProps) {
+  if (!tasks || tasks.length === 0) return null
+
+  const runningCount = tasks.filter(t => t.status === 'running').length
+  const completedCount = tasks.filter(t => t.status === 'completed').length
+
+  return (
+    <div className={cn('space-y-2', className)}>
+      {runningCount > 0 && (
+        <div className="text-xs text-zinc-500 flex items-center gap-1.5">
+          <Loader2 className="w-3 h-3 animate-spin" />
+          <span>{runningCount} agent{runningCount > 1 ? 's' : ''} working...</span>
+        </div>
+      )}
+      <div className="flex flex-wrap gap-2">
+        {tasks.map((task) => (
+          <AgentTaskChip key={task.id} task={task} />
+        ))}
+      </div>
+      {completedCount > 0 && runningCount === 0 && (
+        <div className="text-xs text-green-500/70 flex items-center gap-1.5">
+          <CheckCircle className="w-3 h-3" />
+          <span>All {completedCount} agent{completedCount > 1 ? 's' : ''} completed</span>
+        </div>
+      )}
+    </div>
+  )
+}
diff --git a/packages/dashboard/src/components/session/session-controls.tsx b/packages/dashboard/src/components/session/session-controls.tsx
index d8b958d..e30872f 100644
--- a/packages/dashboard/src/components/session/session-controls.tsx
+++ b/packages/dashboard/src/components/session/session-controls.tsx
@@ -8,7 +8,7 @@
  */
 
 import * as React from 'react';
-import { Pause, XCircle, Loader2, AlertTriangle } from 'lucide-react';
+import { Pause, Play, XCircle, Loader2, AlertTriangle } from 'lucide-react';
 import { Button } from '@/components/ui/button';
 import {
   Dialog,
@@ -26,6 +26,8 @@ import {
 export interface SessionControlsProps {
   /** Callback for pause action */
   onPause?: () => void;
+  /** Callback for resume action */
+  onResume?: () => void;
   /** Callback for cancel action */
   onCancel?: () => void;
   /** Whether controls are disabled */
@@ -34,6 +36,8 @@ export interface SessionControlsProps {
   isLoading?: boolean;
   /** Whether pause is available (e.g., when part of orchestration) */
   showPause?: boolean;
+  /** Whether orchestration is currently paused */
+  isPaused?: boolean;
   /** Compact mode - shows smaller buttons */
   compact?: boolean;
 }
@@ -44,10 +48,12 @@ export interface SessionControlsProps {
 
 export function SessionControls({
   onPause,
+  onResume,
   onCancel,
   disabled = false,
   isLoading = false,
   showPause = false,
+  isPaused = false,
   compact = false,
 }: SessionControlsProps) {
   const [showCancelDialog, setShowCancelDialog] = React.useState(false);
@@ -63,21 +69,23 @@ export function SessionControls({
   return (
     <>
       <div className="flex items-center gap-2">
-        {/* Pause Button (optional) */}
-        {showPause && onPause && (
+        {/* Pause/Resume Button (optional) */}
+        {showPause && (isPaused ? onResume : onPause) && (
           <Button
             variant="outline"
             size={buttonSize}
-            onClick={onPause}
+            onClick={isPaused ? onResume : onPause}
             disabled={disabled || isLoading}
             className={compact ? 'gap-1.5 px-2 py-1 h-7 text-xs' : 'gap-2'}
           >
             {isLoading ? (
               <Loader2 className={`${iconSize} animate-spin`} />
+            ) : isPaused ? (
+              <Play className={iconSize} />
             ) : (
               <Pause className={iconSize} />
             )}
-            {!compact && 'Pause'}
+            {!compact && (isPaused ? 'Resume' : 'Pause')}
           </Button>
         )}
 
diff --git a/packages/dashboard/src/components/session/session-message.tsx b/packages/dashboard/src/components/session/session-message.tsx
index 528753c..25eccb8 100644
--- a/packages/dashboard/src/components/session/session-message.tsx
+++ b/packages/dashboard/src/components/session/session-message.tsx
@@ -2,11 +2,12 @@
 
 import { useState, useCallback } from 'react'
 import { cn } from '@/lib/utils'
-import type { SessionMessage, ToolCallInfo } from '@/lib/session-parser'
+import type { SessionMessage, ToolCallInfo, QuestionInfo, AgentTaskInfo } from '@/lib/session-parser'
 import { CommandChip } from './command-chip'
 import { FileChipGroup } from './file-chip'
 import { FileViewerModal } from './file-viewer-modal'
 import { MarkdownContent } from '@/components/ui/markdown-content'
+import { AgentTaskGroup } from './agent-task-chip'
 
 interface SessionMessageDisplayProps {
   message: SessionMessage
@@ -275,9 +276,42 @@ export function SessionMessageDisplay({
         </div>
 
         {/* Content - render as markdown */}
-        <div className="text-zinc-300 leading-relaxed">
-          <MarkdownContent content={message.content} className="prose-p:mb-2 prose-p:last:mb-0" />
-        </div>
+        {message.content && (
+          <div className="text-zinc-300 leading-relaxed">
+            <MarkdownContent content={message.content} className="prose-p:mb-2 prose-p:last:mb-0" />
+          </div>
+        )}
+
+        {/* Questions from AskUserQuestion tool */}
+        {message.questions && message.questions.length > 0 && (
+          <div className="mt-3 space-y-3">
+            {message.questions.map((q, qIdx) => (
+              <div key={qIdx} className="rounded-lg border border-accent/30 bg-accent/5 p-4">
+                {q.header && (
+                  <span className="inline-block px-2 py-0.5 mb-2 rounded text-[10px] uppercase tracking-wider bg-accent/20 text-accent">
+                    {q.header}
+                  </span>
+                )}
+                <p className="text-zinc-200 font-medium mb-3">{q.question}</p>
+                {q.options.length > 0 && (
+                  <div className="flex flex-wrap gap-2">
+                    {q.options.map((opt, optIdx) => (
+                      <div
+                        key={optIdx}
+                        className="px-3 py-2 rounded-lg border border-surface-300 bg-surface-200 text-sm"
+                      >
+                        <span className="text-zinc-200">{opt.label}</span>
+                        {opt.description && (
+                          <span className="text-zinc-500 ml-2">— {opt.description}</span>
+                        )}
+                      </div>
+                    ))}
+                  </div>
+                )}
+              </div>
+            ))}
+          </div>
+        )}
 
         {/* File chips for tool calls */}
         {fileChips.length > 0 && (
@@ -288,6 +322,13 @@ export function SessionMessageDisplay({
             />
           </div>
         )}
+
+        {/* Agent tasks (parallel agents) */}
+        {message.agentTasks && message.agentTasks.length > 0 && (
+          <div className="mt-3">
+            <AgentTaskGroup tasks={message.agentTasks} />
+          </div>
+        )}
       </div>
 
       {/* File viewer modal (only if not using external handler) */}
diff --git a/packages/dashboard/src/components/session/workflow-output-card.tsx b/packages/dashboard/src/components/session/workflow-output-card.tsx
new file mode 100644
index 0000000..5c598f2
--- /dev/null
+++ b/packages/dashboard/src/components/session/workflow-output-card.tsx
@@ -0,0 +1,146 @@
+'use client'
+
+import { cn } from '@/lib/utils'
+import { CheckCircle, XCircle, AlertCircle, HelpCircle, FileText } from 'lucide-react'
+import { MarkdownContent } from '@/components/ui/markdown-content'
+
+export interface WorkflowOutput {
+  status: 'completed' | 'error' | 'needs_input' | 'cancelled' | string
+  phase?: string
+  message?: string
+  artifacts?: Array<{ path: string; action: string }>
+  questions?: Array<{
+    question: string
+    header?: string
+    options?: Array<{ label: string; description?: string }>
+    multiSelect?: boolean
+  }>
+}
+
+interface WorkflowOutputCardProps {
+  output: WorkflowOutput
+  className?: string
+}
+
+const statusConfig = {
+  completed: {
+    icon: CheckCircle,
+    label: 'Completed',
+    bgClass: 'bg-success/10 border-success/30',
+    iconClass: 'text-success',
+    labelClass: 'text-success',
+  },
+  error: {
+    icon: XCircle,
+    label: 'Error',
+    bgClass: 'bg-error/10 border-error/30',
+    iconClass: 'text-error',
+    labelClass: 'text-error',
+  },
+  needs_input: {
+    icon: HelpCircle,
+    label: 'Input Needed',
+    bgClass: 'bg-warning/10 border-warning/30',
+    iconClass: 'text-warning',
+    labelClass: 'text-warning',
+  },
+  cancelled: {
+    icon: AlertCircle,
+    label: 'Cancelled',
+    bgClass: 'bg-zinc-500/10 border-zinc-500/30',
+    iconClass: 'text-zinc-400',
+    labelClass: 'text-zinc-400',
+  },
+}
+
+export function WorkflowOutputCard({ output, className }: WorkflowOutputCardProps) {
+  const config = statusConfig[output.status as keyof typeof statusConfig] || statusConfig.error
+  const StatusIcon = config.icon
+
+  return (
+    <div
+      className={cn(
+        'rounded-lg border p-4',
+        config.bgClass,
+        className
+      )}
+    >
+      {/* Header with status and phase */}
+      <div className="flex items-center gap-3 mb-3">
+        <StatusIcon className={cn('w-5 h-5', config.iconClass)} />
+        <span className={cn('font-semibold', config.labelClass)}>
+          {config.label}
+        </span>
+        {output.phase && (
+          <span className="px-2 py-0.5 rounded text-xs bg-surface-300 text-zinc-300 uppercase tracking-wider">
+            {output.phase}
+          </span>
+        )}
+      </div>
+
+      {/* Message */}
+      {output.message && (
+        <div className="text-zinc-300 text-sm leading-relaxed mb-3">
+          <MarkdownContent
+            content={output.message}
+            className="prose-p:mb-2 prose-p:last:mb-0 prose-pre:bg-surface-300 prose-pre:text-xs"
+          />
+        </div>
+      )}
+
+      {/* Artifacts */}
+      {output.artifacts && output.artifacts.length > 0 && (
+        <div className="mt-3 pt-3 border-t border-surface-300">
+          <div className="text-xs text-zinc-500 uppercase tracking-wider mb-2">Artifacts</div>
+          <div className="flex flex-wrap gap-2">
+            {output.artifacts.map((artifact, idx) => (
+              <div
+                key={idx}
+                className="inline-flex items-center gap-1.5 px-2 py-1 rounded bg-surface-300 text-xs"
+              >
+                <FileText className="w-3 h-3 text-zinc-500" />
+                <span className="text-zinc-300">{artifact.path.split('/').pop()}</span>
+                <span className={cn(
+                  'text-[10px] uppercase',
+                  artifact.action === 'created' ? 'text-success' :
+                  artifact.action === 'updated' ? 'text-accent' :
+                  'text-zinc-500'
+                )}>
+                  {artifact.action}
+                </span>
+              </div>
+            ))}
+          </div>
+        </div>
+      )}
+
+      {/* Questions (if needs_input) */}
+      {output.questions && output.questions.length > 0 && (
+        <div className="mt-3 pt-3 border-t border-surface-300 space-y-3">
+          {output.questions.map((q, qIdx) => (
+            <div key={qIdx} className="rounded-lg border border-accent/30 bg-accent/5 p-3">
+              {q.header && (
+                <span className="inline-block px-2 py-0.5 mb-2 rounded text-[10px] uppercase tracking-wider bg-accent/20 text-accent">
+                  {q.header}
+                </span>
+              )}
+              <p className="text-zinc-200 text-sm font-medium mb-2">{q.question}</p>
+              {q.options && q.options.length > 0 && (
+                <div className="flex flex-wrap gap-2">
+                  {q.options.map((opt, optIdx) => (
+                    <div
+                      key={optIdx}
+                      className="px-2 py-1 rounded border border-surface-400 bg-surface-300 text-xs"
+                    >
+                      <span className="text-zinc-200">{opt.label}</span>
+                    </div>
+                  ))}
+                </div>
+              )}
+            </div>
+          ))}
+        </div>
+      )}
+    </div>
+  )
+}
diff --git a/packages/dashboard/src/components/views/session-console.tsx b/packages/dashboard/src/components/views/session-console.tsx
index 5c57d09..9323718 100644
--- a/packages/dashboard/src/components/views/session-console.tsx
+++ b/packages/dashboard/src/components/views/session-console.tsx
@@ -9,6 +9,7 @@ import { TodoPanel } from '@/components/session/todo-panel'
 import type { TodoItem } from '@/lib/session-parser'
 import { Play, Terminal, LayoutDashboard, ChevronDown, Clock, CheckCircle, XCircle, Loader2, History } from 'lucide-react'
 import { SessionControls } from '@/components/session/session-controls'
+import { WorkflowOutputCard, type WorkflowOutput } from '@/components/session/workflow-output-card'
 import type { SessionMessage } from '@/lib/session-parser'
 import type { WorkflowStatus } from '@/components/design-system'
 import type { WorkflowIndexEntry } from '@/lib/services/workflow-service'
@@ -32,12 +33,20 @@ interface SessionConsoleProps {
   onEndSession?: (sessionId: string) => void
   /** Callback to pause an active session (when part of orchestration) */
   onPauseSession?: (sessionId: string) => void
+  /** Callback to resume a paused session */
+  onResumeSession?: () => void
   /** Whether pause is available (e.g., orchestration is active) */
   canPause?: boolean
+  /** Whether orchestration is currently paused */
+  isPaused?: boolean
   /** Project ID for session operations */
   projectId?: string
   /** Current todo items from session */
   currentTodos?: TodoItem[]
+  /** Workflow's final structured output (for completed sessions) */
+  workflowOutput?: WorkflowOutput | null
+  /** Whether the session has ended */
+  sessionEnded?: boolean
   className?: string
 }
 
@@ -95,9 +104,13 @@ export function SessionConsole({
   onSelectSession,
   onEndSession,
   onPauseSession,
+  onResumeSession,
   canPause = false,
+  isPaused = false,
   projectId,
   currentTodos = [],
+  workflowOutput,
+  sessionEnded = false,
   className,
 }: SessionConsoleProps) {
   const scrollRef = useRef<HTMLDivElement>(null)
@@ -135,8 +148,8 @@ export function SessionConsole({
   // Check if we have sessions to show in dropdown
   const hasHistory = sessionHistory.length > 0
 
-  // Check if session has ended (based on messages)
-  const hasSessionEnded = messages.some(m => m.isSessionEnd)
+  // Compute hasEnded from messages if not passed via prop
+  const hasEnded = sessionEnded || messages.some(m => m.isSessionEnd)
 
   // Empty state when idle AND no history selected
   if (workflowStatus === 'idle' && messages.length === 0 && !selectedSession) {
@@ -285,7 +298,7 @@ export function SessionConsole({
             {isDropdownOpen && (
               <div className="absolute top-full left-0 mt-1 w-72 bg-surface-100 border border-surface-300 rounded-md shadow-xl z-50 overflow-hidden">
                 {/* Current session option - only show if workflow is actually active */}
-                {currentSessionId && !hasSessionEnded && workflowStatus !== 'idle' && (
+                {currentSessionId && !hasEnded && workflowStatus !== 'idle' && (
                   <>
                     <button
                       onClick={() => {
@@ -320,7 +333,7 @@ export function SessionConsole({
                   {sessionHistory.map((session) => {
                     // Override status if this is the currently viewed session and it has ended
                     const isCurrentlyViewed = session.sessionId === currentViewSessionId
-                    const effectiveStatus = (isCurrentlyViewed && hasSessionEnded) ? 'completed' : session.status
+                    const effectiveStatus = (isCurrentlyViewed && hasEnded) ? 'completed' : session.status
 
                     return (
                       <button
@@ -358,7 +371,9 @@ export function SessionConsole({
               <SessionControls
                 onCancel={handleEndCurrentSession}
                 onPause={canPause && onPauseSession ? () => onPauseSession(currentViewSessionId) : undefined}
+                onResume={onResumeSession}
                 showPause={canPause && !!onPauseSession}
+                isPaused={isPaused}
                 compact={true}
               />
             )}
@@ -398,8 +413,13 @@ export function SessionConsole({
           return <SessionMessageDisplay key={index} message={message} />
         })}
 
+        {/* Workflow output card - shown when workflow produced structured output */}
+        {workflowOutput && (
+          <WorkflowOutputCard output={workflowOutput} className="mt-4" />
+        )}
+
         {/* Typing indicator when processing (hide if session has ended) */}
-        {isProcessing && !hasSessionEnded && <TypingIndicator />}
+        {isProcessing && !hasEnded && <TypingIndicator />}
       </div>
 
       {/* Todo panel at bottom */}
diff --git a/packages/dashboard/src/contexts/unified-data-context.tsx b/packages/dashboard/src/contexts/unified-data-context.tsx
index bf0d5a2..c1007d2 100644
--- a/packages/dashboard/src/contexts/unified-data-context.tsx
+++ b/packages/dashboard/src/contexts/unified-data-context.tsx
@@ -4,17 +4,14 @@
  * UNIFIED DATA CONTEXT - Single source of truth for all real-time data
  *
  * DATA SOURCES:
- * - SSE (pushed): registry, states, tasks, workflows, phases
+ * - SSE (pushed): registry, states, tasks, workflows, phases, sessionContent
  *   -> Triggered by file system changes via chokidar watcher
+ *   -> Session JSONL files in ~/.claude/projects/ are also file-watched
  *   -> See: lib/watcher.ts, hooks/use-sse.ts
  *
- * - Polling (pulled): sessionContent
- *   -> Session JSONL files live in ~/.claude/projects/ (external)
- *   -> See: lib/session-polling-manager.ts
- *
  * ADDING NEW DATA:
  * - File in project directory? -> Add to watcher.ts + SSE events
- * - External file/API? -> Add to session-polling-manager.ts
+ * - Session JSONL file? -> Already handled by watcher.ts session watching
  * - NEVER add independent polling hooks
  */
 
@@ -22,16 +19,9 @@ import {
   createContext,
   useContext,
   useState,
-  useEffect,
-  useCallback,
   type ReactNode,
 } from 'react';
 import { useSSE, type ConnectionStatus } from '@/hooks/use-sse';
-import {
-  sessionPollingManager,
-  type SessionContent,
-  type SessionUpdateEvent,
-} from '@/lib/session-polling-manager';
 import type {
   Registry,
   OrchestrationState,
@@ -39,7 +29,31 @@ import type {
   WorkflowData,
   PhasesData,
   Project,
+  SessionQuestion,
 } from '@specflow/shared';
+import type {
+  SessionMessage,
+  TodoItem,
+  WorkflowOutput,
+  AgentTaskInfo,
+} from '@/lib/session-parser';
+
+/**
+ * Session content structure (from JSONL parsing)
+ * Re-exported for convenience
+ */
+export type { SessionMessage, TodoItem, WorkflowOutput, AgentTaskInfo };
+
+export interface SessionContent {
+  messages: SessionMessage[];
+  filesModified: string[];
+  elapsedMs: number;
+  currentTodos: TodoItem[];
+  /** Final structured output from workflow completion (if any) */
+  workflowOutput?: WorkflowOutput;
+  /** Agent tasks (parallel agents) currently running or recently completed */
+  agentTasks?: AgentTaskInfo[];
+}
 
 /**
  * Unified data context value interface
@@ -53,17 +67,19 @@ interface UnifiedDataContextValue {
   phases: Map<string, PhasesData>;
   connectionStatus: ConnectionStatus;
 
-  // === Polled Data (Session content only) ===
+  // === Session Content (SSE-pushed from JSONL file watching) ===
   sessionContent: Map<string, SessionContent>;
 
+  // === Session Questions (G4.5: AskUserQuestion tool calls from SSE) ===
+  sessionQuestions: Map<string, SessionQuestion[]>;
+  clearSessionQuestions: (sessionId: string) => void;
+
   // === UI State ===
   selectedProject: Project | null;
   setSelectedProject: (project: Project | null) => void;
 
   // === Actions ===
   refetch: () => void;
-  subscribeToSession: (sessionId: string, projectPath: string) => void;
-  unsubscribeFromSession: (sessionId: string) => void;
 }
 
 const UnifiedDataContext = createContext<UnifiedDataContextValue | null>(null);
@@ -71,59 +87,16 @@ const UnifiedDataContext = createContext<UnifiedDataContextValue | null>(null);
 /**
  * Unified Data Provider
  *
- * Wraps SSE hook for file-watched data and integrates session polling manager.
+ * Wraps SSE hook for file-watched data including session JSONL content.
+ * No polling - all data is pushed via SSE from file watchers.
  */
 export function UnifiedDataProvider({ children }: { children: ReactNode }) {
-  // SSE data (file-watched: registry, states, tasks, workflows)
+  // SSE data (file-watched: registry, states, tasks, workflows, sessions)
   const sseData = useSSE();
 
   // UI state
   const [selectedProject, setSelectedProject] = useState<Project | null>(null);
 
-  // Session content (polled)
-  const [sessionContent, setSessionContent] = useState<Map<string, SessionContent>>(
-    new Map()
-  );
-
-  // Subscribe to session polling updates
-  useEffect(() => {
-    const unsubscribe = sessionPollingManager.addListener(
-      (event: SessionUpdateEvent) => {
-        setSessionContent(prev => {
-          const next = new Map(prev);
-          next.set(event.sessionId, event.content);
-          return next;
-        });
-      }
-    );
-
-    return () => {
-      unsubscribe();
-    };
-  }, []);
-
-  // Session subscription management
-  const subscribeToSession = useCallback(
-    (sessionId: string, projectPath: string) => {
-      sessionPollingManager.subscribe(sessionId, projectPath);
-
-      // Load cached content if available
-      const cached = sessionPollingManager.getCache(sessionId);
-      if (cached) {
-        setSessionContent(prev => {
-          const next = new Map(prev);
-          next.set(sessionId, cached);
-          return next;
-        });
-      }
-    },
-    []
-  );
-
-  const unsubscribeFromSession = useCallback((sessionId: string) => {
-    sessionPollingManager.unsubscribe(sessionId);
-  }, []);
-
   const value: UnifiedDataContextValue = {
     // SSE data
     registry: sseData.registry,
@@ -133,8 +106,12 @@ export function UnifiedDataProvider({ children }: { children: ReactNode }) {
     phases: sseData.phases,
     connectionStatus: sseData.connectionStatus,
 
-    // Polled data
-    sessionContent,
+    // Session content (from SSE - pushed by session:message events)
+    sessionContent: sseData.sessionContent,
+
+    // Session questions (G4.5: from SSE - pushed by session:question events)
+    sessionQuestions: sseData.sessionQuestions,
+    clearSessionQuestions: sseData.clearSessionQuestions,
 
     // UI state
     selectedProject,
@@ -142,8 +119,6 @@ export function UnifiedDataProvider({ children }: { children: ReactNode }) {
 
     // Actions
     refetch: sseData.refetch,
-    subscribeToSession,
-    unsubscribeFromSession,
   };
 
   return (
diff --git a/packages/dashboard/src/hooks/use-git-changes.ts b/packages/dashboard/src/hooks/use-git-changes.ts
index bcb82f6..fb0b3a7 100644
--- a/packages/dashboard/src/hooks/use-git-changes.ts
+++ b/packages/dashboard/src/hooks/use-git-changes.ts
@@ -29,10 +29,11 @@ const REFRESH_DEBOUNCE_MS = 2000;
  *
  * @param projectPath - Absolute path to the project
  * @param refreshTrigger - Optional value that triggers a refresh when changed (debounced)
+ *                         Can be a number, string, or any value - changes trigger refresh
  */
 export function useGitChanges(
   projectPath: string | null,
-  refreshTrigger?: number
+  refreshTrigger?: string | number
 ): UseGitChangesResult {
   const [files, setFiles] = useState<FileChange[]>([]);
   const [totalAdditions, setTotalAdditions] = useState(0);
diff --git a/packages/dashboard/src/hooks/use-orchestration.ts b/packages/dashboard/src/hooks/use-orchestration.ts
index facade8..d4ead29 100644
--- a/packages/dashboard/src/hooks/use-orchestration.ts
+++ b/packages/dashboard/src/hooks/use-orchestration.ts
@@ -3,7 +3,8 @@
 /**
  * useOrchestration Hook
  *
- * Manages orchestration state with polling for status updates.
+ * Manages orchestration state with event-driven updates.
+ * Uses SSE events (workflow, state changes) to trigger refreshes instead of polling.
  * Provides methods for starting, pausing, resuming, canceling orchestration.
  */
 
@@ -11,6 +12,7 @@ import { useState, useCallback, useEffect, useRef } from 'react';
 import type { OrchestrationExecution, OrchestrationConfig } from '@specflow/shared';
 import type { BatchPlanInfo } from '@/components/orchestration/start-orchestration-modal';
 import type { RecoveryOption } from '@/components/orchestration/recovery-panel';
+import { useUnifiedData } from '@/contexts/unified-data-context';
 
 // =============================================================================
 // Types
@@ -26,7 +28,7 @@ export interface WorkflowInfo {
 export interface UseOrchestrationOptions {
   /** Project ID */
   projectId: string;
-  /** Polling interval in ms (default: 3000) */
+  /** @deprecated No longer used - refreshes are now SSE-driven */
   pollingInterval?: number;
   /** Callback when orchestration status changes */
   onStatusChange?: (status: OrchestrationExecution['status']) => void;
@@ -75,19 +77,13 @@ export interface UseOrchestrationReturn {
   refresh: () => Promise<void>;
 }
 
-// =============================================================================
-// Constants
-// =============================================================================
-
-const DEFAULT_POLLING_INTERVAL = 3000;
-
 // =============================================================================
 // Hook Implementation
 // =============================================================================
 
 export function useOrchestration({
   projectId,
-  pollingInterval = DEFAULT_POLLING_INTERVAL,
+  // pollingInterval is deprecated - SSE-driven refresh
   onStatusChange,
   onComplete,
   onError,
@@ -104,7 +100,9 @@ export function useOrchestration({
   const [recoveryAction, setRecoveryAction] = useState<RecoveryOption | null>(null);
 
   const lastStatusRef = useRef<OrchestrationExecution['status'] | null>(null);
-  const pollingRef = useRef<NodeJS.Timeout | null>(null);
+
+  // SSE data for event-driven refresh (T028: replaces polling)
+  const { workflows, states } = useUnifiedData();
 
   // Use refs for callbacks to avoid recreating fetchStatus on every render
   const onStatusChangeRef = useRef(onStatusChange);
@@ -223,13 +221,46 @@ export function useOrchestration({
           onWorkflowStartRef.current(data.workflow);
         }
 
-        // Refresh to get full orchestration state (including spawned workflow)
+        // Initial refresh to get orchestration state
         await refresh();
+
+        // Poll for sessionId - it becomes available after CLI spawns and returns first output
+        // This can take 30+ seconds for complex workflows. Poll for up to 90 seconds.
+        // IMPORTANT: We await this to keep isLoading=true until session is found
+        const maxAttempts = 90;
+        const pollInterval = 1000;
+
+        for (let attempt = 0; attempt < maxAttempts; attempt++) {
+          await new Promise(resolve => setTimeout(resolve, pollInterval));
+
+          try {
+            const statusResponse = await fetch(
+              `/api/workflow/orchestrate/status?projectId=${encodeURIComponent(projectId)}`
+            );
+            if (statusResponse.ok) {
+              const statusData = await statusResponse.json();
+              if (statusData.workflow?.sessionId) {
+                setActiveSessionId(statusData.workflow.sessionId);
+                setOrchestration(statusData.orchestration);
+                setIsLoading(false);
+                return; // Found sessionId, stop polling
+              }
+              // Also update orchestration state during polling so UI shows progress
+              if (statusData.orchestration) {
+                setOrchestration(statusData.orchestration);
+              }
+            }
+          } catch {
+            // Continue polling on error
+          }
+        }
+
+        // Polling timed out without finding session - still set loading false
+        setIsLoading(false);
       } catch (err) {
         const message = err instanceof Error ? err.message : 'Unknown error';
         setError(message);
         onErrorRef.current?.(message);
-      } finally {
         setIsLoading(false);
       }
     },
@@ -368,24 +399,32 @@ export function useOrchestration({
     }
   }, [orchestration, projectId, refresh]);
 
-  // Setup polling when orchestration is active
+  // T028: Event-driven refresh via SSE instead of polling
+  // When workflow or state SSE events come in, refresh orchestration status
+  // This replaces the previous setInterval polling
+  const lastWorkflowRef = useRef<unknown>(null);
+  const lastStateRef = useRef<unknown>(null);
+
   useEffect(() => {
-    // Start polling
-    const shouldPoll =
-      orchestration &&
-      ['running', 'paused', 'waiting_merge', 'needs_attention'].includes(orchestration.status);
+    // Only react if orchestration is active
+    if (!orchestration) return;
+    if (!['running', 'paused', 'waiting_merge', 'needs_attention'].includes(orchestration.status)) return;
 
-    if (shouldPoll) {
-      pollingRef.current = setInterval(fetchStatus, pollingInterval);
-    }
+    // Check if workflow data changed
+    const currentWorkflow = workflows.get(projectId);
+    const workflowChanged = currentWorkflow !== lastWorkflowRef.current;
 
-    return () => {
-      if (pollingRef.current) {
-        clearInterval(pollingRef.current);
-        pollingRef.current = null;
-      }
-    };
-  }, [orchestration?.status, pollingInterval, fetchStatus]);
+    // Check if state data changed
+    const currentState = states.get(projectId);
+    const stateChanged = currentState !== lastStateRef.current;
+
+    // Refresh on either change
+    if (workflowChanged || stateChanged) {
+      lastWorkflowRef.current = currentWorkflow;
+      lastStateRef.current = currentState;
+      fetchStatus();
+    }
+  }, [orchestration, projectId, workflows, states, fetchStatus]);
 
   // Initial fetch on mount (only once)
   const hasFetchedRef = useRef(false);
diff --git a/packages/dashboard/src/hooks/use-session-content.ts b/packages/dashboard/src/hooks/use-session-content.ts
index 36bd97f..054f991 100644
--- a/packages/dashboard/src/hooks/use-session-content.ts
+++ b/packages/dashboard/src/hooks/use-session-content.ts
@@ -1,10 +1,10 @@
 "use client"
 
 /**
- * Hook for subscribing to session content.
+ * Hook for getting session content from unified context.
  *
- * Automatically subscribes to session polling when mounted with valid session,
- * and unsubscribes when unmounted or session changes.
+ * Session content is pushed via SSE from JSONL file watchers for ACTIVE sessions.
+ * For HISTORICAL sessions, we fall back to fetching via API.
  *
  * Usage:
  *   const content = useSessionContent(sessionId, projectPath);
@@ -14,42 +14,82 @@
  *   }
  */
 
-import { useEffect, useMemo } from 'react';
-import { useUnifiedData } from '@/contexts/unified-data-context';
-import type { SessionContent } from '@/lib/session-polling-manager';
+import { useMemo, useEffect, useState, useRef } from 'react';
+import { useUnifiedData, type SessionContent } from '@/contexts/unified-data-context';
 
 /**
- * Hook for auto-subscribing to session content
+ * Hook for getting session content from SSE or API fallback
  *
  * @param sessionId - Claude session ID (or null)
- * @param projectPath - Absolute path to the project (or null)
+ * @param projectPath - Absolute path to the project (used for API fallback)
  * @returns Session content or null if not available
  */
 export function useSessionContent(
   sessionId: string | null,
   projectPath: string | null
 ): SessionContent | null {
-  const { sessionContent, subscribeToSession, unsubscribeFromSession } =
-    useUnifiedData();
+  const { sessionContent } = useUnifiedData();
+  const [apiFallback, setApiFallback] = useState<SessionContent | null>(null);
+  const fetchedRef = useRef<string | null>(null);
 
-  // Subscribe/unsubscribe based on sessionId and projectPath
+  // Check if content is available from SSE
+  const sseContent = useMemo(() => {
+    if (!sessionId) return null;
+    const content = sessionContent.get(sessionId) ?? null;
+    // Debug: log when content is looked up
+    if (sessionId) {
+      console.log(`[useSessionContent] Looking up sessionId=${sessionId}, found=${!!content}, sessionContent.size=${sessionContent.size}`);
+    }
+    return content;
+  }, [sessionId, sessionContent]);
+
+  // Fallback: fetch from API for historical sessions
   useEffect(() => {
-    if (sessionId && projectPath) {
-      subscribeToSession(sessionId, projectPath);
+    // Don't fetch if we have SSE content
+    if (sseContent) {
+      setApiFallback(null);
+      return;
+    }
 
-      return () => {
-        unsubscribeFromSession(sessionId);
-      };
+    // Don't fetch without required params
+    if (!sessionId || !projectPath) {
+      setApiFallback(null);
+      return;
     }
-  }, [sessionId, projectPath, subscribeToSession, unsubscribeFromSession]);
 
-  // Return content from context
-  const content = useMemo(() => {
-    if (!sessionId) return null;
-    return sessionContent.get(sessionId) ?? null;
-  }, [sessionId, sessionContent]);
+    // Don't re-fetch the same session
+    if (fetchedRef.current === sessionId) {
+      return;
+    }
+
+    // Fetch historical session content
+    const fetchContent = async () => {
+      try {
+        fetchedRef.current = sessionId;
+        const response = await fetch(
+          `/api/session/content?projectPath=${encodeURIComponent(projectPath)}&sessionId=${encodeURIComponent(sessionId)}&tail=500`
+        );
+        if (response.ok) {
+          const data = await response.json();
+          setApiFallback({
+            messages: data.messages,
+            filesModified: data.filesModified ? Array(data.filesModified).fill('') : [],
+            elapsedMs: data.elapsed || 0,
+            currentTodos: data.currentTodos || [],
+            workflowOutput: data.workflowOutput,
+            agentTasks: data.agentTasks,
+          });
+        }
+      } catch (error) {
+        console.error('[useSessionContent] API fallback error:', error);
+      }
+    };
+
+    fetchContent();
+  }, [sessionId, projectPath, sseContent]);
 
-  return content;
+  // Return SSE content if available, otherwise API fallback
+  return sseContent ?? apiFallback;
 }
 
 /**
@@ -60,18 +100,18 @@ interface UseSessionContentExtendedResult {
   content: SessionContent | null;
   /** Messages from the session */
   messages: SessionContent['messages'];
-  /** Number of files modified */
-  filesModified: number;
+  /** Files modified in the session */
+  filesModified: string[];
   /** Elapsed time in milliseconds */
   elapsed: number;
   /** Current todo items */
   currentTodos: SessionContent['currentTodos'];
-  /** Tool calls from the session */
-  toolCalls: SessionContent['toolCalls'];
   /** Whether the session has ended */
   hasEnded: boolean;
   /** True if content is loading (first fetch) */
   isLoading: boolean;
+  /** Final structured output from workflow completion */
+  workflowOutput: SessionContent['workflowOutput'];
 }
 
 /**
@@ -87,12 +127,12 @@ export function useSessionContentExtended(
     () => ({
       content,
       messages: content?.messages ?? [],
-      filesModified: content?.filesModified ?? 0,
-      elapsed: content?.elapsed ?? 0,
-      currentTodos: content?.currentTodos,
-      toolCalls: content?.toolCalls,
-      hasEnded: content?.hasEnded ?? false,
+      filesModified: content?.filesModified ?? [],
+      elapsed: content?.elapsedMs ?? 0,
+      currentTodos: content?.currentTodos ?? [],
+      hasEnded: content?.messages.some(m => m.isSessionEnd) ?? false,
       isLoading: sessionId !== null && content === null,
+      workflowOutput: content?.workflowOutput,
     }),
     [content, sessionId]
   );
diff --git a/packages/dashboard/src/hooks/use-session-history.ts b/packages/dashboard/src/hooks/use-session-history.ts
deleted file mode 100644
index cf53d1d..0000000
--- a/packages/dashboard/src/hooks/use-session-history.ts
+++ /dev/null
@@ -1,144 +0,0 @@
-'use client';
-
-/**
- * @deprecated This hook will be removed in a future version.
- *
- * Migration guide:
- * - Session history is now pushed via SSE workflow events
- * - Use useProjectData() from '@/hooks/use-project-data' instead
- *
- * OLD:
- *   const { sessions } = useSessionHistory(projectPath);
- *
- * NEW:
- *   const { sessions } = useProjectData(projectId);
- *
- * The sessions array contains WorkflowIndexEntry[] with the same data,
- * but updates in real-time via SSE instead of polling.
- *
- * ---
- * Hook for fetching session history for a project.
- *
- * Features:
- * - Fetches session index from API
- * - Polls every 5 seconds when enabled
- * - Returns list of sessions with metadata
- * - Loading and error states
- */
-
-import { useState, useEffect, useCallback, useRef } from 'react';
-import type { WorkflowIndexEntry } from '@/lib/services/workflow-service';
-
-const POLL_INTERVAL_MS = 5000; // 5 seconds
-
-interface UseSessionHistoryResult {
-  /** List of sessions for the project */
-  sessions: WorkflowIndexEntry[];
-  /** True during initial fetch */
-  isLoading: boolean;
-  /** Error from last fetch attempt */
-  error: string | null;
-  /** Manually refresh session list */
-  refresh: () => Promise<void>;
-}
-
-/**
- * Fetch session history from API
- */
-async function fetchSessionHistory(
-  projectPath: string
-): Promise<WorkflowIndexEntry[]> {
-  const params = new URLSearchParams({ projectPath });
-  const res = await fetch(`/api/session/history?${params}`);
-  const data = await res.json();
-
-  if (!res.ok) {
-    throw new Error(data.error || `Failed to fetch history: ${res.status}`);
-  }
-
-  return data.sessions || [];
-}
-
-/**
- * Hook for managing session history
- *
- * @param projectPath - Absolute path to the project
- * @param enablePolling - Whether to poll for updates (default: true)
- */
-export function useSessionHistory(
-  projectPath: string | null,
-  enablePolling: boolean = true
-): UseSessionHistoryResult {
-  const [sessions, setSessions] = useState<WorkflowIndexEntry[]>([]);
-  const [isLoading, setIsLoading] = useState(false);
-  const [error, setError] = useState<string | null>(null);
-  const pollIntervalRef = useRef<NodeJS.Timeout | null>(null);
-  const hasLoadedRef = useRef(false);
-
-  const refresh = useCallback(async () => {
-    if (!projectPath) {
-      setSessions([]);
-      return;
-    }
-
-    // Only show loading on initial fetch
-    if (!hasLoadedRef.current) {
-      setIsLoading(true);
-    }
-    setError(null);
-
-    try {
-      const result = await fetchSessionHistory(projectPath);
-      setSessions(result);
-      hasLoadedRef.current = true;
-    } catch (e) {
-      const message = e instanceof Error ? e.message : 'Unknown error';
-      setError(message);
-    } finally {
-      setIsLoading(false);
-    }
-  }, [projectPath]);
-
-  // Clear polling
-  const stopPolling = useCallback(() => {
-    if (pollIntervalRef.current) {
-      clearInterval(pollIntervalRef.current);
-      pollIntervalRef.current = null;
-    }
-  }, []);
-
-  // Start polling
-  const startPolling = useCallback(() => {
-    stopPolling();
-    pollIntervalRef.current = setInterval(() => {
-      refresh();
-    }, POLL_INTERVAL_MS);
-  }, [refresh, stopPolling]);
-
-  // Fetch on mount and start polling
-  useEffect(() => {
-    if (!projectPath) {
-      setSessions([]);
-      hasLoadedRef.current = false;
-      stopPolling();
-      return;
-    }
-
-    refresh();
-
-    if (enablePolling) {
-      startPolling();
-    }
-
-    return () => {
-      stopPolling();
-    };
-  }, [projectPath, enablePolling, refresh, startPolling, stopPolling]);
-
-  return {
-    sessions,
-    isLoading,
-    error,
-    refresh,
-  };
-}
diff --git a/packages/dashboard/src/hooks/use-session-messages.ts b/packages/dashboard/src/hooks/use-session-messages.ts
deleted file mode 100644
index 87ebcc8..0000000
--- a/packages/dashboard/src/hooks/use-session-messages.ts
+++ /dev/null
@@ -1,315 +0,0 @@
-'use client';
-
-/**
- * @deprecated This hook will be replaced by useSessionContent.
- *
- * Migration guide:
- * - Use useSessionContent() from '@/hooks/use-session-content' instead
- * - Session polling is now centralized in session-polling-manager.ts
- *
- * OLD:
- *   const { messages, filesModified, currentTodos } = useSessionMessages(
- *     projectPath, sessionId, isActive
- *   );
- *
- * NEW:
- *   const content = useSessionContent(sessionId, projectPath);
- *   // content.messages, content.filesModified, content.currentTodos
- *
- * For extended data:
- *   import { useSessionContentExtended } from '@/hooks/use-session-content';
- *   const { messages, filesModified, currentTodos, isLoading } = useSessionContentExtended(
- *     sessionId, projectPath
- *   );
- *
- * ---
- * Hook for fetching and polling Claude session messages.
- *
- * Features:
- * - Fetches session content from API
- * - Polls every 3 seconds when session is active
- * - Auto-discovers active session when sessionId not provided
- * - Auto-stops polling on error or when session completes
- * - Returns messages, metrics, tool calls, todos, and loading/error states
- */
-
-import { useState, useEffect, useCallback, useRef } from 'react';
-import type { SessionMessage, ToolCallInfo, TodoItem } from '@/lib/session-parser';
-
-const POLL_INTERVAL_MS = 3000; // 3 seconds to match workflow polling
-const DEFAULT_TAIL_LIMIT = 100;
-
-export interface SessionContent {
-  messages: SessionMessage[];
-  filesModified: number;
-  elapsed: number;
-  sessionId: string;
-  toolCalls?: ToolCallInfo[];
-  currentTodos?: TodoItem[];
-}
-
-interface UseSessionMessagesResult {
-  /** Session messages (user and assistant only) */
-  messages: SessionMessage[];
-  /** Number of unique files modified during session */
-  filesModified: number;
-  /** Milliseconds since session start */
-  elapsed: number;
-  /** True during initial fetch */
-  isLoading: boolean;
-  /** True while polling is active */
-  isPolling: boolean;
-  /** Error from last fetch attempt */
-  error: string | null;
-  /** Discovered session ID (may differ from prop if auto-discovered) */
-  activeSessionId: string | null;
-  /** All tool calls extracted from the session */
-  toolCalls: ToolCallInfo[];
-  /** Current todo items from latest TodoWrite call */
-  currentTodos: TodoItem[];
-  /** Manually refresh session content */
-  refresh: () => Promise<void>;
-  /** Stop polling */
-  stopPolling: () => void;
-}
-
-/**
- * Find the most recently active session for a project
- */
-async function findActiveSession(
-  projectPath: string
-): Promise<string | null> {
-  const params = new URLSearchParams({ projectPath });
-  const res = await fetch(`/api/session/active?${params}`);
-
-  if (!res.ok) {
-    return null;
-  }
-
-  const data = await res.json();
-  return data.sessionId || null;
-}
-
-/**
- * Fetch session content from API
- */
-async function fetchSessionContent(
-  projectPath: string,
-  sessionId: string,
-  tail: number = DEFAULT_TAIL_LIMIT
-): Promise<SessionContent> {
-  const params = new URLSearchParams({
-    projectPath,
-    sessionId,
-    tail: String(tail),
-  });
-
-  const res = await fetch(`/api/session/content?${params}`);
-  const data = await res.json();
-
-  if (!res.ok) {
-    throw new Error(data.error || `Failed to fetch session: ${res.status}`);
-  }
-
-  return data as SessionContent;
-}
-
-/**
- * Hook for managing session message polling
- *
- * @param projectPath - Absolute path to the project
- * @param sessionId - Claude session ID (from workflow execution), or null to auto-discover
- * @param isActive - Whether to poll for updates (true when workflow is running)
- * @param tailLimit - Number of messages to fetch (default: 100)
- */
-export function useSessionMessages(
-  projectPath: string | null,
-  sessionId: string | null,
-  isActive: boolean,
-  tailLimit: number = DEFAULT_TAIL_LIMIT
-): UseSessionMessagesResult {
-  const [messages, setMessages] = useState<SessionMessage[]>([]);
-  const [filesModified, setFilesModified] = useState(0);
-  const [elapsed, setElapsed] = useState(0);
-  const [isLoading, setIsLoading] = useState(false);
-  const [error, setError] = useState<string | null>(null);
-  const [activeSessionId, setActiveSessionId] = useState<string | null>(null);
-  const [toolCalls, setToolCalls] = useState<ToolCallInfo[]>([]);
-  const [currentTodos, setCurrentTodos] = useState<TodoItem[]>([]);
-
-  const pollIntervalRef = useRef<NodeJS.Timeout | null>(null);
-  const isPollingRef = useRef(false);
-
-  // Clear polling interval
-  const stopPolling = useCallback(() => {
-    if (pollIntervalRef.current) {
-      clearInterval(pollIntervalRef.current);
-      pollIntervalRef.current = null;
-    }
-    isPollingRef.current = false;
-  }, []);
-
-  // Fetch session content (using discovered session if provided sessionId is null)
-  const refresh = useCallback(async () => {
-    if (!projectPath) {
-      return;
-    }
-
-    // Use provided sessionId or try to discover active session
-    let effectiveSessionId = sessionId || activeSessionId;
-
-    if (!effectiveSessionId && isActive) {
-      // Try to discover active session
-      effectiveSessionId = await findActiveSession(projectPath);
-      if (effectiveSessionId) {
-        setActiveSessionId(effectiveSessionId);
-      }
-    }
-
-    if (!effectiveSessionId) {
-      return;
-    }
-
-    try {
-      const content = await fetchSessionContent(projectPath, effectiveSessionId, tailLimit);
-      setMessages(content.messages);
-      setFilesModified(content.filesModified);
-      setElapsed(content.elapsed);
-      setActiveSessionId(content.sessionId);
-      setToolCalls(content.toolCalls ?? []);
-      setCurrentTodos(content.currentTodos ?? []);
-      setError(null);
-    } catch (e) {
-      const message = e instanceof Error ? e.message : 'Unknown error';
-      setError(message);
-      // Stop polling on error
-      stopPolling();
-    }
-  }, [projectPath, sessionId, activeSessionId, isActive, tailLimit, stopPolling]);
-
-  // Start polling
-  const startPolling = useCallback(() => {
-    if (isPollingRef.current) return;
-
-    isPollingRef.current = true;
-    pollIntervalRef.current = setInterval(() => {
-      refresh();
-    }, POLL_INTERVAL_MS);
-  }, [refresh]);
-
-  // Track if this is the very first load (no messages yet)
-  const hasLoadedRef = useRef(false);
-  // Track the last loaded session to detect session changes
-  const lastSessionIdRef = useRef<string | null>(null);
-
-  // Initial fetch and polling setup
-  useEffect(() => {
-    if (!projectPath) {
-      setMessages([]);
-      setFilesModified(0);
-      setElapsed(0);
-      setError(null);
-      setActiveSessionId(null);
-      setToolCalls([]);
-      setCurrentTodos([]);
-      hasLoadedRef.current = false;
-      lastSessionIdRef.current = null;
-      stopPolling();
-      return;
-    }
-
-    // Use provided sessionId or nothing yet (will discover on first poll)
-    const effectiveSessionId = sessionId;
-
-    // Reset loaded state if session changed
-    if (effectiveSessionId !== lastSessionIdRef.current) {
-      hasLoadedRef.current = false;
-      lastSessionIdRef.current = effectiveSessionId;
-    }
-
-    // Only show loading state on true initial load, not on refetch
-    // This prevents blank screen when polling callbacks change
-    if (!hasLoadedRef.current) {
-      setIsLoading(true);
-    }
-    setError(null);
-
-    const doInitialFetch = async () => {
-      let sid = effectiveSessionId;
-
-      // If no session ID and active, try to discover
-      if (!sid && isActive) {
-        sid = await findActiveSession(projectPath);
-        if (sid) {
-          setActiveSessionId(sid);
-        }
-      }
-
-      if (!sid) {
-        setIsLoading(false);
-        // Start polling to keep trying to discover
-        if (isActive) {
-          startPolling();
-        }
-        return;
-      }
-
-      try {
-        const content = await fetchSessionContent(projectPath, sid, tailLimit);
-        setMessages(content.messages);
-        setFilesModified(content.filesModified);
-        setElapsed(content.elapsed);
-        setActiveSessionId(content.sessionId);
-        setToolCalls(content.toolCalls ?? []);
-        setCurrentTodos(content.currentTodos ?? []);
-        setIsLoading(false);
-        hasLoadedRef.current = true;
-
-        // Start polling if active
-        if (isActive) {
-          startPolling();
-        }
-      } catch (e) {
-        const message = e instanceof Error ? e.message : 'Unknown error';
-        setError(message);
-        setIsLoading(false);
-      }
-    };
-
-    doInitialFetch();
-
-    return () => {
-      stopPolling();
-    };
-  }, [projectPath, sessionId, tailLimit, isActive, startPolling, stopPolling]);
-
-  // Handle isActive changes
-  useEffect(() => {
-    if (isActive && projectPath && !isPollingRef.current) {
-      startPolling();
-    } else if (!isActive) {
-      stopPolling();
-    }
-  }, [isActive, projectPath, startPolling, stopPolling]);
-
-  // Cleanup on unmount
-  useEffect(() => {
-    return () => {
-      stopPolling();
-    };
-  }, [stopPolling]);
-
-  return {
-    messages,
-    filesModified,
-    elapsed,
-    isLoading,
-    isPolling: isPollingRef.current,
-    error,
-    activeSessionId: sessionId || activeSessionId,
-    toolCalls,
-    currentTodos,
-    refresh,
-    stopPolling,
-  };
-}
diff --git a/packages/dashboard/src/hooks/use-sse.ts b/packages/dashboard/src/hooks/use-sse.ts
index eb6ab58..3ac4cc3 100644
--- a/packages/dashboard/src/hooks/use-sse.ts
+++ b/packages/dashboard/src/hooks/use-sse.ts
@@ -8,6 +8,8 @@ import type {
   TasksData,
   WorkflowData,
   PhasesData,
+  SessionContent,
+  SessionQuestion,
 } from '@specflow/shared';
 
 export type ConnectionStatus = 'connected' | 'connecting' | 'disconnected';
@@ -18,12 +20,17 @@ interface SSEState {
   tasks: Map<string, TasksData>;
   workflows: Map<string, WorkflowData>;
   phases: Map<string, PhasesData>;
+  sessionContent: Map<string, SessionContent>;
+  /** Questions from AskUserQuestion tool calls, keyed by sessionId (G4.2) */
+  sessionQuestions: Map<string, SessionQuestion[]>;
   connectionStatus: ConnectionStatus;
   error: Error | null;
 }
 
 interface SSEResult extends SSEState {
   refetch: () => void;
+  /** Clear questions for a session after they've been answered (G4.8) */
+  clearSessionQuestions: (sessionId: string) => void;
 }
 
 /**
@@ -35,6 +42,8 @@ export function useSSE(): SSEResult {
   const [tasks, setTasks] = useState<Map<string, TasksData>>(new Map());
   const [workflows, setWorkflows] = useState<Map<string, WorkflowData>>(new Map());
   const [phases, setPhases] = useState<Map<string, PhasesData>>(new Map());
+  const [sessionContent, setSessionContent] = useState<Map<string, SessionContent>>(new Map());
+  const [sessionQuestions, setSessionQuestions] = useState<Map<string, SessionQuestion[]>>(new Map());
   const [connectionStatus, setConnectionStatus] = useState<ConnectionStatus>('connecting');
   const [error, setError] = useState<Error | null>(null);
   const eventSourceRef = useRef<EventSource | null>(null);
@@ -109,6 +118,30 @@ export function useSSE(): SSEResult {
           case 'heartbeat':
             // Heartbeat received - connection is alive
             break;
+
+          case 'session:message':
+            // Session content update - store by sessionId
+            console.log(`[SSE] session:message received: sessionId=${data.sessionId}, messages=${data.data?.messages?.length ?? 0}`);
+            setSessionContent((prev) => {
+              const next = new Map(prev);
+              next.set(data.sessionId, data.data);
+              return next;
+            });
+            break;
+
+          case 'session:question':
+            // G4.3: Question detected - populate sessionQuestions map
+            setSessionQuestions((prev) => {
+              const next = new Map(prev);
+              // Replace questions for this session (new questions replace old)
+              next.set(data.sessionId, data.data.questions);
+              return next;
+            });
+            break;
+
+          case 'session:end':
+            // Session ended - keep content but could mark as complete
+            break;
         }
       } catch (e) {
         console.error('[SSE] Error parsing event:', e);
@@ -157,14 +190,26 @@ export function useSSE(): SSEResult {
     };
   }, [connect]);
 
+  // G4.8: Function to clear questions after user answers
+  const clearSessionQuestions = useCallback((sessionId: string) => {
+    setSessionQuestions((prev) => {
+      const next = new Map(prev);
+      next.delete(sessionId);
+      return next;
+    });
+  }, []);
+
   return {
     registry,
     states,
     tasks,
     workflows,
     phases,
+    sessionContent,
+    sessionQuestions,
     connectionStatus,
     error,
     refetch,
+    clearSessionQuestions,
   };
 }
diff --git a/packages/dashboard/src/hooks/use-workflow-execution.ts b/packages/dashboard/src/hooks/use-workflow-execution.ts
deleted file mode 100644
index adc78fe..0000000
--- a/packages/dashboard/src/hooks/use-workflow-execution.ts
+++ /dev/null
@@ -1,471 +0,0 @@
-'use client';
-
-/**
- * @deprecated This hook will be removed in a future version.
- *
- * Migration guide:
- * - For workflow data: use useProjectData() from '@/hooks/use-project-data'
- * - For actions: use useWorkflowActions() from '@/hooks/use-workflow-actions'
- *
- * The new architecture uses SSE-pushed workflow events instead of polling,
- * providing real-time updates with less overhead.
- *
- * OLD:
- *   const { execution, start, cancel, submitAnswers } = useWorkflowExecution(projectId);
- *
- * NEW:
- *   const { workflow, currentExecution, isWorkflowActive } = useProjectData(projectId);
- *   const { start, cancel, submitAnswers } = useWorkflowActions(projectId);
- *
- * ---
- * Hook for managing workflow execution state with polling
- *
- * Features:
- * - Fetches current workflow status for a project
- * - Polls every 3 seconds when workflow is active (running/waiting)
- * - Auto-stops polling on terminal states (completed, failed, cancelled)
- * - Provides start, cancel, refresh methods
- */
-
-import { useState, useEffect, useCallback, useRef } from 'react';
-import type { WorkflowExecution } from '@/lib/services/workflow-service';
-import {
-  requestNotificationPermission,
-  hasRequestedPermission,
-  showQuestionNotification,
-} from '@/lib/notifications';
-
-const POLL_INTERVAL_MS = 3000; // 3 seconds per PDR
-
-type WorkflowStatus = WorkflowExecution['status'];
-
-// Detached and stale are NOT terminal - the session may still be running
-const TERMINAL_STATES: WorkflowStatus[] = ['completed', 'failed', 'cancelled'];
-// Detached and stale count as potentially active - continue polling to see if session updates
-const ACTIVE_STATES: WorkflowStatus[] = ['running', 'waiting_for_input', 'detached', 'stale'];
-
-interface StartWorkflowOptions {
-  /** Optional session ID to resume an existing session */
-  resumeSessionId?: string;
-}
-
-interface UseWorkflowExecutionResult {
-  /** Current workflow execution, or null if none */
-  execution: WorkflowExecution | null;
-  /** True during initial load */
-  isLoading: boolean;
-  /** True if workflow is in 'running' state */
-  isRunning: boolean;
-  /** True if workflow is in 'waiting_for_input' state */
-  isWaiting: boolean;
-  /** True if workflow is in a terminal state */
-  isTerminal: boolean;
-  /** Error from last operation */
-  error: Error | null;
-  /** Start a new workflow with the given skill, optionally resuming an existing session */
-  start: (skill: string, options?: StartWorkflowOptions) => Promise<void>;
-  /** Cancel the current workflow */
-  cancel: () => Promise<void>;
-  /** Submit answers to resume a waiting workflow */
-  submitAnswers: (answers: Record<string, string>) => Promise<void>;
-  /** Manually refresh the execution status */
-  refresh: () => Promise<void>;
-}
-
-/**
- * Fetch the most recent active or recent workflow for a project
- */
-async function fetchWorkflowForProject(
-  projectId: string
-): Promise<WorkflowExecution | null> {
-  const res = await fetch(`/api/workflow/list?projectId=${encodeURIComponent(projectId)}`);
-  if (!res.ok) {
-    throw new Error(`Failed to fetch workflow list: ${res.status}`);
-  }
-  const data = await res.json();
-  const executions = data.executions as WorkflowExecution[];
-
-  // Return the most recent execution (already sorted by updatedAt desc)
-  // Prefer active workflows over completed ones
-  // Priority: waiting_for_input > running > other active states
-  // This ensures questions are shown even if multiple workflows exist
-  const waiting = executions.find((e) => e.status === 'waiting_for_input');
-  if (waiting) return waiting;
-
-  const active = executions.find((e) => ACTIVE_STATES.includes(e.status));
-  if (active) return active;
-
-  // Return most recent if within last 30 seconds (for fade effect)
-  const recent = executions[0];
-  if (recent) {
-    const updatedAt = new Date(recent.updatedAt).getTime();
-    const now = Date.now();
-    const thirtySecondsAgo = now - 30000;
-    if (updatedAt > thirtySecondsAgo) {
-      return recent;
-    }
-  }
-
-  return null;
-}
-
-/**
- * Fetch a specific workflow execution by ID
- */
-async function fetchWorkflowById(
-  id: string,
-  projectId: string
-): Promise<WorkflowExecution | null> {
-  const res = await fetch(
-    `/api/workflow/status?id=${encodeURIComponent(id)}&projectId=${encodeURIComponent(projectId)}`
-  );
-  if (!res.ok) {
-    if (res.status === 404) return null;
-    throw new Error(`Failed to fetch workflow: ${res.status}`);
-  }
-  const data = await res.json();
-  return data.execution as WorkflowExecution;
-}
-
-/**
- * Start a workflow for a project
- * @param resumeSessionId - Optional session ID to resume (uses --resume flag)
- */
-async function startWorkflow(
-  projectId: string,
-  skill: string,
-  resumeSessionId?: string
-): Promise<WorkflowExecution> {
-  const body: Record<string, string> = { projectId, skill };
-  if (resumeSessionId) {
-    body.resumeSessionId = resumeSessionId;
-  }
-  const res = await fetch('/api/workflow/start', {
-    method: 'POST',
-    headers: { 'Content-Type': 'application/json' },
-    body: JSON.stringify(body),
-  });
-  if (!res.ok) {
-    const data = await res.json().catch(() => ({}));
-    throw new Error(data.error || `Failed to start workflow: ${res.status}`);
-  }
-  const data = await res.json();
-  return data.execution as WorkflowExecution;
-}
-
-/**
- * Cancel a workflow
- * @param id - Execution ID (optional if sessionId and projectId provided)
- * @param sessionId - Session ID for fallback cancellation
- * @param projectId - Project ID for fallback cancellation
- */
-async function cancelWorkflow(
-  id?: string,
-  sessionId?: string,
-  projectId?: string
-): Promise<{ execution?: WorkflowExecution; cancelled?: boolean }> {
-  const params = new URLSearchParams();
-  if (id) params.set('id', id);
-  if (sessionId) params.set('sessionId', sessionId);
-  if (projectId) params.set('projectId', projectId);
-
-  const res = await fetch(`/api/workflow/cancel?${params}`, {
-    method: 'POST',
-  });
-  if (!res.ok) {
-    const data = await res.json().catch(() => ({}));
-    throw new Error(data.error || `Failed to cancel workflow: ${res.status}`);
-  }
-  return await res.json();
-}
-
-/**
- * Submit answers to a waiting workflow
- */
-async function answerWorkflow(
-  id: string,
-  answers: Record<string, string>
-): Promise<WorkflowExecution> {
-  const res = await fetch('/api/workflow/answer', {
-    method: 'POST',
-    headers: { 'Content-Type': 'application/json' },
-    body: JSON.stringify({ id, answers }),
-  });
-  if (!res.ok) {
-    const data = await res.json().catch(() => ({}));
-    throw new Error(data.error || `Failed to submit answers: ${res.status}`);
-  }
-  const data = await res.json();
-  return data.execution as WorkflowExecution;
-}
-
-interface UseWorkflowExecutionOptions {
-  /** Project name for notifications (optional) */
-  projectName?: string;
-}
-
-/**
- * Hook for managing workflow execution for a specific project
- */
-export function useWorkflowExecution(
-  projectId: string,
-  options?: UseWorkflowExecutionOptions
-): UseWorkflowExecutionResult {
-  const [execution, setExecution] = useState<WorkflowExecution | null>(null);
-  const [isLoading, setIsLoading] = useState(true);
-  const [error, setError] = useState<Error | null>(null);
-
-  // Track current execution ID for polling
-  const executionIdRef = useRef<string | null>(null);
-  const pollIntervalRef = useRef<NodeJS.Timeout | null>(null);
-  // Track previous status to detect transitions
-  const previousStatusRef = useRef<WorkflowStatus | null>(null);
-
-  // Derived state
-  const isRunning = execution?.status === 'running';
-  const isWaiting = execution?.status === 'waiting_for_input';
-  const isTerminal = execution ? TERMINAL_STATES.includes(execution.status) : false;
-
-  // Clear any existing polling interval
-  const clearPolling = useCallback(() => {
-    if (pollIntervalRef.current) {
-      clearInterval(pollIntervalRef.current);
-      pollIntervalRef.current = null;
-    }
-  }, []);
-
-  // Fetch current execution status
-  const refresh = useCallback(async () => {
-    try {
-      let exec: WorkflowExecution | null = null;
-
-      // If we have a known execution ID, fetch it directly
-      if (executionIdRef.current) {
-        exec = await fetchWorkflowById(executionIdRef.current, projectId);
-        if (exec) {
-          // Detect transition to waiting_for_input
-          const prevStatus = previousStatusRef.current;
-          if (
-            exec.status === 'waiting_for_input' &&
-            prevStatus !== 'waiting_for_input' &&
-            options?.projectName
-          ) {
-            showQuestionNotification(options.projectName);
-          }
-          previousStatusRef.current = exec.status;
-
-          setExecution(exec);
-          // Stop polling if terminal
-          if (TERMINAL_STATES.includes(exec.status)) {
-            clearPolling();
-          }
-          return;
-        }
-      }
-
-      // Otherwise fetch the most recent for the project
-      exec = await fetchWorkflowForProject(projectId);
-
-      // Detect transition to waiting_for_input
-      if (exec) {
-        const prevStatus = previousStatusRef.current;
-        if (
-          exec.status === 'waiting_for_input' &&
-          prevStatus !== 'waiting_for_input' &&
-          options?.projectName
-        ) {
-          showQuestionNotification(options.projectName);
-        }
-        previousStatusRef.current = exec.status;
-      }
-
-      setExecution(exec);
-      executionIdRef.current = exec?.id || null;
-
-      // Stop polling if terminal or no execution
-      if (!exec || TERMINAL_STATES.includes(exec.status)) {
-        clearPolling();
-      }
-
-      setError(null);
-    } catch (e) {
-      setError(e instanceof Error ? e : new Error('Unknown error'));
-    }
-  }, [projectId, clearPolling, options?.projectName]);
-
-  // Start polling for active workflows
-  const startPolling = useCallback(() => {
-    clearPolling();
-    pollIntervalRef.current = setInterval(() => {
-      refresh();
-    }, POLL_INTERVAL_MS);
-  }, [refresh, clearPolling]);
-
-  // Start a new workflow
-  const start = useCallback(
-    async (skill: string, options?: StartWorkflowOptions) => {
-      // Validate: check if there's already an active workflow
-      // Only running/waiting_for_input states block new workflows
-      // cancelled/completed/failed states allow restart
-      // detached state allows restart (dashboard lost track, user explicitly wants new workflow)
-      // Exception: when resuming a session, we allow starting even if active
-      // (the new workflow will link to the same session)
-      const blockingStates: WorkflowStatus[] = ['running', 'waiting_for_input'];
-      if (
-        execution &&
-        blockingStates.includes(execution.status) &&
-        !options?.resumeSessionId
-      ) {
-        const err = new Error('A workflow is already running on this project');
-        setError(err);
-        throw err;
-      }
-
-      // Request notification permission on first workflow start
-      if (!hasRequestedPermission()) {
-        await requestNotificationPermission();
-      }
-
-      try {
-        setError(null);
-        const exec = await startWorkflow(projectId, skill, options?.resumeSessionId);
-        setExecution(exec);
-        executionIdRef.current = exec.id;
-        // Start polling for updates
-        startPolling();
-      } catch (e) {
-        setError(e instanceof Error ? e : new Error('Unknown error'));
-        throw e;
-      }
-    },
-    [projectId, startPolling, execution]
-  );
-
-  // Cancel the current workflow
-  const cancel = useCallback(async () => {
-    // Get session ID before clearing state (needed for fallback cancel)
-    const sessionId = execution?.sessionId;
-
-    if (!executionIdRef.current && !sessionId) {
-      // No execution or session to cancel - just clear local state
-      setExecution(null);
-      clearPolling();
-      return;
-    }
-
-    try {
-      setError(null);
-      // Pass sessionId and projectId for fallback if execution tracking is lost
-      const result = await cancelWorkflow(
-        executionIdRef.current || undefined,
-        sessionId,
-        projectId
-      );
-      if (result.execution) {
-        setExecution(result.execution);
-      } else {
-        // Cancelled by session ID - clear local state
-        setExecution(null);
-        executionIdRef.current = null;
-      }
-      clearPolling();
-    } catch (e) {
-      const errorMessage = e instanceof Error ? e.message : 'Unknown error';
-      // If execution/session not found, it's already gone - just clear local state
-      if (errorMessage.includes('not found')) {
-        setExecution(null);
-        executionIdRef.current = null;
-        clearPolling();
-        setError(null);
-        return;
-      }
-      setError(e instanceof Error ? e : new Error('Unknown error'));
-      throw e;
-    }
-  }, [clearPolling, execution, projectId]);
-
-  // Submit answers
-  const submitAnswers = useCallback(
-    async (answers: Record<string, string>) => {
-      if (!executionIdRef.current) {
-        throw new Error('No workflow to answer');
-      }
-      try {
-        setError(null);
-        const exec = await answerWorkflow(executionIdRef.current, answers);
-        setExecution(exec);
-        // Resume polling
-        startPolling();
-      } catch (e) {
-        const errorMessage = e instanceof Error ? e.message : 'Unknown error';
-        // If execution not found, the workflow timed out or was cleaned up
-        // Clear the stale state so user can start fresh
-        if (errorMessage.includes('not found') || errorMessage.includes('Execution not found')) {
-          setExecution(null);
-          executionIdRef.current = null;
-          clearPolling();
-          setError(new Error('Workflow session expired. Please start a new workflow.'));
-        } else {
-          setError(e instanceof Error ? e : new Error('Unknown error'));
-        }
-        throw e;
-      }
-    },
-    [startPolling, clearPolling]
-  );
-
-  // Initial fetch on mount
-  useEffect(() => {
-    let mounted = true;
-
-    const init = async () => {
-      setIsLoading(true);
-      try {
-        const exec = await fetchWorkflowForProject(projectId);
-        if (!mounted) return;
-
-        setExecution(exec);
-        executionIdRef.current = exec?.id || null;
-
-        // Start polling if there's an active workflow
-        if (exec && ACTIVE_STATES.includes(exec.status)) {
-          startPolling();
-        }
-      } catch (e) {
-        if (!mounted) return;
-        setError(e instanceof Error ? e : new Error('Unknown error'));
-      } finally {
-        if (mounted) {
-          setIsLoading(false);
-        }
-      }
-    };
-
-    init();
-
-    return () => {
-      mounted = false;
-      clearPolling();
-    };
-  }, [projectId, startPolling, clearPolling]);
-
-  // Clean up polling on unmount
-  useEffect(() => {
-    return () => {
-      clearPolling();
-    };
-  }, [clearPolling]);
-
-  return {
-    execution,
-    isLoading,
-    isRunning,
-    isWaiting,
-    isTerminal,
-    error,
-    start,
-    cancel,
-    submitAnswers,
-    refresh,
-  };
-}
diff --git a/packages/dashboard/src/hooks/use-workflow-list.ts b/packages/dashboard/src/hooks/use-workflow-list.ts
deleted file mode 100644
index 288e963..0000000
--- a/packages/dashboard/src/hooks/use-workflow-list.ts
+++ /dev/null
@@ -1,179 +0,0 @@
-'use client';
-
-/**
- * @deprecated This hook will be removed in a future version.
- *
- * Migration guide:
- * - Workflow data is now pushed via SSE events to the unified context
- * - Use useUnifiedData() from '@/contexts/unified-data-context' to access workflows
- *
- * OLD:
- *   const { executions } = useWorkflowList();
- *   const execution = executions.get(projectId);
- *
- * NEW:
- *   const { workflows } = useUnifiedData();
- *   const workflowData = workflows.get(projectId);
- *   const currentExecution = workflowData?.currentExecution;
- *
- * ---
- * Hook for fetching active workflow executions across all projects
- *
- * Used by ProjectList to display workflow status badges on project cards.
- * Polls every 3 seconds when there are active workflows.
- */
-
-import { useState, useEffect, useCallback, useRef } from 'react';
-import type { WorkflowExecution } from '@/lib/services/workflow-service';
-
-const POLL_INTERVAL_MS = 3000; // 3 seconds per PDR
-
-interface UseWorkflowListResult {
-  /** Map of projectId to their most recent workflow execution */
-  executions: Map<string, WorkflowExecution>;
-  /** True during initial load */
-  isLoading: boolean;
-  /** Error from last fetch */
-  error: Error | null;
-  /** Manually refresh all executions */
-  refresh: () => Promise<void>;
-}
-
-/**
- * Fetch all active workflows (running or waiting_for_input)
- */
-async function fetchActiveWorkflows(): Promise<WorkflowExecution[]> {
-  const res = await fetch('/api/workflow/list');
-  if (!res.ok) {
-    throw new Error(`Failed to fetch workflows: ${res.status}`);
-  }
-  const data = await res.json();
-  return data.executions as WorkflowExecution[];
-}
-
-/**
- * Hook for managing workflow executions across all projects
- *
- * Features:
- * - Fetches all workflows on mount
- * - Polls every 3 seconds when there are active workflows
- * - Stops polling when no active workflows
- * - Returns map keyed by projectId for easy lookup
- */
-export function useWorkflowList(projectIds?: string[]): UseWorkflowListResult {
-  const [executions, setExecutions] = useState<Map<string, WorkflowExecution>>(
-    new Map()
-  );
-  const [isLoading, setIsLoading] = useState(true);
-  const [error, setError] = useState<Error | null>(null);
-
-  const pollIntervalRef = useRef<NodeJS.Timeout | null>(null);
-
-  // Check if any executions are active (require polling)
-  // Include 'detached' - the session may still be running even if we lost track
-  const hasActiveWorkflows = Array.from(executions.values()).some(
-    (e) => e.status === 'running' || e.status === 'waiting_for_input' || e.status === 'detached'
-  );
-
-  // Clear any existing polling interval
-  const clearPolling = useCallback(() => {
-    if (pollIntervalRef.current) {
-      clearInterval(pollIntervalRef.current);
-      pollIntervalRef.current = null;
-    }
-  }, []);
-
-  // Fetch and update executions
-  const refresh = useCallback(async () => {
-    try {
-      const allExecutions = await fetchActiveWorkflows();
-
-      // Group by projectId, keeping only the most recent for each
-      const executionMap = new Map<string, WorkflowExecution>();
-
-      for (const exec of allExecutions) {
-        // Filter by projectIds if provided
-        if (projectIds && !projectIds.includes(exec.projectId)) {
-          continue;
-        }
-
-        const existing = executionMap.get(exec.projectId);
-        if (
-          !existing ||
-          new Date(exec.updatedAt) > new Date(existing.updatedAt)
-        ) {
-          executionMap.set(exec.projectId, exec);
-        }
-      }
-
-      // Remove executions that have faded (completed more than 30s ago)
-      const now = Date.now();
-      for (const [projectId, exec] of executionMap) {
-        if (exec.status === 'completed' || exec.status === 'failed' || exec.status === 'cancelled') {
-          const updatedAt = new Date(exec.updatedAt).getTime();
-          const age = now - updatedAt;
-          // Keep for 30s after completion for fade effect
-          if (age > 30000) {
-            executionMap.delete(projectId);
-          }
-        }
-      }
-
-      setExecutions(executionMap);
-      setError(null);
-    } catch (e) {
-      setError(e instanceof Error ? e : new Error('Unknown error'));
-    }
-  }, [projectIds]);
-
-  // Start polling
-  const startPolling = useCallback(() => {
-    clearPolling();
-    pollIntervalRef.current = setInterval(() => {
-      refresh();
-    }, POLL_INTERVAL_MS);
-  }, [refresh, clearPolling]);
-
-  // Initial fetch on mount
-  useEffect(() => {
-    let mounted = true;
-
-    const init = async () => {
-      setIsLoading(true);
-      try {
-        await refresh();
-      } finally {
-        if (mounted) {
-          setIsLoading(false);
-        }
-      }
-    };
-
-    init();
-
-    return () => {
-      mounted = false;
-      clearPolling();
-    };
-  }, [refresh, clearPolling]);
-
-  // Start/stop polling based on active workflows
-  useEffect(() => {
-    if (hasActiveWorkflows) {
-      startPolling();
-    } else {
-      clearPolling();
-    }
-
-    return () => {
-      clearPolling();
-    };
-  }, [hasActiveWorkflows, startPolling, clearPolling]);
-
-  return {
-    executions,
-    isLoading,
-    error,
-    refresh,
-  };
-}
diff --git a/packages/dashboard/src/lib/action-definitions.ts b/packages/dashboard/src/lib/action-definitions.ts
index ddb27a1..dab510f 100644
--- a/packages/dashboard/src/lib/action-definitions.ts
+++ b/packages/dashboard/src/lib/action-definitions.ts
@@ -22,7 +22,7 @@ export interface ActionDefinition {
   label: string;
   /** Short description for tooltips */
   description: string;
-  /** CLI command to execute (e.g., "init", "doctor") */
+  /** CLI command to execute (e.g., "init", "check", "status") */
   command: string;
   /** Default arguments to pass to the command */
   args: string[];
@@ -50,9 +50,9 @@ export interface ActionDefinition {
  * All available project actions
  *
  * SpecFlow CLI v3.0 commands:
+ * - init: Initialize a new project with full 3.0 compliance
  * - status: Get complete project status
  * - check: Deep validation with auto-fix support
- * - state init: Initialize a new state file
  * - phase: Manage phase lifecycle
  */
 export const ACTION_DEFINITIONS: ActionDefinition[] = [
@@ -60,16 +60,18 @@ export const ACTION_DEFINITIONS: ActionDefinition[] = [
   {
     id: 'init',
     label: 'Initialize',
-    description: 'Initialize SpecFlow state for this project',
-    command: 'state',
-    args: ['init'],
+    description: 'Initialize SpecFlow project with full 3.0 compliance',
+    command: 'init',
+    args: [],
     requiresConfirmation: true,
     confirmationTitle: 'Initialize Project',
-    confirmationDescription: 'This will create a new orchestration state file.',
+    confirmationDescription: 'This will create a fully compliant SpecFlow 3.0 project structure.',
     confirmationItems: [
-      '.specflow/ directory',
-      'orchestration-state.json',
-      'Project registration',
+      '.specflow/ directory (state, manifest, workflows)',
+      '.specify/ directories (memory, templates, phases, archive)',
+      'ROADMAP.md and BACKLOG.md templates',
+      'specs/ directory for phase artifacts',
+      'Project registration in global registry',
     ],
     applicableStatuses: ['not_initialized'],
     variant: 'default',
diff --git a/packages/dashboard/src/lib/services/batch-parser.ts b/packages/dashboard/src/lib/services/batch-parser.ts
index fe27e9e..bb22a92 100644
--- a/packages/dashboard/src/lib/services/batch-parser.ts
+++ b/packages/dashboard/src/lib/services/batch-parser.ts
@@ -462,3 +462,90 @@ export function getBatchPlanSummary(plan: BatchPlan): string {
 
   return `${batchCount} batch${batchCount !== 1 ? 'es' : ''} from tasks.md sections (${taskCount} tasks)`;
 }
+
+/**
+ * Verify which tasks from a batch are actually complete in tasks.md
+ *
+ * @param projectPath - Path to the project root
+ * @param taskIds - List of task IDs to verify
+ * @returns Object with completed and incomplete task IDs
+ */
+export function verifyBatchTaskCompletion(
+  projectPath: string,
+  taskIds: string[]
+): { completedTasks: string[]; incompleteTasks: string[] } {
+  // Re-parse tasks.md to get current state
+  const plan = parseBatchesFromProject(projectPath);
+
+  if (!plan) {
+    // Can't verify - assume all incomplete
+    return { completedTasks: [], incompleteTasks: taskIds };
+  }
+
+  // Get all tasks from the current plan
+  const allTaskIds = new Set<string>();
+  const completedTaskIds = new Set<string>();
+
+  // We need to re-parse to get completion status, not just batch structure
+  const specsDir = join(projectPath, 'specs');
+  const { readdirSync } = require('fs');
+  const entries = readdirSync(specsDir, { withFileTypes: true });
+
+  const phaseDirs = entries
+    .filter((e: { isDirectory: () => boolean; name: string }) =>
+      e.isDirectory() && /^\d{4}-/.test(e.name)
+    )
+    .map((e: { name: string }) => e.name)
+    .sort()
+    .reverse();
+
+  if (phaseDirs.length === 0) {
+    return { completedTasks: [], incompleteTasks: taskIds };
+  }
+
+  const tasksPath = join(specsDir, phaseDirs[0], 'tasks.md');
+  if (!existsSync(tasksPath)) {
+    return { completedTasks: [], incompleteTasks: taskIds };
+  }
+
+  const content = readFileSync(tasksPath, 'utf-8');
+  const lines = content.split('\n');
+
+  // Parse all tasks and their completion status
+  for (const line of lines) {
+    const taskMatch = line.match(TASK_PATTERN);
+    if (taskMatch) {
+      const completed = taskMatch[1].toLowerCase() === 'x';
+      const id = taskMatch[2];
+      allTaskIds.add(id);
+      if (completed) {
+        completedTaskIds.add(id);
+      }
+    }
+  }
+
+  // Check which of the requested tasks are complete
+  const completedTasks: string[] = [];
+  const incompleteTasks: string[] = [];
+
+  for (const taskId of taskIds) {
+    if (completedTaskIds.has(taskId)) {
+      completedTasks.push(taskId);
+    } else {
+      incompleteTasks.push(taskId);
+    }
+  }
+
+  return { completedTasks, incompleteTasks };
+}
+
+/**
+ * Check total incomplete task count in a project
+ *
+ * @param projectPath - Path to the project root
+ * @returns Number of incomplete tasks, or null if can't determine
+ */
+export function getTotalIncompleteTasks(projectPath: string): number | null {
+  const plan = parseBatchesFromProject(projectPath);
+  return plan?.totalIncomplete ?? null;
+}
diff --git a/packages/dashboard/src/lib/services/claude-helper.ts b/packages/dashboard/src/lib/services/claude-helper.ts
index 8de0b98..28b5fb3 100644
--- a/packages/dashboard/src/lib/services/claude-helper.ts
+++ b/packages/dashboard/src/lib/services/claude-helper.ts
@@ -17,7 +17,7 @@ import { spawn, execSync } from 'child_process';
 import { existsSync, mkdirSync, writeFileSync, readFileSync, unlinkSync } from 'fs';
 import { join } from 'path';
 import { randomUUID } from 'crypto';
-import type { z } from 'zod';
+import { z } from 'zod';
 import zodToJsonSchema from 'zod-to-json-schema';
 import type {
   ClaudeHelperOptions,
@@ -558,3 +558,444 @@ export async function healWithClaude<T>(
     ...options,
   });
 }
+
+// =============================================================================
+// Claude Helper Use Cases (G3) - Exactly 3 allowed use cases
+// =============================================================================
+
+// Schema for state recovery response
+const StateRecoverySchema = z.object({
+  action: z.enum(['use_recovered', 'use_heuristic', 'abort']),
+  confidence: z.number().min(0).max(1),
+  recovered_state: z.object({
+    step: z.object({
+      current: z.string(),
+      index: z.number(),
+      status: z.string(),
+    }).optional(),
+    phase: z.object({
+      number: z.string(),
+      name: z.string(),
+    }).optional(),
+  }).optional(),
+  reason: z.string(),
+});
+
+type StateRecoveryResult = z.infer<typeof StateRecoverySchema>;
+
+// Schema for stale workflow diagnosis
+const StaleWorkflowSchema = z.object({
+  action: z.enum(['continue', 'restart_task', 'skip_task', 'abort']),
+  confidence: z.enum(['high', 'medium', 'low']),
+  reason: z.string(),
+  context: z.object({
+    last_output: z.string().optional(),
+    likely_stuck_at: z.string().optional(),
+  }).optional(),
+});
+
+type StaleWorkflowResult = z.infer<typeof StaleWorkflowSchema>;
+
+// Schema for failed step diagnosis
+const FailedStepSchema = z.object({
+  action: z.enum(['retry', 'skip_tasks', 'run_prerequisite', 'abort']),
+  confidence: z.enum(['high', 'medium', 'low']),
+  reason: z.string(),
+  tasks_to_skip: z.array(z.string()).optional(),
+  prerequisite: z.string().optional(),
+});
+
+type FailedStepResult = z.infer<typeof FailedStepSchema>;
+
+/**
+ * Recovery result from state recovery
+ */
+export interface StateRecoveryResponse {
+  success: boolean;
+  state?: {
+    step: {
+      current: string;
+      index: number;
+      status: string;
+    };
+    phase?: {
+      number: string;
+      name: string;
+    };
+  };
+  source: 'claude' | 'heuristic' | 'none';
+  reason: string;
+  cost: number;
+}
+
+/**
+ * Case 1: Corrupt/Missing State Recovery (G3.1-G3.6)
+ *
+ * Attempts to recover orchestration state using Claude Helper.
+ * Falls back to heuristic recovery if Claude fails.
+ * Silently returns null if all recovery attempts fail.
+ *
+ * @param projectPath - Path to the project
+ * @param existingState - The corrupt/partial existing state (if any)
+ * @param backupPath - Path to create backup before recovery
+ */
+export async function recoverStateWithClaudeHelper(
+  projectPath: string,
+  existingState: Record<string, unknown> | null,
+  backupPath: string
+): Promise<StateRecoveryResponse> {
+  // G3.2: Create backup BEFORE attempting recovery
+  if (existingState && backupPath) {
+    try {
+      writeFileSync(backupPath, JSON.stringify(existingState, null, 2), 'utf-8');
+    } catch (error) {
+      // Continue even if backup fails - recovery attempt is still valuable
+      console.warn('[claude-helper] Failed to create backup:', error);
+    }
+  }
+
+  // G3.3: Call Claude Helper with task: 'recover_state'
+  const message = `
+You are analyzing a corrupt or missing orchestration state file.
+
+Existing state (may be corrupt or partial):
+${existingState ? JSON.stringify(existingState, null, 2) : 'null (missing)'}
+
+Analyze the project to determine the correct orchestration state:
+1. Check .specflow/orchestration-state.json for any recoverable data
+2. Check specs/ directory for active phase artifacts
+3. Check ROADMAP.md for phase information
+
+Provide your best assessment of the current state.
+`;
+
+  try {
+    const response = await claudeHelper<StateRecoveryResult>({
+      message,
+      schema: StateRecoverySchema,
+      projectPath,
+      model: 'haiku',
+      tools: ['Read', 'Glob'],
+      maxTurns: 3,
+      maxBudgetUsd: 0.5,
+      noSessionPersistence: true,
+    });
+
+    // G3.4: If Claude Helper succeeds + confidence > 0.7 → use recovered state
+    if (response.success && response.result.confidence > 0.7 && response.result.recovered_state?.step) {
+      return {
+        success: true,
+        state: {
+          step: response.result.recovered_state.step as StateRecoveryResponse['state'] extends { step: infer S } ? S : never,
+          phase: response.result.recovered_state.phase,
+        },
+        source: 'claude',
+        reason: response.result.reason,
+        cost: response.cost,
+      };
+    }
+
+    // G3.5: If Claude Helper fails or low confidence → try heuristic recovery (silent)
+    const heuristicResult = tryHeuristicStateRecovery(projectPath);
+    if (heuristicResult) {
+      return {
+        success: true,
+        state: heuristicResult,
+        source: 'heuristic',
+        reason: 'Recovered using heuristic analysis',
+        cost: response.cost,
+      };
+    }
+
+    // G3.6: If heuristic fails → return null (caller sets needs_attention)
+    return {
+      success: false,
+      source: 'none',
+      reason: 'All recovery methods failed',
+      cost: response.cost,
+    };
+  } catch {
+    // G3.5: Silent fallback to heuristic on error
+    const heuristicResult = tryHeuristicStateRecovery(projectPath);
+    if (heuristicResult) {
+      return {
+        success: true,
+        state: heuristicResult,
+        source: 'heuristic',
+        reason: 'Recovered using heuristic (Claude Helper unavailable)',
+        cost: 0,
+      };
+    }
+
+    return {
+      success: false,
+      source: 'none',
+      reason: 'All recovery methods failed',
+      cost: 0,
+    };
+  }
+}
+
+/**
+ * Heuristic state recovery - analyzes project files to infer state
+ * Called when Claude Helper fails or has low confidence
+ */
+function tryHeuristicStateRecovery(projectPath: string): StateRecoveryResponse['state'] | null {
+  try {
+    // Check specs directory for active artifacts
+    const specsDir = join(projectPath, 'specs');
+    if (!existsSync(specsDir)) return null;
+
+    // Find the most recent specs folder (highest number prefix)
+    const dirsRaw = require('fs').readdirSync(specsDir, { withFileTypes: true }) as { name: string; isDirectory: () => boolean }[];
+    const dirs = dirsRaw
+      .filter((d: { isDirectory: () => boolean }) => d.isDirectory())
+      .map((d: { name: string }) => d.name)
+      .filter((name: string) => /^\d+/.test(name))
+      .sort()
+      .reverse();
+
+    if (dirs.length === 0) return null;
+
+    const activeDir = dirs[0];
+    const match = activeDir.match(/^(\d+)-(.+)/);
+    if (!match) return null;
+
+    const phaseNumber = match[1];
+    const phaseName = match[2];
+    const phasePath = join(specsDir, activeDir);
+
+    // Determine current step based on what artifacts exist
+    const hasSpec = existsSync(join(phasePath, 'spec.md'));
+    const hasPlan = existsSync(join(phasePath, 'plan.md'));
+    const hasTasks = existsSync(join(phasePath, 'tasks.md'));
+    const hasChecklists = existsSync(join(phasePath, 'checklists'));
+
+    let currentStep = 'design';
+    let stepIndex = 0;
+    let status = 'in_progress';
+
+    if (hasChecklists) {
+      // All design artifacts exist, likely in implement or verify
+      currentStep = 'implement';
+      stepIndex = 2;
+    } else if (hasTasks && hasPlan) {
+      currentStep = 'implement';
+      stepIndex = 2;
+    } else if (hasPlan) {
+      currentStep = 'design';
+      stepIndex = 0;
+      status = 'complete';
+    } else if (hasSpec) {
+      currentStep = 'design';
+      stepIndex = 0;
+    }
+
+    return {
+      step: {
+        current: currentStep,
+        index: stepIndex,
+        status,
+      },
+      phase: {
+        number: phaseNumber,
+        name: phaseName,
+      },
+    };
+  } catch {
+    return null;
+  }
+}
+
+/**
+ * Stale workflow response
+ */
+export interface StaleWorkflowResponse {
+  action: 'continue' | 'restart_task' | 'skip_task' | 'abort';
+  reason: string;
+  confidence: 'high' | 'medium' | 'low';
+  context?: {
+    last_output?: string;
+    likely_stuck_at?: string;
+  };
+  cost: number;
+}
+
+/**
+ * Case 2: Stale Workflow Diagnosis (G3.7-G3.10)
+ *
+ * Diagnoses a workflow that has been running with no output for >10 minutes.
+ * Returns recommended action. Sets needs_attention if Claude Helper fails.
+ *
+ * @param projectPath - Path to the project
+ * @param workflowId - ID of the stale workflow
+ * @param lastOutput - Last output from the workflow (if any)
+ * @param staleMinutes - How long the workflow has been stale
+ */
+export async function handleStaleWorkflow(
+  projectPath: string,
+  workflowId: string,
+  lastOutput: string | undefined,
+  staleMinutes: number
+): Promise<StaleWorkflowResponse> {
+  // G3.8: Call Claude Helper with task: 'diagnose_stale_workflow'
+  const message = `
+You are diagnosing a stale workflow.
+
+Workflow ID: ${workflowId}
+Time since last activity: ${staleMinutes} minutes
+
+Last output:
+${lastOutput || '(no output available)'}
+
+Analyze the situation and recommend an action:
+- continue: Wait longer (if workflow might still be working)
+- restart_task: Kill and restart the current task
+- skip_task: Skip the current task and move on
+- abort: Stop orchestration entirely
+
+Be conservative - prefer 'continue' if there's any chance the workflow is still working.
+`;
+
+  try {
+    const response = await claudeHelper<StaleWorkflowResult>({
+      message,
+      schema: StaleWorkflowSchema,
+      projectPath,
+      model: 'haiku',
+      tools: ['Read', 'Glob'],
+      maxTurns: 2,
+      maxBudgetUsd: 0.25,
+      noSessionPersistence: true,
+    });
+
+    // G3.9: Handle response actions
+    if (response.success) {
+      return {
+        action: response.result.action,
+        reason: response.result.reason,
+        confidence: response.result.confidence,
+        context: response.result.context,
+        cost: response.cost,
+      };
+    }
+
+    // G3.10: If Claude Helper fails → needs_attention (silent, no error toast)
+    return {
+      action: 'continue', // Default to waiting
+      reason: 'Claude Helper unavailable, defaulting to continue',
+      confidence: 'low',
+      cost: response.cost,
+    };
+  } catch {
+    // Silent failure - default to continue
+    return {
+      action: 'continue',
+      reason: 'Claude Helper error, defaulting to continue',
+      confidence: 'low',
+      cost: 0,
+    };
+  }
+}
+
+/**
+ * Failed step response
+ */
+export interface FailedStepResponse {
+  action: 'retry' | 'skip_tasks' | 'run_prerequisite' | 'abort' | 'needs_attention';
+  reason: string;
+  confidence: 'high' | 'medium' | 'low';
+  tasksToSkip?: string[];
+  prerequisite?: string;
+  cost: number;
+}
+
+/**
+ * Case 3: Failed Step Diagnosis (G3.11-G3.16)
+ *
+ * Diagnoses a failed step and recommends recovery action.
+ * Skips Claude Helper if max heal attempts reached.
+ *
+ * @param projectPath - Path to the project
+ * @param stepName - Name of the failed step
+ * @param errorMessage - Error message from the failure
+ * @param healAttempts - Number of heal attempts already made
+ * @param maxHealAttempts - Maximum allowed heal attempts
+ */
+export async function handleFailedStep(
+  projectPath: string,
+  stepName: string,
+  errorMessage: string | undefined,
+  healAttempts: number,
+  maxHealAttempts: number
+): Promise<FailedStepResponse> {
+  // G3.12: Pre-check heal attempts → skip Claude Helper if exhausted
+  if (healAttempts >= maxHealAttempts) {
+    return {
+      action: 'needs_attention',
+      reason: `Max heal attempts (${maxHealAttempts}) reached`,
+      confidence: 'high',
+      cost: 0,
+    };
+  }
+
+  // G3.13: Call Claude Helper with task: 'diagnose_failed_step'
+  const message = `
+You are diagnosing a failed orchestration step.
+
+Step: ${stepName}
+Error: ${errorMessage || '(no error message)'}
+Heal attempts: ${healAttempts}/${maxHealAttempts}
+
+Analyze the error and recommend an action:
+- retry: Try the step again (maybe with different approach)
+- skip_tasks: Skip specific failing tasks and continue
+- run_prerequisite: Run a prerequisite step first
+- abort: Stop orchestration entirely
+
+If the error is transient (network, timeout), recommend 'retry'.
+If specific tasks are failing, list them in tasks_to_skip.
+If a prerequisite is needed, specify it.
+`;
+
+  try {
+    const response = await claudeHelper<FailedStepResult>({
+      message,
+      schema: FailedStepSchema,
+      projectPath,
+      model: 'haiku',
+      tools: ['Read', 'Glob'],
+      maxTurns: 2,
+      maxBudgetUsd: 0.25,
+      noSessionPersistence: true,
+    });
+
+    // G3.14: Handle response actions
+    if (response.success) {
+      return {
+        action: response.result.action,
+        reason: response.result.reason,
+        confidence: response.result.confidence,
+        tasksToSkip: response.result.tasks_to_skip,
+        prerequisite: response.result.prerequisite,
+        cost: response.cost,
+      };
+    }
+
+    // G3.15: If Claude Helper fails + heal attempts remaining → simple retry (silent)
+    return {
+      action: 'retry',
+      reason: 'Claude Helper unavailable, attempting simple retry',
+      confidence: 'low',
+      cost: response.cost,
+    };
+  } catch {
+    // G3.15: Silent failure - default to retry if attempts remaining
+    return {
+      action: 'retry',
+      reason: 'Claude Helper error, attempting simple retry',
+      confidence: 'low',
+      cost: 0,
+    };
+  }
+}
diff --git a/packages/dashboard/src/lib/services/orchestration-decisions.ts b/packages/dashboard/src/lib/services/orchestration-decisions.ts
new file mode 100644
index 0000000..7fdda6f
--- /dev/null
+++ b/packages/dashboard/src/lib/services/orchestration-decisions.ts
@@ -0,0 +1,662 @@
+/**
+ * Orchestration Decision Logic - Pure Functions
+ *
+ * This module contains pure decision-making functions extracted from orchestration-runner.ts
+ * for better testability and separation of concerns.
+ *
+ * Key principles:
+ * - All functions are pure (no I/O, no side effects)
+ * - State is passed in, decisions are returned
+ * - Trusts step.status from state file (FR-001)
+ * - Complete decision matrix with no ambiguous cases (FR-002)
+ */
+
+import type {
+  OrchestrationExecution,
+  OrchestrationPhase,
+  OrchestrationState,
+  StepStatus,
+  BatchItem,
+} from '@specflow/shared';
+import { STEP_INDEX_MAP } from '@specflow/shared';
+
+// =============================================================================
+// Types
+// =============================================================================
+
+/**
+ * Decision actions that the runner can execute
+ */
+export type DecisionAction =
+  | 'wait'                    // Continue polling, nothing to do
+  | 'wait_with_backoff'       // Wait with exponential backoff (lookup failure)
+  | 'wait_user_gate'          // Wait for USER_GATE confirmation
+  | 'wait_merge'              // Wait for user to trigger merge
+  | 'transition'              // Transition to next step
+  | 'spawn'                   // Spawn workflow for current step
+  | 'spawn_batch'             // Spawn workflow for current batch
+  | 'advance_batch'           // Move to next batch
+  | 'initialize_batches'      // Initialize batch tracking
+  | 'force_step_complete'     // Force step.status to complete (all batches done)
+  | 'heal_batch'              // Attempt to heal failed batch
+  | 'pause'                   // Pause orchestration (pauseBetweenBatches)
+  | 'complete'                // Orchestration complete
+  | 'recover_stale'           // Recover from stale workflow
+  | 'recover_failed'          // Recover from failed step/workflow
+  | 'needs_attention'         // Needs user intervention
+  | 'fail';                   // Terminal failure
+
+/**
+ * Result of the decision function
+ */
+export interface DecisionResult {
+  action: DecisionAction;
+  reason: string;
+  /** Skill to spawn (for spawn/spawn_batch actions) */
+  skill?: string;
+  /** Next step to transition to */
+  nextStep?: string;
+  /** Next step index */
+  nextIndex?: number;
+  /** Batch context for implement phase */
+  batchContext?: string;
+  /** Batch index for batch operations */
+  batchIndex?: number;
+  /** Error message for failure cases */
+  errorMessage?: string;
+  /** Recovery options for needs_attention */
+  recoveryOptions?: Array<'retry' | 'skip' | 'abort'>;
+  /** Failed workflow ID for recovery context */
+  failedWorkflowId?: string;
+  /** Backoff time in ms */
+  backoffMs?: number;
+  /** Workflow ID for stale recovery */
+  workflowId?: string;
+}
+
+/**
+ * Workflow state passed to decision functions
+ * Simplified interface to avoid coupling to workflow service
+ * NOTE: 'detached' and 'stale' are intermediate health states that
+ * can occur during workflow execution monitoring
+ */
+export interface WorkflowState {
+  id: string;
+  status: 'running' | 'waiting_for_input' | 'completed' | 'failed' | 'cancelled' | 'detached' | 'stale';
+  error?: string;
+  lastActivityAt?: string;
+}
+
+/**
+ * Input for makeDecision - all state needed to make a decision
+ */
+export interface DecisionInput {
+  /** Current orchestration step from state file */
+  step: {
+    current: string | null;
+    index: number | null;
+    status: StepStatus | null;
+  };
+  /** Phase info from state file */
+  phase: {
+    hasUserGate?: boolean;
+    userGateStatus?: 'pending' | 'confirmed' | 'skipped';
+  };
+  /** Orchestration execution state */
+  execution: OrchestrationExecution;
+  /** Current workflow state (if any) */
+  workflow: WorkflowState | null;
+  /** Last file change time (for staleness detection) */
+  lastFileChangeTime?: number;
+  /** Lookup failures count (for backoff) */
+  lookupFailures?: number;
+  /** Current timestamp (for duration checks) */
+  currentTime?: number;
+}
+
+// =============================================================================
+// Constants
+// =============================================================================
+
+/** Stale threshold - 10 minutes with no activity */
+export const STALE_THRESHOLD_MS = 10 * 60 * 1000;
+
+/** Maximum orchestration duration - 4 hours */
+export const MAX_ORCHESTRATION_DURATION_MS = 4 * 60 * 60 * 1000;
+
+/** Step order for transitions */
+const STEP_ORDER: readonly string[] = ['design', 'analyze', 'implement', 'verify', 'merge'] as const;
+
+// =============================================================================
+// Helper Functions (Pure)
+// =============================================================================
+
+/**
+ * Get the skill command for a given step
+ */
+export function getSkillForStep(step: string): string {
+  const skillMap: Record<string, string> = {
+    design: 'flow.design',
+    analyze: 'flow.analyze',
+    implement: 'flow.implement',
+    verify: 'flow.verify',
+    merge: 'flow.merge',
+  };
+  return skillMap[step] || 'flow.implement';
+}
+
+/**
+ * Get the next step in the orchestration flow
+ * Returns null if current step is the last one (merge)
+ */
+export function getNextStep(current: string): string | null {
+  const currentIndex = STEP_ORDER.indexOf(current);
+  if (currentIndex === -1 || currentIndex >= STEP_ORDER.length - 1) {
+    return null;
+  }
+  return STEP_ORDER[currentIndex + 1];
+}
+
+/**
+ * Calculate exponential backoff for lookup failures
+ */
+export function calculateExponentialBackoff(failures: number): number {
+  const baseMs = 1000;
+  const maxMs = 30000;
+  const backoff = Math.min(baseMs * Math.pow(2, failures), maxMs);
+  return backoff;
+}
+
+/**
+ * Check if all batches are complete (completed or healed)
+ */
+export function areAllBatchesComplete(batches: OrchestrationExecution['batches']): boolean {
+  if (batches.items.length === 0) return false;
+  return batches.items.every(
+    (b) => b.status === 'completed' || b.status === 'healed'
+  );
+}
+
+/**
+ * Get the current batch from execution state
+ */
+export function getCurrentBatch(execution: OrchestrationExecution): BatchItem | undefined {
+  return execution.batches.items[execution.batches.current];
+}
+
+// =============================================================================
+// Batch Handling (Pure) - FR-003
+// =============================================================================
+
+/**
+ * Handle implement phase batching decisions
+ *
+ * This is the batch state machine from FR-003:
+ * - No batches → initialize_batches
+ * - Pending batch + no workflow → spawn_batch
+ * - Running batch + workflow running → let staleness check handle
+ * - Completed batch + pauseBetweenBatches → pause
+ * - Completed batch + continue → advance_batch
+ * - Failed batch + heal attempts remaining → heal_batch
+ * - Failed batch + no attempts → recover_failed
+ * - All batches complete + step not complete → force_step_complete
+ *
+ * Returns null if no batch-specific decision needed (defer to main matrix)
+ */
+export function handleImplementBatching(
+  step: DecisionInput['step'],
+  execution: OrchestrationExecution,
+  workflow: WorkflowState | null
+): DecisionResult | null {
+  const { batches, config } = execution;
+
+  // No batches yet - need to initialize (G2.1)
+  if (batches.total === 0) {
+    return {
+      action: 'initialize_batches',
+      reason: 'No batches populated',
+    };
+  }
+
+  const currentBatch = batches.items[batches.current];
+  const allBatchesComplete = areAllBatchesComplete(batches);
+
+  // All batches done (G2.10) → check if step.status needs updating
+  if (allBatchesComplete) {
+    // Trust sub-command to set step.status=complete
+    // But if it didn't, force it (G2.11)
+    if (step.status !== 'complete') {
+      return {
+        action: 'force_step_complete',
+        reason: 'All batches complete but step.status not updated',
+      };
+    }
+    return null; // Let normal decision matrix handle transition
+  }
+
+  // Current batch running with active workflow (G2.5) → defer to staleness check
+  if (currentBatch?.status === 'running' && workflow?.status === 'running') {
+    return null; // Let normal staleness check handle this
+  }
+
+  // Current batch running but workflow completed → mark batch complete and advance (G2.5b)
+  if (currentBatch?.status === 'running' && workflow?.status === 'completed') {
+    // Check pauseBetweenBatches config (G2.6)
+    if (config.pauseBetweenBatches) {
+      return {
+        action: 'advance_batch',
+        batchIndex: batches.current,
+        reason: 'Batch workflow complete, pauseBetweenBatches enabled - completing and pausing',
+      };
+    }
+
+    const nextBatchIndex = batches.current + 1;
+    if (nextBatchIndex < batches.total) {
+      return {
+        action: 'advance_batch',
+        batchIndex: batches.current,
+        reason: `Batch ${batches.current} workflow complete, advancing to batch ${nextBatchIndex}`,
+      };
+    }
+
+    // All batches done, but step not marked complete yet
+    return {
+      action: 'force_step_complete',
+      reason: 'All batches completed (last batch workflow done)',
+    };
+  }
+
+  // Current batch completed or healed → advance to next batch (G2.7, G2.8)
+  if (currentBatch?.status === 'completed' || currentBatch?.status === 'healed') {
+    // Check pauseBetweenBatches config (G2.6)
+    if (config.pauseBetweenBatches) {
+      return {
+        action: 'pause',
+        reason: 'Batch complete, pauseBetweenBatches enabled',
+      };
+    }
+
+    const nextBatchIndex = batches.current + 1;
+    if (nextBatchIndex < batches.total) {
+      return {
+        action: 'advance_batch',
+        batchIndex: nextBatchIndex,
+        reason: `Batch ${batches.current} complete, advancing to batch ${nextBatchIndex}`,
+      };
+    }
+  }
+
+  // Current batch pending + no workflow (G2.4) → spawn batch
+  if (currentBatch?.status === 'pending' && !workflow) {
+    const batchContext = `Execute tasks ${currentBatch.taskIds.join(', ')} in section "${currentBatch.section}"`;
+    return {
+      action: 'spawn_batch',
+      skill: 'flow.implement',
+      batchContext: config.additionalContext
+        ? `${batchContext}\n\n${config.additionalContext}`
+        : batchContext,
+      reason: `Starting batch ${batches.current + 1}/${batches.total}: ${currentBatch.section}`,
+    };
+  }
+
+  // Current batch failed (G2.9) → try healing
+  if (currentBatch?.status === 'failed') {
+    if (config.autoHealEnabled && currentBatch.healAttempts < config.maxHealAttempts) {
+      return {
+        action: 'heal_batch',
+        batchIndex: batches.current,
+        reason: 'Batch failed, attempting heal',
+      };
+    }
+    return {
+      action: 'recover_failed',
+      reason: `Batch ${batches.current} failed after ${currentBatch.healAttempts} heal attempts`,
+      errorMessage: `Batch ${batches.current} failed`,
+    };
+  }
+
+  return null; // No batch-specific decision, use normal matrix
+}
+
+// =============================================================================
+// Main Decision Function (Pure) - FR-001, FR-002
+// =============================================================================
+
+/**
+ * Make a decision about what to do next
+ *
+ * This is the complete decision matrix from FR-002. Every possible state
+ * combination has an explicit action - no ambiguous cases.
+ *
+ * Key principle (FR-001): Trust step.status from state file. Sub-commands
+ * set step.status=complete when done. We don't check for artifacts.
+ *
+ * @param input - All state needed to make a decision
+ * @returns Decision result with action and reason
+ */
+export function makeDecision(input: DecisionInput): DecisionResult {
+  const { step, phase, execution, workflow, lastFileChangeTime, lookupFailures, currentTime } = input;
+  const { config, batches } = execution;
+  const currentStep = step.current || 'design';
+
+  // ═══════════════════════════════════════════════════════════════════
+  // PRE-DECISION GATES (G1.1, G1.2)
+  // ═══════════════════════════════════════════════════════════════════
+
+  // G1.1: Budget gate - fail if budget exceeded
+  if (execution.totalCostUsd >= config.budget.maxTotal) {
+    return {
+      action: 'fail',
+      reason: `Budget exceeded: $${execution.totalCostUsd.toFixed(2)} >= $${config.budget.maxTotal}`,
+      errorMessage: 'Budget limit exceeded',
+    };
+  }
+
+  // G1.2: Duration gate - needs_attention if running too long (4 hours)
+  if (currentTime !== undefined) {
+    const startTime = new Date(execution.startedAt).getTime();
+    const duration = currentTime - startTime;
+    if (duration > MAX_ORCHESTRATION_DURATION_MS) {
+      return {
+        action: 'needs_attention',
+        reason: `Orchestration running too long: ${Math.round(duration / (60 * 60 * 1000))} hours`,
+        errorMessage: 'Orchestration duration exceeded 4 hours',
+        recoveryOptions: ['retry', 'abort'],
+      };
+    }
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // IMPLEMENT PHASE: BATCH HANDLING (checked first) - FR-003
+  // ═══════════════════════════════════════════════════════════════════
+  if (currentStep === 'implement') {
+    const batchDecision = handleImplementBatching(step, execution, workflow);
+    if (batchDecision) return batchDecision;
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW IS RUNNING (G1.4, G1.5)
+  // ═══════════════════════════════════════════════════════════════════
+  if (workflow?.status === 'running') {
+    // Check for stale workflow (G1.5)
+    // Use the workflow's lastActivityAt, NOT project file changes
+    // A workflow is stale if it's been running but hasn't had any activity
+    if (workflow.lastActivityAt) {
+      const workflowActivityTime = new Date(workflow.lastActivityAt).getTime();
+      const staleDuration = Date.now() - workflowActivityTime;
+      if (staleDuration > STALE_THRESHOLD_MS) {
+        return {
+          action: 'recover_stale',
+          reason: `No activity for ${Math.round(staleDuration / 60000)} minutes`,
+          workflowId: workflow.id,
+        };
+      }
+    }
+
+    // Active workflow (G1.4)
+    return {
+      action: 'wait',
+      reason: 'Workflow running',
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW NEEDS INPUT (G1.6, G1.7)
+  // ═══════════════════════════════════════════════════════════════════
+  if (workflow?.status === 'waiting_for_input') {
+    return {
+      action: 'wait',
+      reason: 'Waiting for user input',
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW DETACHED OR STALE - Intermediate Health States
+  // These are monitoring states that indicate the workflow might be stuck
+  // We treat 'stale' as needing recovery and 'detached' as waiting
+  // ═══════════════════════════════════════════════════════════════════
+  if (workflow?.status === 'stale') {
+    console.log(`[orchestration-decisions] DEBUG: Workflow ${workflow.id} is stale`);
+    return {
+      action: 'recover_stale',
+      reason: `Workflow ${workflow.id} appears stale - no recent activity`,
+      workflowId: workflow.id,
+    };
+  }
+
+  if (workflow?.status === 'detached') {
+    // Detached means process was orphaned but might still be running
+    // Wait a bit and let the health checker determine final state
+    console.log(`[orchestration-decisions] DEBUG: Workflow ${workflow.id} is detached, waiting`);
+    return {
+      action: 'wait',
+      reason: `Workflow ${workflow.id} detached, waiting for health check`,
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW FAILED OR CANCELLED
+  // ═══════════════════════════════════════════════════════════════════
+  if (workflow?.status === 'failed' || workflow?.status === 'cancelled') {
+    // If cancelled by user, don't auto-heal
+    if (workflow.status === 'cancelled') {
+      return {
+        action: 'needs_attention',
+        reason: 'Workflow was cancelled by user',
+        errorMessage: 'Workflow cancelled',
+        recoveryOptions: ['retry', 'skip', 'abort'],
+        failedWorkflowId: workflow.id,
+      };
+    }
+
+    // If failed in implement phase, try auto-healing first (G2.9)
+    if (currentStep === 'implement' && config.autoHealEnabled) {
+      const currentBatch = batches.items[batches.current];
+      if (currentBatch && currentBatch.healAttempts < config.maxHealAttempts) {
+        return {
+          action: 'heal_batch',
+          reason: `Workflow failed, attempting heal (attempt ${currentBatch.healAttempts + 1}/${config.maxHealAttempts})`,
+          batchIndex: batches.current,
+        };
+      }
+    }
+
+    // Otherwise, needs user attention
+    return {
+      action: 'needs_attention',
+      reason: `Workflow ${workflow.status}: ${workflow.error || 'Unknown error'}`,
+      errorMessage: workflow.error,
+      recoveryOptions: ['retry', 'skip', 'abort'],
+      failedWorkflowId: workflow.id,
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW ID EXISTS BUT LOOKUP FAILS (G1.3)
+  // ═══════════════════════════════════════════════════════════════════
+  const storedWorkflowId = getStoredWorkflowId(execution, currentStep);
+  if (storedWorkflowId && !workflow) {
+    return {
+      action: 'wait_with_backoff',
+      reason: `Workflow ${storedWorkflowId} lookup failed, waiting...`,
+      backoffMs: calculateExponentialBackoff(lookupFailures || 0),
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // WORKFLOW COMPLETED - INFER STEP COMPLETION (G1.7)
+  // For non-implement phases, workflow completion means step is done.
+  // Implement phase uses batch logic instead (handled separately).
+  // ═══════════════════════════════════════════════════════════════════
+  console.log(`[orchestration-decisions] DEBUG: workflow=${workflow?.id ?? 'none'}, status=${workflow?.status ?? 'none'}, currentStep=${currentStep}`);
+  if (workflow?.status === 'completed' && currentStep !== 'implement') {
+    console.log(`[orchestration-decisions] DEBUG: Workflow completed for ${currentStep}, transitioning...`);
+    const nextStep = getNextStep(currentStep);
+
+    // All steps done - after merge completes
+    if (nextStep === null) {
+      return {
+        action: 'complete',
+        reason: 'All steps finished (workflow completed)',
+      };
+    }
+
+    // Verify complete → check USER_GATE before merge
+    if (currentStep === 'verify' && nextStep === 'merge') {
+      if (phase.hasUserGate && phase.userGateStatus !== 'confirmed') {
+        return {
+          action: 'wait_user_gate',
+          reason: 'USER_GATE requires confirmation',
+        };
+      }
+      if (!config.autoMerge) {
+        return {
+          action: 'wait_merge',
+          reason: 'Verify workflow complete, waiting for user to trigger merge',
+        };
+      }
+      return {
+        action: 'transition',
+        nextStep: 'merge',
+        nextIndex: STEP_INDEX_MAP.verify + 1,
+        skill: getSkillForStep('merge'),
+        reason: 'Verify workflow complete, auto-merge enabled',
+      };
+    }
+
+    // Normal step transition when workflow completes
+    return {
+      action: 'transition',
+      nextStep,
+      nextIndex: STEP_INDEX_MAP[nextStep as keyof typeof STEP_INDEX_MAP],
+      skill: getSkillForStep(nextStep),
+      reason: `${currentStep} workflow complete, advancing to ${nextStep}`,
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // STEP IS COMPLETE - DETERMINE NEXT ACTION (G1.8 - G1.12)
+  // ═══════════════════════════════════════════════════════════════════
+  if (step.status === 'complete') {
+    const nextStep = getNextStep(currentStep);
+
+    // All steps done - after merge completes (G1.11)
+    if (nextStep === null) {
+      return {
+        action: 'complete',
+        reason: 'All steps finished',
+      };
+    }
+
+    // Verify complete → check USER_GATE before merge (G1.8)
+    if (currentStep === 'verify' && nextStep === 'merge') {
+      // USER_GATE requires explicit confirmation
+      if (phase.hasUserGate && phase.userGateStatus !== 'confirmed') {
+        return {
+          action: 'wait_user_gate',
+          reason: 'USER_GATE requires confirmation',
+        };
+      }
+      // autoMerge disabled → wait for user to trigger (G1.9)
+      if (!config.autoMerge) {
+        return {
+          action: 'wait_merge',
+          reason: 'Auto-merge disabled, waiting for user',
+        };
+      }
+      // autoMerge enabled → transition to merge step (G1.10)
+      return {
+        action: 'transition',
+        nextStep: 'merge',
+        nextIndex: STEP_INDEX_MAP.verify + 1, // merge is after verify
+        skill: getSkillForStep('merge'),
+        reason: 'Verify complete, auto-merge enabled',
+      };
+    }
+
+    // Normal step transition (G1.12)
+    return {
+      action: 'transition',
+      nextStep,
+      nextIndex: STEP_INDEX_MAP[nextStep as keyof typeof STEP_INDEX_MAP],
+      skill: getSkillForStep(nextStep),
+      reason: `${currentStep} complete, advancing to ${nextStep}`,
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // STEP FAILED OR BLOCKED (G1.13, G1.14)
+  // ═══════════════════════════════════════════════════════════════════
+  if (step.status === 'failed' || step.status === 'blocked') {
+    return {
+      action: 'recover_failed',
+      reason: `Step ${currentStep} is ${step.status}`,
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // STEP IN PROGRESS BUT NO WORKFLOW (G1.15)
+  // ═══════════════════════════════════════════════════════════════════
+  if (step.status === 'in_progress' && !workflow) {
+    return {
+      action: 'spawn',
+      skill: getSkillForStep(currentStep),
+      reason: `Step ${currentStep} in_progress but no active workflow`,
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // STEP NOT STARTED - SPAWN WORKFLOW (G1.16, G1.17)
+  // ═══════════════════════════════════════════════════════════════════
+  if (step.status === 'not_started' || step.status === null || step.status === undefined) {
+    // Initialize batches when entering implement (G1.17)
+    if (currentStep === 'implement' && batches.total === 0) {
+      return {
+        action: 'initialize_batches',
+        reason: 'Entering implement, need to populate batches',
+      };
+    }
+    return {
+      action: 'spawn',
+      skill: getSkillForStep(currentStep),
+      reason: `Step ${currentStep} not started, spawning workflow`,
+    };
+  }
+
+  // ═══════════════════════════════════════════════════════════════════
+  // UNKNOWN STATUS - SHOULD NOT HAPPEN (G1.18)
+  // ═══════════════════════════════════════════════════════════════════
+  console.error(`[orchestration-decisions] Unknown step.status: ${step.status}`);
+  return {
+    action: 'needs_attention',
+    reason: `Unknown status: ${step.status}`,
+    errorMessage: `Unexpected step status: ${step.status}`,
+    recoveryOptions: ['retry', 'abort'],
+  };
+}
+
+// =============================================================================
+// Internal Helpers
+// =============================================================================
+
+/**
+ * Get the stored workflow ID for a given step from execution state
+ */
+function getStoredWorkflowId(execution: OrchestrationExecution, step: string): string | undefined {
+  const { executions, batches } = execution;
+
+  switch (step) {
+    case 'design':
+      return executions.design;
+    case 'analyze':
+      return executions.analyze;
+    case 'implement':
+      return batches.items[batches.current]?.workflowExecutionId;
+    case 'verify':
+      return executions.verify;
+    case 'merge':
+      return executions.merge;
+    default:
+      return undefined;
+  }
+}
diff --git a/packages/dashboard/src/lib/services/orchestration-runner.ts b/packages/dashboard/src/lib/services/orchestration-runner.ts
index c442dd4..fd75aa7 100644
--- a/packages/dashboard/src/lib/services/orchestration-runner.ts
+++ b/packages/dashboard/src/lib/services/orchestration-runner.ts
@@ -16,16 +16,24 @@
  * - Claude fallback analyzer (after 3 unclear state checks)
  */
 
-import { execSync } from 'child_process';
 import { join } from 'path';
-import { existsSync, readFileSync } from 'fs';
+import { existsSync, readFileSync, readdirSync, writeFileSync, unlinkSync, type Dirent } from 'fs';
 import { z } from 'zod';
-import { orchestrationService } from './orchestration-service';
+import { orchestrationService, getNextPhase, isPhaseComplete } from './orchestration-service';
 import { workflowService, type WorkflowExecution } from './workflow-service';
 import { attemptHeal, getHealingSummary } from './auto-healing-service';
 import { quickDecision } from './claude-helper';
-import { parseBatchesFromProject } from './batch-parser';
-import { isClaudeHelperError, type OrchestrationExecution, type OrchestrationPhase } from '@specflow/shared';
+import { parseBatchesFromProject, verifyBatchTaskCompletion, getTotalIncompleteTasks } from './batch-parser';
+import { isClaudeHelperError, type OrchestrationExecution, type OrchestrationPhase, type SSEEvent } from '@specflow/shared';
+// G2 Compliance: Import pure decision functions from orchestration-decisions module
+import {
+  makeDecision as makeDecisionPure,
+  type DecisionInput,
+  type DecisionResult as PureDecisionResult,
+  type WorkflowState,
+  getSkillForStep,
+  STALE_THRESHOLD_MS,
+} from './orchestration-decisions';
 
 // =============================================================================
 // Types
@@ -40,6 +48,283 @@ interface RunnerContext {
   consecutiveUnclearChecks: number;
 }
 
+/**
+ * Dependency injection interface for testing (T120/G12.4)
+ * Allows injecting mock services without vi.mock
+ */
+export interface OrchestrationDeps {
+  orchestrationService: typeof orchestrationService;
+  workflowService: typeof workflowService;
+  getNextPhase: typeof getNextPhase;
+  isPhaseComplete: typeof isPhaseComplete;
+  attemptHeal?: typeof attemptHeal;
+  quickDecision?: typeof quickDecision;
+  parseBatchesFromProject?: typeof parseBatchesFromProject;
+}
+
+/**
+ * Default dependencies using module imports
+ */
+const defaultDeps: OrchestrationDeps = {
+  orchestrationService,
+  workflowService,
+  getNextPhase,
+  isPhaseComplete,
+  attemptHeal,
+  quickDecision,
+  parseBatchesFromProject,
+};
+
+// =============================================================================
+// Spawn Intent Pattern (G5.3-G5.7)
+// =============================================================================
+
+/**
+ * Get the path to the spawn intent file for an orchestration
+ * Uses a separate file to avoid race conditions with state updates
+ */
+function getSpawnIntentPath(projectPath: string, orchestrationId: string): string {
+  return join(projectPath, '.specflow', 'workflows', `spawn-intent-${orchestrationId}.json`);
+}
+
+/**
+ * SpawnIntent structure - tracks what we're trying to spawn
+ */
+interface SpawnIntent {
+  skill: string;
+  orchestrationId: string;
+  timestamp: string;
+}
+
+/**
+ * Check if a spawn intent exists for this orchestration (G5.4)
+ * If an intent exists, another process is already spawning a workflow
+ */
+function hasSpawnIntent(projectPath: string, orchestrationId: string): boolean {
+  const intentPath = getSpawnIntentPath(projectPath, orchestrationId);
+  if (!existsSync(intentPath)) {
+    return false;
+  }
+
+  // Check if intent is stale (older than 30 seconds)
+  try {
+    const content = readFileSync(intentPath, 'utf-8');
+    const intent = JSON.parse(content) as SpawnIntent;
+    const intentTime = new Date(intent.timestamp).getTime();
+    const now = Date.now();
+    const staleThresholdMs = 30 * 1000; // 30 seconds
+
+    if (now - intentTime > staleThresholdMs) {
+      // Stale intent - clean it up
+      console.log(`[orchestration-runner] Found stale spawn intent (${Math.round((now - intentTime) / 1000)}s old), clearing`);
+      clearSpawnIntent(projectPath, orchestrationId);
+      return false;
+    }
+
+    return true;
+  } catch {
+    // If we can't read it, assume it's stale and clean it up
+    clearSpawnIntent(projectPath, orchestrationId);
+    return false;
+  }
+}
+
+/**
+ * Write spawn intent BEFORE calling workflowService.start() (G5.6)
+ * This prevents race conditions where two runners try to spawn simultaneously
+ */
+function writeSpawnIntent(projectPath: string, orchestrationId: string, skill: string): void {
+  const intentPath = getSpawnIntentPath(projectPath, orchestrationId);
+  const intent: SpawnIntent = {
+    skill,
+    orchestrationId,
+    timestamp: new Date().toISOString(),
+  };
+  writeFileSync(intentPath, JSON.stringify(intent, null, 2));
+}
+
+/**
+ * Clear spawn intent in finally block (G5.7)
+ * Called regardless of whether spawn succeeded or failed
+ */
+function clearSpawnIntent(projectPath: string, orchestrationId: string): void {
+  const intentPath = getSpawnIntentPath(projectPath, orchestrationId);
+  try {
+    if (existsSync(intentPath)) {
+      unlinkSync(intentPath);
+    }
+  } catch {
+    // Ignore errors during cleanup
+  }
+}
+
+/**
+ * Spawn a workflow with intent pattern to prevent race conditions (G5.3)
+ *
+ * This wraps the workflow spawn logic with:
+ * 1. Check for existing spawn intent (G5.4)
+ * 2. Check hasActiveWorkflow() (G5.5)
+ * 3. Write spawn intent BEFORE calling start() (G5.6)
+ * 4. Clear spawn intent in finally block (G5.7)
+ */
+async function spawnWorkflowWithIntent(
+  ctx: RunnerContext,
+  skill: string,
+  context?: string
+): Promise<WorkflowExecution | null> {
+  const fullSkill = context ? `${skill} ${context}` : skill;
+
+  // G5.4: Check for existing spawn intent
+  if (hasSpawnIntent(ctx.projectPath, ctx.orchestrationId)) {
+    console.log(`[orchestration-runner] Spawn intent already exists for orchestration ${ctx.orchestrationId}, skipping spawn`);
+    return null;
+  }
+
+  // G5.5: Check if there's already an active workflow
+  if (workflowService.hasActiveWorkflow(ctx.projectId, ctx.orchestrationId)) {
+    console.log(`[orchestration-runner] Workflow already active for orchestration ${ctx.orchestrationId}, skipping spawn`);
+    return null;
+  }
+
+  try {
+    // G5.6: Write spawn intent BEFORE calling start()
+    writeSpawnIntent(ctx.projectPath, ctx.orchestrationId, skill);
+
+    // Actually spawn the workflow
+    const workflow = await workflowService.start(
+      ctx.projectId,
+      fullSkill,
+      undefined, // default timeout
+      undefined, // no resume session
+      ctx.orchestrationId // link to this orchestration
+    );
+
+    // Link workflow to orchestration for backwards compatibility
+    orchestrationService.linkWorkflowExecution(ctx.projectPath, ctx.orchestrationId, workflow.id);
+
+    console.log(`[orchestration-runner] Spawned workflow ${workflow.id} for ${skill} (linked to orchestration ${ctx.orchestrationId})`);
+
+    return workflow;
+  } finally {
+    // G5.7: Clear spawn intent regardless of success/failure
+    clearSpawnIntent(ctx.projectPath, ctx.orchestrationId);
+  }
+}
+
+// =============================================================================
+// Persistent Runner State (G5.8-G5.10)
+// =============================================================================
+
+/**
+ * Get the path to the runner state file for an orchestration
+ * This file persists runner info across process restarts
+ */
+function getRunnerStatePath(projectPath: string, orchestrationId: string): string {
+  return join(projectPath, '.specflow', 'workflows', `runner-${orchestrationId}.json`);
+}
+
+/**
+ * RunnerState structure - tracks which process is running the orchestration
+ */
+interface RunnerState {
+  orchestrationId: string;
+  pid: number;
+  startedAt: string;
+}
+
+/**
+ * Persist runner state to file (G5.8)
+ * Called when runner starts to track which process owns this orchestration
+ */
+function persistRunnerState(projectPath: string, orchestrationId: string): void {
+  const statePath = getRunnerStatePath(projectPath, orchestrationId);
+  const state: RunnerState = {
+    orchestrationId,
+    pid: process.pid,
+    startedAt: new Date().toISOString(),
+  };
+  try {
+    writeFileSync(statePath, JSON.stringify(state, null, 2));
+    console.log(`[orchestration-runner] Persisted runner state for ${orchestrationId} (PID: ${process.pid})`);
+  } catch (error) {
+    console.error(`[orchestration-runner] Failed to persist runner state: ${error}`);
+  }
+}
+
+/**
+ * Clear runner state file (G5.9)
+ * Called when runner exits (normally or due to error)
+ */
+function clearRunnerState(projectPath: string, orchestrationId: string): void {
+  const statePath = getRunnerStatePath(projectPath, orchestrationId);
+  try {
+    if (existsSync(statePath)) {
+      unlinkSync(statePath);
+      console.log(`[orchestration-runner] Cleared runner state for ${orchestrationId}`);
+    }
+  } catch {
+    // Ignore errors during cleanup
+  }
+}
+
+/**
+ * Check if a runner process is still alive by PID
+ */
+function isProcessAlive(pid: number): boolean {
+  try {
+    // Sending signal 0 doesn't actually send a signal, but checks if process exists
+    process.kill(pid, 0);
+    return true;
+  } catch {
+    return false;
+  }
+}
+
+/**
+ * Reconcile runners on dashboard startup (G5.10)
+ * Detects orphaned runner state files where the process is no longer running
+ */
+export function reconcileRunners(projectPath: string): void {
+  const workflowsDir = join(projectPath, '.specflow', 'workflows');
+  if (!existsSync(workflowsDir)) return;
+
+  try {
+    const files = readdirSync(workflowsDir);
+    const runnerFiles = files.filter((f) => f.startsWith('runner-') && f.endsWith('.json'));
+
+    for (const file of runnerFiles) {
+      const filePath = join(workflowsDir, file);
+      try {
+        const content = readFileSync(filePath, 'utf-8');
+        const state = JSON.parse(content) as RunnerState;
+
+        if (!isProcessAlive(state.pid)) {
+          // Process is dead but state file exists - orphaned runner
+          console.log(`[orchestration-runner] Detected orphaned runner for ${state.orchestrationId} (PID ${state.pid} is dead), cleaning up`);
+          unlinkSync(filePath);
+
+          // Also clear from in-memory map if present
+          activeRunners.delete(state.orchestrationId);
+        } else {
+          // Process is alive - mark as active in memory
+          console.log(`[orchestration-runner] Runner for ${state.orchestrationId} is still active (PID ${state.pid})`);
+          activeRunners.set(state.orchestrationId, true);
+        }
+      } catch {
+        // Corrupted file, remove it
+        console.log(`[orchestration-runner] Removing corrupted runner state file: ${file}`);
+        try {
+          unlinkSync(filePath);
+        } catch {
+          // Ignore
+        }
+      }
+    }
+  } catch (error) {
+    console.error(`[orchestration-runner] Failed to reconcile runners: ${error}`);
+  }
+}
+
 // =============================================================================
 // Claude State Analyzer (Fallback)
 // =============================================================================
@@ -216,7 +501,26 @@ function mapClaudeDecision(decision: StateAnalyzerDecision): DecisionResult {
 }
 
 interface DecisionResult {
-  action: 'continue' | 'spawn_workflow' | 'spawn_batch' | 'heal' | 'wait_merge' | 'needs_attention' | 'complete' | 'fail';
+  action:
+    // Legacy actions (kept for compatibility)
+    | 'continue'
+    | 'spawn_workflow'
+    | 'spawn_batch'
+    | 'heal'
+    | 'wait_merge'
+    | 'needs_attention'
+    | 'complete'
+    | 'fail'
+    // G2 Compliance: New actions from pure decision module
+    | 'transition'
+    | 'advance_batch'
+    | 'initialize_batches'
+    | 'force_step_complete'
+    | 'pause'
+    | 'recover_stale'
+    | 'recover_failed'
+    | 'wait_with_backoff'
+    | 'wait_user_gate';
   reason: string;
   skill?: string;
   batchContext?: string;
@@ -225,6 +529,14 @@ interface DecisionResult {
   recoveryOptions?: Array<'retry' | 'skip' | 'abort'>;
   /** Failed workflow ID for recovery context */
   failedWorkflowId?: string;
+  /** Next step for transition action */
+  nextStep?: string;
+  /** Batch index for batch actions */
+  batchIndex?: number;
+  /** Workflow ID for stale recovery */
+  workflowId?: string;
+  /** Backoff time for wait_with_backoff */
+  backoffMs?: number;
 }
 
 // =============================================================================
@@ -250,39 +562,276 @@ function getProjectPath(projectId: string): string | null {
 }
 
 // =============================================================================
-// Specflow Status Integration
+// Specflow Status Integration (Direct File Access - No Subprocess)
 // =============================================================================
 
 interface SpecflowStatus {
   phase?: {
     number?: number;
     name?: string;
+    hasUserGate?: boolean;
+    userGateStatus?: 'pending' | 'confirmed' | 'skipped';
   };
   context?: {
     hasSpec?: boolean;
     hasPlan?: boolean;
     hasTasks?: boolean;
+    featureDir?: string;
   };
   progress?: {
     tasksTotal?: number;
     tasksComplete?: number;
     percentage?: number;
   };
+  orchestration?: {
+    step?: {
+      current?: string;
+      index?: number;
+      status?: string;
+    };
+  };
 }
 
+/**
+ * Task counts from parsing tasks.md directly
+ */
+interface TaskCounts {
+  total: number;
+  completed: number;
+  blocked: number;
+  deferred: number;
+  percentage: number;
+}
+
+/**
+ * Get task counts by parsing tasks.md directly (no subprocess)
+ *
+ * @param tasksPath - Path to tasks.md file
+ * @returns Task counts or null if file doesn't exist
+ */
+function getTaskCounts(tasksPath: string): TaskCounts | null {
+  if (!existsSync(tasksPath)) {
+    return null;
+  }
+
+  try {
+    const content = readFileSync(tasksPath, 'utf-8');
+    const lines = content.split('\n');
+
+    let total = 0;
+    let completed = 0;
+    let blocked = 0;
+    let deferred = 0;
+
+    for (const line of lines) {
+      const trimmed = line.trim();
+
+      // Match task lines: - [x] T###, - [ ] T###, etc.
+      const taskMatch = trimmed.match(/^-\s*\[[xX ~\-bB]\]\s*T\d{3}/);
+      if (!taskMatch) continue;
+
+      total++;
+
+      // Determine status from checkbox
+      if (trimmed.startsWith('- [x]') || trimmed.startsWith('- [X]')) {
+        completed++;
+      } else if (trimmed.startsWith('- [b]') || trimmed.startsWith('- [B]')) {
+        blocked++;
+      } else if (trimmed.startsWith('- [~]') || trimmed.startsWith('- [-]')) {
+        deferred++;
+      }
+      // else it's '- [ ]' which is todo (not counted separately)
+    }
+
+    return {
+      total,
+      completed,
+      blocked,
+      deferred,
+      percentage: total > 0 ? Math.round((completed / total) * 100) : 0,
+    };
+  } catch {
+    return null;
+  }
+}
+
+/**
+ * Check if design artifacts exist in a feature directory (no subprocess)
+ *
+ * @param featureDir - Path to the feature directory (specs/NNNN-name/)
+ * @returns Object indicating which artifacts exist
+ */
+function checkArtifactExistence(featureDir: string): { hasSpec: boolean; hasPlan: boolean; hasTasks: boolean } {
+  return {
+    hasSpec: existsSync(join(featureDir, 'spec.md')),
+    hasPlan: existsSync(join(featureDir, 'plan.md')),
+    hasTasks: existsSync(join(featureDir, 'tasks.md')),
+  };
+}
+
+/**
+ * Find the active feature directory in a project
+ * Looks for specs/NNNN-name/ directories and returns the highest numbered one
+ *
+ * @param projectPath - Root path of the project
+ * @returns Feature directory path or null if none found
+ */
+function findActiveFeatureDir(projectPath: string): string | null {
+  const specsDir = join(projectPath, 'specs');
+  if (!existsSync(specsDir)) {
+    return null;
+  }
+
+  try {
+    const entries = readdirSync(specsDir, { withFileTypes: true }) as Dirent[];
+
+    // Find directories matching NNNN-* pattern
+    const featureDirs = entries
+      .filter((e) => e.isDirectory() && /^\d{4}-/.test(e.name))
+      .map((e) => e.name)
+      .sort()
+      .reverse();
+
+    if (featureDirs.length === 0) {
+      return null;
+    }
+
+    return join(specsDir, featureDirs[0]);
+  } catch {
+    return null;
+  }
+}
+
+/**
+ * Get specflow status by reading files directly (no subprocess)
+ * Replaces the previous getSpecflowStatus that called `specflow status --json`
+ *
+ * @param projectPath - Root path of the project
+ * @returns Status object compatible with previous interface
+ */
 function getSpecflowStatus(projectPath: string): SpecflowStatus | null {
   try {
-    const result = execSync('specflow status --json', {
-      cwd: projectPath,
-      encoding: 'utf-8',
-      timeout: 30000,
-    });
-    return JSON.parse(result);
+    // Find active feature directory
+    const featureDir = findActiveFeatureDir(projectPath);
+    if (!featureDir) {
+      return {
+        context: {
+          hasSpec: false,
+          hasPlan: false,
+          hasTasks: false,
+        },
+        progress: {
+          tasksTotal: 0,
+          tasksComplete: 0,
+          percentage: 0,
+        },
+      };
+    }
+
+    // Check which artifacts exist
+    const artifacts = checkArtifactExistence(featureDir);
+
+    // Get task counts if tasks.md exists
+    const tasksPath = join(featureDir, 'tasks.md');
+    const taskCounts = artifacts.hasTasks ? getTaskCounts(tasksPath) : null;
+
+    // Extract phase info from directory name (e.g., "1056-jsonl-watcher" -> 1056)
+    const dirName = featureDir.split('/').pop() || '';
+    const phaseMatch = dirName.match(/^(\d+)-(.+)/);
+
+    // Read orchestration state from state file
+    let orchestrationState: SpecflowStatus['orchestration'] = undefined;
+    let phaseGateInfo: Pick<NonNullable<SpecflowStatus['phase']>, 'hasUserGate' | 'userGateStatus'> = {};
+    try {
+      // Try .specflow first (v3), then .specify (v2)
+      let statePath = join(projectPath, '.specflow', 'orchestration-state.json');
+      if (!existsSync(statePath)) {
+        statePath = join(projectPath, '.specify', 'orchestration-state.json');
+      }
+      if (existsSync(statePath)) {
+        const stateContent = readFileSync(statePath, 'utf-8');
+        const state = JSON.parse(stateContent);
+        if (state?.orchestration?.step) {
+          orchestrationState = {
+            step: {
+              current: state.orchestration.step.current,
+              index: state.orchestration.step.index,
+              status: state.orchestration.step.status,
+            },
+          };
+        }
+        // Extract phase gate info from state file
+        if (state?.orchestration?.phase) {
+          phaseGateInfo = {
+            hasUserGate: state.orchestration.phase.hasUserGate,
+            userGateStatus: state.orchestration.phase.userGateStatus,
+          };
+        }
+      }
+    } catch {
+      // Ignore errors reading state file
+    }
+
+    return {
+      phase: phaseMatch ? {
+        number: parseInt(phaseMatch[1], 10),
+        name: phaseMatch[2].replace(/-/g, ' '),
+        ...phaseGateInfo,
+      } : phaseGateInfo.hasUserGate !== undefined ? phaseGateInfo : undefined,
+      context: {
+        hasSpec: artifacts.hasSpec,
+        hasPlan: artifacts.hasPlan,
+        hasTasks: artifacts.hasTasks,
+        featureDir,
+      },
+      progress: taskCounts ? {
+        tasksTotal: taskCounts.total,
+        tasksComplete: taskCounts.completed,
+        percentage: taskCounts.percentage,
+      } : {
+        tasksTotal: 0,
+        tasksComplete: 0,
+        percentage: 0,
+      },
+      orchestration: orchestrationState,
+    };
   } catch {
     return null;
   }
 }
 
+// =============================================================================
+// Staleness Detection
+// =============================================================================
+
+/**
+ * Get the last file change time for the project
+ * Used for staleness detection (G1.5)
+ */
+function getLastFileChangeTime(projectPath: string): number {
+  try {
+    // Check common directories for recent changes
+    const dirsToCheck = [
+      join(projectPath, 'src'),
+      join(projectPath, 'specs'),
+      join(projectPath, '.specflow'),
+    ];
+
+    let latestTime = 0;
+    for (const dir of dirsToCheck) {
+      if (existsSync(dir)) {
+        const stat = require('fs').statSync(dir);
+        if (stat.mtimeMs > latestTime) {
+          latestTime = stat.mtimeMs;
+        }
+      }
+    }
+    return latestTime || Date.now();
+  } catch {
+    return Date.now();
+  }
+}
+
 // =============================================================================
 // State Machine Decision Logic
 // =============================================================================
@@ -307,70 +856,113 @@ function getSkillForPhase(phase: OrchestrationPhase): string {
   }
 }
 
+// =============================================================================
+// G2 Compliance: Adapter for Pure Decision Functions
+// =============================================================================
+
 /**
- * Determine if the current phase is complete based on specflow status
+ * Convert runner context to DecisionInput for the pure makeDecision function
+ * This adapter bridges the old runner patterns with the new pure decision module
  */
-function isPhaseComplete(status: SpecflowStatus | null, phase: OrchestrationPhase): boolean {
-  if (!status) return false;
+function createDecisionInput(
+  orchestration: OrchestrationExecution,
+  workflow: WorkflowExecution | undefined,
+  specflowStatus: SpecflowStatus | null,
+  lastFileChangeTime?: number
+): DecisionInput {
+  // Convert workflow to WorkflowState (simplified interface)
+  const workflowState: WorkflowState | null = workflow ? {
+    id: workflow.id,
+    status: workflow.status as WorkflowState['status'],
+    error: workflow.error,
+    lastActivityAt: workflow.updatedAt,
+  } : null;
+
+  // Extract step info from specflow status and orchestration
+  // IMPORTANT: The state file tracks the PROJECT's current step, which may differ from
+  // the orchestration's currentPhase (e.g., when skipping to merge).
+  // We only trust step.status if it's for the SAME step as the orchestration's currentPhase.
+  const stateFileStep = specflowStatus?.orchestration?.step?.current;
+  const rawStatus = specflowStatus?.orchestration?.step?.status;
+  const validStatuses = ['not_started', 'pending', 'in_progress', 'complete', 'failed', 'blocked', 'skipped'] as const;
+
+  // Only use the state file's status if it matches the orchestration's current phase
+  // Otherwise, the step hasn't been started in this orchestration
+  const stepStatus = (stateFileStep === orchestration.currentPhase && rawStatus && validStatuses.includes(rawStatus as typeof validStatuses[number]))
+    ? (rawStatus as typeof validStatuses[number])
+    : 'not_started';
+
+  const stepCurrent = orchestration.currentPhase;
+  const stepIndex = specflowStatus?.orchestration?.step?.index ?? 0;
 
-  switch (phase) {
-    case 'design':
-      return status.context?.hasPlan === true && status.context?.hasTasks === true;
-    case 'analyze':
-      // Analyze doesn't produce artifacts - considered complete after running
-      return true;
-    case 'implement':
-      // All tasks complete
-      return (
-        status.progress?.tasksComplete === status.progress?.tasksTotal &&
-        (status.progress?.tasksTotal ?? 0) > 0
-      );
-    case 'verify':
-      // Verify doesn't change task count - considered complete after running
-      return true;
-    case 'merge':
-      return true;
-    case 'complete':
-      return true;
-    default:
-      return false;
-  }
+  return {
+    step: {
+      current: stepCurrent,
+      index: stepIndex,
+      status: stepStatus,
+    },
+    phase: {
+      hasUserGate: specflowStatus?.phase?.hasUserGate,
+      userGateStatus: specflowStatus?.phase?.userGateStatus,
+    },
+    execution: orchestration,
+    workflow: workflowState,
+    lastFileChangeTime,
+    lookupFailures: 0,
+    currentTime: Date.now(),
+  };
 }
 
 /**
- * Get the next phase in orchestration flow
+ * Adapt pure DecisionResult to the legacy action names where needed
+ * The executeDecision function will be updated to handle all new action types
  */
-function getNextPhase(
-  current: OrchestrationPhase,
-  config: OrchestrationExecution['config']
-): OrchestrationPhase | null {
-  const phases: OrchestrationPhase[] = ['design', 'analyze', 'implement', 'verify', 'merge', 'complete'];
-  const currentIndex = phases.indexOf(current);
-
-  if (currentIndex === -1 || currentIndex === phases.length - 1) {
-    return null;
-  }
+function adaptDecisionResult(result: PureDecisionResult): DecisionResult {
+  // Map new action names to ensure compatibility
+  const actionMap: Record<string, DecisionResult['action']> = {
+    'wait': 'continue',           // wait → continue (legacy)
+    'spawn': 'spawn_workflow',    // spawn → spawn_workflow (legacy)
+    'heal_batch': 'heal',         // heal_batch → heal (legacy)
+  };
 
-  let nextIndex = currentIndex + 1;
-  let nextPhase = phases[nextIndex];
+  const action = actionMap[result.action] ?? result.action;
 
-  // Skip design if configured
-  if (nextPhase === 'design' && config.skipDesign) {
-    nextIndex++;
-    nextPhase = phases[nextIndex];
-  }
+  return {
+    action: action as DecisionResult['action'],
+    reason: result.reason,
+    skill: result.skill,
+    batchContext: result.batchContext,
+    errorMessage: result.errorMessage,
+    recoveryOptions: result.recoveryOptions,
+    failedWorkflowId: result.failedWorkflowId,
+    // For transition actions, extract the skill
+    ...(result.action === 'transition' && result.skill ? { skill: result.skill } : {}),
+  };
+}
 
-  // Skip analyze if configured
-  if (nextPhase === 'analyze' && config.skipAnalyze) {
-    nextIndex++;
-    nextPhase = phases[nextIndex];
-  }
+/**
+ * Make a decision using the pure decision module (G2 compliant)
+ * Falls back to legacy makeDecision if pure module fails
+ */
+function makeDecisionWithAdapter(
+  orchestration: OrchestrationExecution,
+  workflow: WorkflowExecution | undefined,
+  specflowStatus: SpecflowStatus | null,
+  lastFileChangeTime?: number
+): DecisionResult {
+  // Create input for pure decision function
+  const input = createDecisionInput(orchestration, workflow, specflowStatus, lastFileChangeTime);
+
+  // Get decision from pure function
+  const pureResult = makeDecisionPure(input);
 
-  return nextPhase || null;
+  // Adapt to legacy format
+  return adaptDecisionResult(pureResult);
 }
 
 /**
  * Make a decision about what to do next
+ * @deprecated Use makeDecisionWithAdapter instead - this is kept for reference during transition
  */
 function makeDecision(
   orchestration: OrchestrationExecution,
@@ -492,8 +1084,9 @@ function makeDecision(
   // CRITICAL: For design phase, require BOTH workflow completion AND artifacts exist
   // This prevents auto-advancing when workflow completes without producing required artifacts
   const workflowComplete = workflow?.status === 'completed';
-  const canAdvance = currentPhase === 'analyze'
-    ? workflowComplete  // Analyze has no artifacts, workflow completion is enough
+  // Analyze and verify don't produce artifacts - workflow completion is enough
+  const canAdvance = (currentPhase === 'analyze' || currentPhase === 'verify')
+    ? workflowComplete  // No artifacts, workflow completion is enough
     : (phaseComplete && workflowComplete);  // Other phases need artifacts AND workflow done
 
   if (currentPhase !== 'implement' && canAdvance) {
@@ -563,6 +1156,146 @@ function makeDecision(
   };
 }
 
+// =============================================================================
+// Event-Driven Orchestration (T025-T026, G5.11-G5.13)
+// =============================================================================
+
+/**
+ * Pending event signals for each orchestration runner
+ * G5.11: Changed from single callback to Set of callbacks to support multiple sleepers
+ * When a relevant file change is detected, ALL registered callbacks are invoked
+ */
+const eventSignals = new Map<string, Set<() => void>>();
+
+/**
+ * Wake up all sleepers for an orchestration (G5.13)
+ * Called when a relevant file change is detected
+ */
+function wakeUp(orchestrationId: string): void {
+  const callbacks = eventSignals.get(orchestrationId);
+  if (callbacks && callbacks.size > 0) {
+    // Copy to avoid modification during iteration
+    const callbacksCopy = [...callbacks];
+    for (const callback of callbacksCopy) {
+      try {
+        callback();
+      } catch (error) {
+        console.error(`[orchestration-runner] Error in wake-up callback:`, error);
+      }
+    }
+  }
+}
+
+/**
+ * Subscribe to file events for event-driven orchestration
+ *
+ * T025: Subscribe to watcher events to wake up the runner when relevant files change
+ * instead of relying purely on fixed-interval polling
+ *
+ * @param orchestrationId - ID of the orchestration runner
+ * @param projectId - Project ID to filter events
+ * @param onEvent - Callback when relevant event occurs (wakes up runner)
+ * @returns Cleanup function to unsubscribe
+ */
+function subscribeToFileEvents(
+  orchestrationId: string,
+  projectId: string,
+  onEvent: () => void
+): () => void {
+  // Import addListener from watcher
+  const { addListener: addWatcherListener } = require('../watcher');
+
+  // G5.11: Initialize Set if needed, then add callback
+  if (!eventSignals.has(orchestrationId)) {
+    eventSignals.set(orchestrationId, new Set());
+  }
+  eventSignals.get(orchestrationId)!.add(onEvent);
+
+  // Subscribe to SSE events from watcher
+  const cleanup = addWatcherListener((event: SSEEvent) => {
+    // Only react to events for this project
+    if ('projectId' in event && event.projectId !== projectId) {
+      return;
+    }
+
+    // Wake up runner on relevant events
+    switch (event.type) {
+      case 'tasks':
+        // Task file changed - might have new completions
+        console.log(`[orchestration-runner] Tasks event for ${projectId}, waking runner`);
+        wakeUp(orchestrationId);
+        break;
+      case 'workflow':
+        // Workflow index changed - workflow might have completed
+        console.log(`[orchestration-runner] Workflow event for ${projectId}, waking runner`);
+        wakeUp(orchestrationId);
+        break;
+      case 'state':
+        // Orchestration state changed - might need to react
+        console.log(`[orchestration-runner] State event for ${projectId}, waking runner`);
+        wakeUp(orchestrationId);
+        break;
+      // Ignore: registry, phases, heartbeat, session events
+    }
+  });
+
+  return () => {
+    // Remove this specific callback from the Set
+    const callbacks = eventSignals.get(orchestrationId);
+    if (callbacks) {
+      callbacks.delete(onEvent);
+      // Clean up empty Sets
+      if (callbacks.size === 0) {
+        eventSignals.delete(orchestrationId);
+      }
+    }
+    cleanup();
+  };
+}
+
+/**
+ * Event-driven sleep with early wake-up on file events
+ *
+ * T026, G5.12: Replace fixed sleep with event-triggered wake-up
+ * This allows the runner to react immediately to file changes
+ * while still having a maximum wait time
+ *
+ * G5.12: Now adds callback to Set instead of replacing
+ *
+ * @param ms - Maximum time to wait (fallback if no events)
+ * @param orchestrationId - ID to check for wake-up signal
+ * @returns Promise that resolves when woken up or timeout reached
+ */
+function eventDrivenSleep(ms: number, orchestrationId: string): Promise<void> {
+  return new Promise((resolve) => {
+    const timeout = setTimeout(resolve, ms);
+
+    // G5.12: Create a wake-up callback that clears timeout and resolves
+    const wakeUpCallback = () => {
+      clearTimeout(timeout);
+      resolve();
+    };
+
+    // G5.12: Initialize Set if needed, then add callback
+    if (!eventSignals.has(orchestrationId)) {
+      eventSignals.set(orchestrationId, new Set());
+    }
+    eventSignals.get(orchestrationId)!.add(wakeUpCallback);
+
+    // When promise resolves (either by timeout or wake-up), remove our callback
+    // This prevents memory leaks from accumulated callbacks
+    const cleanup = () => {
+      const callbacks = eventSignals.get(orchestrationId);
+      if (callbacks) {
+        callbacks.delete(wakeUpCallback);
+      }
+    };
+
+    // Set up cleanup for both paths
+    setTimeout(() => cleanup(), ms + 1); // Cleanup after max timeout
+  });
+}
+
 // =============================================================================
 // Orchestration Runner
 // =============================================================================
@@ -577,12 +1310,19 @@ const activeRunners = new Map<string, boolean>();
  *
  * This function runs in the background and drives orchestration forward
  * until completion, failure, or cancellation.
+ *
+ * @param projectId - Project identifier
+ * @param orchestrationId - Orchestration execution ID
+ * @param pollingInterval - Interval between state checks (ms)
+ * @param maxPollingAttempts - Maximum polling iterations before stopping
+ * @param deps - Optional dependency injection for testing (T120/G12.4)
  */
 export async function runOrchestration(
   projectId: string,
   orchestrationId: string,
   pollingInterval: number = 3000,
-  maxPollingAttempts: number = 1000
+  maxPollingAttempts: number = 1000,
+  deps: OrchestrationDeps = defaultDeps
 ): Promise<void> {
   const projectPath = getProjectPath(projectId);
   if (!projectPath) {
@@ -597,7 +1337,11 @@ export async function runOrchestration(
   }
 
   activeRunners.set(orchestrationId, true);
-  console.log(`[orchestration-runner] Starting runner for ${orchestrationId}`);
+
+  // G5.8: Persist runner state to file for cross-process detection
+  persistRunnerState(projectPath, orchestrationId);
+
+  console.log(`[orchestration-runner] Starting event-driven runner for ${orchestrationId}`);
 
   const ctx: RunnerContext = {
     projectId,
@@ -608,9 +1352,21 @@ export async function runOrchestration(
     consecutiveUnclearChecks: 0,
   };
 
+  // T025: Subscribe to file events for event-driven wake-up
+  let eventCleanup: (() => void) | null = null;
+  try {
+    eventCleanup = subscribeToFileEvents(orchestrationId, projectId, () => {
+      // Wake-up callback is set by eventDrivenSleep
+    });
+    console.log(`[orchestration-runner] Subscribed to file events for ${projectId}`);
+  } catch (error) {
+    console.log(`[orchestration-runner] Event subscription not available, using polling fallback: ${error}`);
+  }
+
   let attempts = 0;
 
   try {
+    // T026: Event-driven loop - wake on file events OR timeout
     while (attempts < maxPollingAttempts) {
       attempts++;
 
@@ -627,22 +1383,22 @@ export async function runOrchestration(
         break;
       }
 
-      // Check for paused/waiting states
+      // Check for paused/waiting states - use longer wait, still event-driven
       if (orchestration.status === 'needs_attention') {
         console.log(`[orchestration-runner] Orchestration ${orchestrationId} needs attention, waiting for user action...`);
-        await sleep(ctx.pollingInterval * 2);
+        await eventDrivenSleep(ctx.pollingInterval * 2, orchestrationId);
         continue;
       }
 
       if (orchestration.status === 'paused') {
         console.log(`[orchestration-runner] Orchestration ${orchestrationId} is paused, waiting...`);
-        await sleep(ctx.pollingInterval * 2);
+        await eventDrivenSleep(ctx.pollingInterval * 2, orchestrationId);
         continue;
       }
 
       if (orchestration.status === 'waiting_merge') {
         console.log(`[orchestration-runner] Orchestration ${orchestrationId} waiting for merge trigger`);
-        await sleep(ctx.pollingInterval * 2);
+        await eventDrivenSleep(ctx.pollingInterval * 2, orchestrationId);
         continue;
       }
 
@@ -664,17 +1420,34 @@ export async function runOrchestration(
         }
       }
 
-      // Get specflow status
+      // Get specflow status (now direct file access, no subprocess - T021-T024)
       const specflowStatus = getSpecflowStatus(projectPath);
 
-      // Make decision
-      let decision = makeDecision(orchestration, workflow, specflowStatus);
+      // Get last file change time for staleness detection
+      const lastFileChangeTime = getLastFileChangeTime(projectPath);
+
+      // DEBUG: Log state before decision
+      console.log(`[orchestration-runner] DEBUG: Making decision for ${orchestrationId}`);
+      console.log(`[orchestration-runner] DEBUG:   currentPhase=${orchestration.currentPhase}`);
+      console.log(`[orchestration-runner] DEBUG:   workflow.id=${workflow?.id ?? 'none'}, workflow.status=${workflow?.status ?? 'none'}`);
+      console.log(`[orchestration-runner] DEBUG:   specflowStatus.step=${specflowStatus?.orchestration?.step?.current ?? 'none'}, stepStatus=${specflowStatus?.orchestration?.step?.status ?? 'none'}`);
+
+      // Make decision using the G2-compliant pure decision module
+      let decision = makeDecisionWithAdapter(orchestration, workflow, specflowStatus, lastFileChangeTime);
 
       // Track consecutive "continue" (unclear/waiting) decisions
+      // Only count as "unclear" if NO workflow is actively running
       if (decision.action === 'continue') {
-        ctx.consecutiveUnclearChecks++;
+        // If workflow is actively running, this is a CLEAR state - we know what's happening
+        // Don't count these as "unclear" checks that would trigger Claude analyzer
+        if (workflow && ['running', 'waiting_for_input'].includes(workflow.status)) {
+          ctx.consecutiveUnclearChecks = 0; // Reset - state is clear, just waiting
+        } else {
+          // No workflow running but we're not spawning one - this IS unclear
+          ctx.consecutiveUnclearChecks++;
+        }
 
-        // After MAX_UNCLEAR_CHECKS_BEFORE_CLAUDE consecutive waits, spawn Claude analyzer
+        // After MAX_UNCLEAR_CHECKS_BEFORE_CLAUDE consecutive TRULY unclear waits, spawn Claude analyzer
         if (ctx.consecutiveUnclearChecks >= MAX_UNCLEAR_CHECKS_BEFORE_CLAUDE) {
           decision = await analyzeStateWithClaude(ctx, orchestration, workflow, specflowStatus);
           ctx.consecutiveUnclearChecks = 0; // Reset counter after Claude analysis
@@ -685,13 +1458,15 @@ export async function runOrchestration(
       }
 
       // Log decision
+      console.log(`[orchestration-runner] DEBUG:   DECISION: action=${decision.action}, skill=${decision.skill ?? 'none'}, reason=${decision.reason}`);
       logDecision(ctx, orchestration, decision);
 
       // Execute decision
       await executeDecision(ctx, orchestration, decision, workflow);
 
-      // Wait before next poll
-      await sleep(ctx.pollingInterval);
+      // T026: Event-driven wait - wakes on file events OR timeout
+      // This replaces fixed polling with reactive wake-up
+      await eventDrivenSleep(ctx.pollingInterval, orchestrationId);
     }
 
     if (attempts >= maxPollingAttempts) {
@@ -706,6 +1481,15 @@ export async function runOrchestration(
       error instanceof Error ? error.message : 'Unknown error in orchestration runner'
     );
   } finally {
+    // Cleanup event subscription
+    if (eventCleanup) {
+      eventCleanup();
+      console.log(`[orchestration-runner] Unsubscribed from file events for ${projectId}`);
+    }
+
+    // G5.9: Clear runner state file when exiting
+    clearRunnerState(projectPath, orchestrationId);
+
     activeRunners.delete(orchestrationId);
     console.log(`[orchestration-runner] Runner stopped for ${orchestrationId}`);
   }
@@ -780,12 +1564,6 @@ async function executeDecision(
         return;
       }
 
-      // QUEUE CHECK: Don't spawn if there's already an active workflow for this orchestration
-      if (workflowService.hasActiveWorkflow(ctx.projectId, ctx.orchestrationId)) {
-        console.log(`[orchestration-runner] Workflow already active for orchestration ${ctx.orchestrationId}, skipping spawn`);
-        return;
-      }
-
       // Transition to next phase if needed
       const nextPhase = getNextPhaseFromSkill(decision.skill);
 
@@ -823,71 +1601,54 @@ async function executeDecision(
         orchestrationService.transitionToNextPhase(ctx.projectPath, ctx.orchestrationId);
       }
 
-      // Spawn the workflow with orchestrationId for proper linking
-      const workflow = await workflowService.start(
-        ctx.projectId,
-        decision.skill,
-        undefined, // default timeout
-        undefined, // no resume session
-        ctx.orchestrationId // link to this orchestration
-      );
-
-      // Also store in orchestration for backwards compatibility
-      orchestrationService.linkWorkflowExecution(ctx.projectPath, ctx.orchestrationId, workflow.id);
+      // Use spawn intent pattern (G5.3-G5.7) to prevent race conditions
+      const workflow = await spawnWorkflowWithIntent(ctx, decision.skill);
+      if (!workflow) {
+        // Spawn was skipped (intent exists or workflow already active)
+        return;
+      }
 
-      // Track cost
+      // Track cost from previous workflow
       if (currentWorkflow?.costUsd) {
         orchestrationService.addCost(ctx.projectPath, ctx.orchestrationId, currentWorkflow.costUsd);
       }
-
-      console.log(`[orchestration-runner] Spawned workflow ${workflow.id} for ${decision.skill} (linked to orchestration ${ctx.orchestrationId})`);
       break;
     }
 
     case 'spawn_batch': {
-      // QUEUE CHECK: Don't spawn if there's already an active workflow for this orchestration
-      if (workflowService.hasActiveWorkflow(ctx.projectId, ctx.orchestrationId)) {
-        console.log(`[orchestration-runner] Workflow already active for orchestration ${ctx.orchestrationId}, skipping batch spawn`);
-        return;
-      }
-
-      // Complete current batch
-      orchestrationService.completeBatch(ctx.projectPath, ctx.orchestrationId);
+      // DO NOT call completeBatch here - the batch hasn't been executed yet!
+      // spawn_batch is triggered when batch.status === 'pending' && no workflow
+      // We spawn a workflow for the CURRENT batch, not advance to next.
 
-      // Track cost from previous workflow
+      // Track cost from previous workflow (if any - for healing scenarios)
       if (currentWorkflow?.costUsd) {
         orchestrationService.addCost(ctx.projectPath, ctx.orchestrationId, currentWorkflow.costUsd);
       }
 
-      // Reload orchestration to get updated batch index
-      const updatedOrchestration = orchestrationService.get(ctx.projectPath, ctx.orchestrationId);
-      if (!updatedOrchestration) return;
-
-      // Check if more batches
-      const nextBatch = updatedOrchestration.batches.items[updatedOrchestration.batches.current];
-      if (nextBatch && nextBatch.status === 'pending') {
-        // Check for pause between batches
-        if (updatedOrchestration.config.pauseBetweenBatches) {
-          orchestrationService.pause(ctx.projectPath, ctx.orchestrationId);
-          console.log(`[orchestration-runner] Paused between batches (configured)`);
-        } else {
-          // Build batch context
-          const batchContext = `Execute only the "${nextBatch.section}" section (${nextBatch.taskIds.join(', ')}). Do NOT work on tasks from other sections.`;
-          const fullContext = updatedOrchestration.config.additionalContext
-            ? `${batchContext}\n\n${updatedOrchestration.config.additionalContext}`
-            : batchContext;
-
-          // Spawn next batch with orchestrationId
-          const workflow = await workflowService.start(
-            ctx.projectId,
-            `flow.implement ${fullContext}`,
-            undefined,
-            undefined,
-            ctx.orchestrationId
-          );
-          orchestrationService.linkWorkflowExecution(ctx.projectPath, ctx.orchestrationId, workflow.id);
-          console.log(`[orchestration-runner] Spawned batch ${updatedOrchestration.batches.current + 1}/${updatedOrchestration.batches.total} (linked to orchestration ${ctx.orchestrationId})`);
-        }
+      // Get the current batch (which is pending)
+      const currentBatch = orchestration.batches.items[orchestration.batches.current];
+      if (!currentBatch || currentBatch.status !== 'pending') {
+        console.error(`[orchestration-runner] spawn_batch called but current batch is not pending: ${currentBatch?.status}`);
+        break;
+      }
+
+      // Check for pause between batches (only applies after first batch)
+      if (orchestration.batches.current > 0 && orchestration.config.pauseBetweenBatches) {
+        orchestrationService.pause(ctx.projectPath, ctx.orchestrationId);
+        console.log(`[orchestration-runner] Paused between batches (configured)`);
+        break;
+      }
+
+      // Build batch context for the CURRENT batch
+      const batchContext = `Execute only the "${currentBatch.section}" section (${currentBatch.taskIds.join(', ')}). Do NOT work on tasks from other sections.`;
+      const fullContext = orchestration.config.additionalContext
+        ? `${batchContext}\n\n${orchestration.config.additionalContext}`
+        : batchContext;
+
+      // Use spawn intent pattern (G5.3-G5.7) to prevent race conditions
+      const workflow = await spawnWorkflowWithIntent(ctx, 'flow.implement', fullContext);
+      if (workflow) {
+        console.log(`[orchestration-runner] Spawned batch ${orchestration.batches.current + 1}/${orchestration.batches.total}: "${currentBatch.section}" (linked to orchestration ${ctx.orchestrationId})`);
       }
       break;
     }
@@ -991,6 +1752,180 @@ async function executeDecision(
       console.error(`[orchestration-runner] Orchestration failed: ${decision.errorMessage}`);
       break;
     }
+
+    // =========================================================================
+    // G2 Compliance: New action types from pure decision module
+    // =========================================================================
+
+    case 'transition': {
+      // Transition to next step (G2.3)
+      if (!decision.skill) {
+        console.error('[orchestration-runner] No skill specified for transition');
+        return;
+      }
+      orchestrationService.transitionToNextPhase(ctx.projectPath, ctx.orchestrationId);
+      const workflow = await spawnWorkflowWithIntent(ctx, decision.skill);
+      if (currentWorkflow?.costUsd) {
+        orchestrationService.addCost(ctx.projectPath, ctx.orchestrationId, currentWorkflow.costUsd);
+      }
+      console.log(`[orchestration-runner] Transitioned to ${decision.nextStep}`);
+      break;
+    }
+
+    case 'advance_batch': {
+      // Move to next batch (G2.7, G2.8) - but first verify tasks were actually completed
+      const currentBatch = orchestration.batches.items[orchestration.batches.current];
+      if (currentBatch) {
+        // Verify which tasks are actually complete in tasks.md
+        const { completedTasks, incompleteTasks } = verifyBatchTaskCompletion(
+          ctx.projectPath,
+          currentBatch.taskIds
+        );
+
+        console.log(`[orchestration-runner] Batch ${orchestration.batches.current + 1} verification: ${completedTasks.length}/${currentBatch.taskIds.length} tasks complete`);
+
+        if (incompleteTasks.length > 0) {
+          // Tasks still incomplete - re-spawn the batch workflow to continue
+          console.log(`[orchestration-runner] Batch has ${incompleteTasks.length} incomplete tasks, re-spawning workflow`);
+          orchestrationService.logDecision(
+            ctx.projectPath,
+            ctx.orchestrationId,
+            'batch_incomplete',
+            `Batch ${orchestration.batches.current + 1} still has ${incompleteTasks.length} incomplete tasks: ${incompleteTasks.join(', ')}`
+          );
+
+          // Re-spawn the batch workflow to continue working on incomplete tasks
+          const batchContext = `Continue working on incomplete tasks in batch "${currentBatch.section}": ${incompleteTasks.join(', ')}`;
+          const workflow = await spawnWorkflowWithIntent(
+            ctx,
+            'flow.implement',
+            orchestration.config.additionalContext
+              ? `${batchContext}\n\n${orchestration.config.additionalContext}`
+              : batchContext
+          );
+
+          if (workflow) {
+            orchestrationService.linkWorkflowExecution(ctx.projectPath, ctx.orchestrationId, workflow.id);
+          }
+
+          // Don't advance - stay on current batch
+          break;
+        }
+      }
+
+      // All tasks in batch are complete - advance to next batch
+      orchestrationService.completeBatch(ctx.projectPath, ctx.orchestrationId);
+      if (currentWorkflow?.costUsd) {
+        orchestrationService.addCost(ctx.projectPath, ctx.orchestrationId, currentWorkflow.costUsd);
+      }
+      console.log(`[orchestration-runner] Batch complete, advancing to batch ${decision.batchIndex}`);
+      break;
+    }
+
+    case 'initialize_batches': {
+      // Initialize batch tracking (G2.1)
+      const batchPlan = parseBatchesFromProject(ctx.projectPath, orchestration.config.batchSizeFallback);
+      if (batchPlan && batchPlan.totalIncomplete > 0) {
+        orchestrationService.updateBatches(ctx.projectPath, ctx.orchestrationId, batchPlan);
+        console.log(`[orchestration-runner] Initialized batches: ${batchPlan.batches.length} batches, ${batchPlan.totalIncomplete} tasks`);
+      } else {
+        console.error('[orchestration-runner] No tasks found to create batches');
+        orchestrationService.setNeedsAttention(
+          ctx.projectPath,
+          ctx.orchestrationId,
+          'No tasks found to create batches',
+          ['retry', 'abort']
+        );
+      }
+      break;
+    }
+
+    case 'force_step_complete': {
+      // Force step.status to complete when all batches done (G2.2)
+      // First verify all tasks are actually complete in tasks.md
+      const totalIncomplete = getTotalIncompleteTasks(ctx.projectPath);
+
+      if (totalIncomplete !== null && totalIncomplete > 0) {
+        // Tasks still incomplete - don't transition, re-initialize batches
+        console.log(`[orchestration-runner] Still ${totalIncomplete} incomplete tasks, re-initializing batches`);
+        orchestrationService.logDecision(
+          ctx.projectPath,
+          ctx.orchestrationId,
+          'tasks_incomplete',
+          `Cannot mark implement complete: ${totalIncomplete} tasks still incomplete`
+        );
+
+        // Re-parse and update batches with remaining incomplete tasks
+        const batchPlan = parseBatchesFromProject(ctx.projectPath, orchestration.config.batchSizeFallback);
+        if (batchPlan && batchPlan.totalIncomplete > 0) {
+          orchestrationService.updateBatches(ctx.projectPath, ctx.orchestrationId, batchPlan);
+          console.log(`[orchestration-runner] Re-initialized batches: ${batchPlan.batches.length} batches, ${batchPlan.totalIncomplete} tasks`);
+        }
+        break;
+      }
+
+      // All tasks complete - transition to next phase
+      orchestrationService.transitionToNextPhase(ctx.projectPath, ctx.orchestrationId);
+      console.log(`[orchestration-runner] All tasks complete, transitioning to next phase`);
+      break;
+    }
+
+    case 'pause': {
+      // Pause orchestration (G2.6)
+      orchestrationService.pause(ctx.projectPath, ctx.orchestrationId);
+      console.log(`[orchestration-runner] Paused: ${decision.reason}`);
+      break;
+    }
+
+    case 'recover_stale': {
+      // Recover from stale workflow (G1.5, G3.7-G3.10)
+      console.log(`[orchestration-runner] Workflow appears stale: ${decision.reason}`);
+      orchestrationService.setNeedsAttention(
+        ctx.projectPath,
+        ctx.orchestrationId,
+        `Workflow stale: ${decision.reason}`,
+        ['retry', 'skip', 'abort'],
+        decision.workflowId
+      );
+      break;
+    }
+
+    case 'recover_failed': {
+      // Recover from failed step/workflow (G1.13, G1.14, G2.10, G3.11-G3.16)
+      console.log(`[orchestration-runner] Step/batch failed: ${decision.reason}`);
+      orchestrationService.setNeedsAttention(
+        ctx.projectPath,
+        ctx.orchestrationId,
+        decision.errorMessage || decision.reason,
+        decision.recoveryOptions || ['retry', 'skip', 'abort'],
+        decision.failedWorkflowId
+      );
+      break;
+    }
+
+    case 'wait_with_backoff': {
+      // Wait with exponential backoff (G1.7)
+      console.log(`[orchestration-runner] Waiting with backoff: ${decision.reason}`);
+      // The backoff is handled by the main loop, not here
+      break;
+    }
+
+    case 'wait_user_gate': {
+      // Wait for USER_GATE confirmation (G1.8)
+      console.log(`[orchestration-runner] Waiting for USER_GATE confirmation`);
+      // Update orchestration status to indicate waiting for user gate
+      const orchToUpdate = orchestrationService.get(ctx.projectPath, ctx.orchestrationId);
+      if (orchToUpdate) {
+        orchToUpdate.status = 'waiting_user_gate' as OrchestrationExecution['status'];
+      }
+      break;
+    }
+
+    default: {
+      // Unknown action - log error but don't crash
+      console.error(`[orchestration-runner] Unknown decision action: ${decision.action}`);
+      break;
+    }
   }
 }
 
@@ -1049,15 +1984,36 @@ export async function triggerMerge(
   const projectPath = getProjectPath(projectId);
   if (!projectPath) return;
 
-  // Update status via orchestration service
-  orchestrationService.triggerMerge(projectPath, orchestrationId);
+  // Use spawn intent pattern for race condition safety (G5.3-G5.7)
+  // Check for existing spawn intent
+  if (hasSpawnIntent(projectPath, orchestrationId)) {
+    console.log(`[orchestration-runner] Spawn intent already exists for merge, skipping`);
+    return;
+  }
 
-  // Spawn merge workflow
-  const workflow = await workflowService.start(projectId, 'flow.merge');
-  orchestrationService.linkWorkflowExecution(projectPath, orchestrationId, workflow.id);
+  // Check if there's already an active workflow
+  if (workflowService.hasActiveWorkflow(projectId, orchestrationId)) {
+    console.log(`[orchestration-runner] Workflow already active for merge, skipping`);
+    return;
+  }
 
-  // Restart the runner to handle merge completion
-  runOrchestration(projectId, orchestrationId).catch(console.error);
+  try {
+    // Write spawn intent BEFORE calling start()
+    writeSpawnIntent(projectPath, orchestrationId, 'flow.merge');
+
+    // Update status via orchestration service
+    orchestrationService.triggerMerge(projectPath, orchestrationId);
+
+    // Spawn merge workflow
+    const workflow = await workflowService.start(projectId, 'flow.merge', undefined, undefined, orchestrationId);
+    orchestrationService.linkWorkflowExecution(projectPath, orchestrationId, workflow.id);
+
+    // Restart the runner to handle merge completion
+    runOrchestration(projectId, orchestrationId).catch(console.error);
+  } finally {
+    // Clear spawn intent regardless of success/failure
+    clearSpawnIntent(projectPath, orchestrationId);
+  }
 }
 
 /**
diff --git a/packages/dashboard/src/lib/services/orchestration-service.ts b/packages/dashboard/src/lib/services/orchestration-service.ts
index 7cc0fe0..f79f356 100644
--- a/packages/dashboard/src/lib/services/orchestration-service.ts
+++ b/packages/dashboard/src/lib/services/orchestration-service.ts
@@ -12,7 +12,7 @@
  * - Integration with specflow status --json
  */
 
-import { existsSync, readFileSync, writeFileSync, mkdirSync, readdirSync } from 'fs';
+import { existsSync, readFileSync, writeFileSync, mkdirSync, readdirSync, renameSync, unlinkSync } from 'fs';
 import { join } from 'path';
 import { execSync } from 'child_process';
 import { randomUUID } from 'crypto';
@@ -57,12 +57,66 @@ function getOrchestrationPath(projectPath: string, id: string): string {
 }
 
 /**
- * Save orchestration state to file
+ * Save orchestration state to file (atomic write - G5.1, G5.2)
+ *
+ * Uses write-to-temp + atomic rename pattern to prevent partial writes
+ * from corrupting state during crashes or concurrent access.
  */
 function saveOrchestration(projectPath: string, execution: OrchestrationExecution): void {
   const filePath = getOrchestrationPath(projectPath, execution.id);
+  const tempPath = `${filePath}.tmp`;
+
   execution.updatedAt = new Date().toISOString();
-  writeFileSync(filePath, JSON.stringify(execution, null, 2));
+  const content = JSON.stringify(execution, null, 2);
+
+  // G5.1: Write to temp file first
+  writeFileSync(tempPath, content);
+
+  // G5.2: Atomic rename (POSIX guarantees atomicity on same filesystem)
+  try {
+    renameSync(tempPath, filePath);
+  } catch (error) {
+    // Clean up temp file if rename fails
+    try {
+      unlinkSync(tempPath);
+    } catch {
+      // Ignore cleanup errors
+    }
+    throw error;
+  }
+}
+
+/**
+ * Sync current phase to orchestration-state.json for UI consistency
+ * This keeps the state file in sync with the orchestration execution
+ */
+function syncPhaseToStateFile(projectPath: string, phase: OrchestrationPhase): void {
+  try {
+    // Try .specflow first (v3), then .specify (v2)
+    let statePath = join(projectPath, '.specflow', 'orchestration-state.json');
+    if (!existsSync(statePath)) {
+      statePath = join(projectPath, '.specify', 'orchestration-state.json');
+    }
+    if (!existsSync(statePath)) {
+      return; // No state file to update
+    }
+
+    const content = readFileSync(statePath, 'utf-8');
+    const state = JSON.parse(content);
+
+    // Update step.current to match orchestration phase
+    if (state.orchestration) {
+      state.orchestration.step = state.orchestration.step || {};
+      state.orchestration.step.current = phase;
+      state.orchestration.step.status = 'in_progress';
+      state.last_updated = new Date().toISOString();
+    }
+
+    writeFileSync(statePath, JSON.stringify(state, null, 2));
+  } catch {
+    // Non-critical: log but don't fail orchestration
+    console.warn('[orchestration-service] Failed to sync phase to state file');
+  }
 }
 
 /**
@@ -112,13 +166,39 @@ function listOrchestrations(projectPath: string): OrchestrationExecution[] {
   );
 }
 
+/**
+ * Staleness threshold for waiting_merge orchestrations
+ * If an orchestration has been waiting for merge for longer than this, consider it stale
+ */
+const WAITING_MERGE_STALE_MS = 2 * 60 * 60 * 1000; // 2 hours
+
+/**
+ * Check if an orchestration is stale based on its status and age
+ */
+function isOrchestrationStale(orchestration: OrchestrationExecution): boolean {
+  // Only apply staleness check to waiting_merge status
+  // running/paused should always be considered active regardless of age
+  if (orchestration.status !== 'waiting_merge') {
+    return false;
+  }
+
+  // Check if waiting_merge has been stale for too long
+  const updatedAt = new Date(orchestration.updatedAt).getTime();
+  const age = Date.now() - updatedAt;
+  return age > WAITING_MERGE_STALE_MS;
+}
+
 /**
  * Find active orchestration for a project (FR-024)
  * Returns the first orchestration in 'running' or 'paused' status
+ * Excludes stale waiting_merge orchestrations (older than 2 hours)
  */
 function findActiveOrchestration(projectPath: string): OrchestrationExecution | null {
   const orchestrations = listOrchestrations(projectPath);
-  return orchestrations.find((o) => ['running', 'paused', 'waiting_merge'].includes(o.status)) || null;
+  return orchestrations.find((o) =>
+    ['running', 'paused', 'waiting_merge'].includes(o.status) &&
+    !isOrchestrationStale(o)
+  ) || null;
 }
 
 // =============================================================================
@@ -191,42 +271,76 @@ function getSpecflowStatus(projectPath: string): SpecflowStatus | null {
 /**
  * Check if a step is complete based on specflow status
  */
-function isStepComplete(projectPath: string, phase: OrchestrationPhase): boolean {
-  const status = getSpecflowStatus(projectPath);
+/**
+ * Check if a phase is complete based on specflow status
+ * Exported for use by orchestration-runner.ts
+ */
+export function isPhaseComplete(status: SpecflowStatus | null, phase: OrchestrationPhase): boolean {
   if (!status) return false;
 
   switch (phase) {
     case 'design':
+      // Design is complete when plan.md and tasks.md exist
       return status.context?.hasPlan === true && status.context?.hasTasks === true;
+
     case 'analyze':
-      // Analyze doesn't produce new artifacts - check orchestration state
-      return status.orchestration?.step?.current === 'implement';
+      // Analyze doesn't produce artifacts - check orchestration state
+      // step.current must have moved past analyze (to 'implement' or later)
+      // OR step.status is 'complete' when current step is analyze
+      const analyzeStepComplete =
+        status.orchestration?.step?.current === 'implement' ||
+        status.orchestration?.step?.current === 'verify' ||
+        (status.orchestration?.step?.current === 'analyze' &&
+          status.orchestration?.step?.status === 'complete');
+      return analyzeStepComplete ?? false;
+
     case 'implement':
       // All tasks complete
       return (
         status.progress?.tasksComplete === status.progress?.tasksTotal &&
         (status.progress?.tasksTotal ?? 0) > 0
       );
+
     case 'verify':
-      // Check orchestration state moved to merge
-      return status.orchestration?.step?.current === 'merge';
+      // Verify is complete when step.current has moved past verify (to merge)
+      // OR when step.status is 'complete' with current step as verify
+      const verifyStepComplete =
+        status.orchestration?.step?.current === 'merge' ||
+        (status.orchestration?.step?.current === 'verify' &&
+          status.orchestration?.step?.status === 'complete');
+      return verifyStepComplete ?? false;
+
     case 'merge':
-      return status.orchestration?.step?.status === 'complete';
+      // Merge is complete when orchestration marks it so
+      return status.orchestration?.step?.status === 'complete' &&
+        (status.orchestration?.step?.current === 'merge' ||
+          status.orchestration?.step?.current === undefined);
+
     case 'complete':
       return true;
+
     default:
       return false;
   }
 }
 
+/**
+ * Check if a step is complete for a project (convenience wrapper)
+ */
+function isStepComplete(projectPath: string, phase: OrchestrationPhase): boolean {
+  const status = getSpecflowStatus(projectPath);
+  return isPhaseComplete(status, phase);
+}
+
 // =============================================================================
 // State Machine (FR-020, T016)
 // =============================================================================
 
 /**
  * Get the next phase in the orchestration flow
+ * Respects all skip flags: skipDesign, skipAnalyze, skipImplement, skipVerify
  */
-function getNextPhase(
+export function getNextPhase(
   current: OrchestrationPhase,
   config: OrchestrationConfig
 ): OrchestrationPhase | null {
@@ -238,18 +352,21 @@ function getNextPhase(
     return null;
   }
 
-  // Get next phase
+  // Get next phase, respecting skip flags
   let nextIndex = currentIndex + 1;
   let nextPhase = phases[nextIndex];
 
-  // Skip design if configured
-  if (nextPhase === 'design' && config.skipDesign) {
-    nextIndex++;
-    nextPhase = phases[nextIndex];
-  }
+  // Skip phases as configured (loop to handle consecutive skips)
+  while (nextPhase && nextIndex < phases.length - 1) {
+    const shouldSkip =
+      (nextPhase === 'design' && config.skipDesign) ||
+      (nextPhase === 'analyze' && config.skipAnalyze) ||
+      (nextPhase === 'implement' && config.skipImplement) ||
+      (nextPhase === 'verify' && config.skipVerify);
+
+    if (!shouldSkip) break;
 
-  // Skip analyze if configured
-  if (nextPhase === 'analyze' && config.skipAnalyze) {
+    console.log(`[getNextPhase] Skipping ${nextPhase} (skip flag is true)`);
     nextIndex++;
     nextPhase = phases[nextIndex];
   }
@@ -348,6 +465,9 @@ class OrchestrationService {
     // Save initial state
     saveOrchestration(projectPath, execution);
 
+    // Sync initial phase to state file for UI consistency
+    syncPhaseToStateFile(projectPath, execution.currentPhase);
+
     return execution;
   }
 
@@ -478,6 +598,8 @@ class OrchestrationService {
       execution.status = 'waiting_merge';
       logDecision(execution, 'waiting_merge', 'Auto-merge disabled, waiting for user');
       saveOrchestration(projectPath, execution);
+      // Sync to state file for UI consistency
+      syncPhaseToStateFile(projectPath, nextPhase);
       return execution;
     }
 
@@ -486,6 +608,9 @@ class OrchestrationService {
     logDecision(execution, 'transition', `Moving from ${currentPhase} to ${nextPhase}`);
     saveOrchestration(projectPath, execution);
 
+    // Sync to state file for UI consistency (project list, sidebar)
+    syncPhaseToStateFile(projectPath, nextPhase);
+
     return execution;
   }
 
@@ -843,6 +968,18 @@ class OrchestrationService {
     return execution.totalCostUsd >= budget.maxTotal;
   }
 
+  /**
+   * Touch activity timestamp for external session detection (G6.6)
+   * Called when external CLI session activity is detected
+   */
+  touchActivity(projectPath: string, orchestrationId: string): void {
+    const execution = loadOrchestration(projectPath, orchestrationId);
+    if (!execution) return;
+
+    // saveOrchestration already updates updatedAt, so just save
+    saveOrchestration(projectPath, execution);
+  }
+
   /**
    * Get the skill to run for the current phase
    */
@@ -899,6 +1036,23 @@ class OrchestrationService {
       status: batch.status,
     };
   }
+
+  /**
+   * Add an entry to the decision log (public interface for runner)
+   */
+  logDecision(
+    projectPath: string,
+    orchestrationId: string,
+    decision: string,
+    reason: string,
+    data?: Record<string, unknown>
+  ): void {
+    const execution = loadOrchestration(projectPath, orchestrationId);
+    if (!execution) return;
+
+    logDecision(execution, decision, reason, data);
+    saveOrchestration(projectPath, execution);
+  }
 }
 
 // Export singleton
diff --git a/packages/dashboard/src/lib/services/orchestration-types.ts b/packages/dashboard/src/lib/services/orchestration-types.ts
new file mode 100644
index 0000000..11b3408
--- /dev/null
+++ b/packages/dashboard/src/lib/services/orchestration-types.ts
@@ -0,0 +1,343 @@
+/**
+ * Orchestration Types - Dependency Injection Interfaces
+ *
+ * This module defines the dependency injection interfaces for orchestration
+ * to enable testing and separation of concerns.
+ *
+ * Key interfaces:
+ * - OrchestrationDeps: All external dependencies for the orchestration runner
+ * - Clock: Time abstraction for testability
+ * - StateIO: File I/O abstraction for state management
+ * - WorkflowIO: Workflow management abstraction
+ */
+
+import type {
+  OrchestrationExecution,
+  OrchestrationState,
+  WorkflowExecution,
+  BatchPlan,
+} from '@specflow/shared';
+
+// =============================================================================
+// Clock Interface (NFR-003 - Testability)
+// =============================================================================
+
+/**
+ * Clock abstraction for time-based logic
+ *
+ * Allows tests to control time without depending on real time.
+ */
+export interface Clock {
+  /** Get current timestamp in milliseconds */
+  now(): number;
+  /** Get current ISO timestamp string */
+  isoNow(): string;
+}
+
+/**
+ * Default clock implementation using real time
+ */
+export const realClock: Clock = {
+  now: () => Date.now(),
+  isoNow: () => new Date().toISOString(),
+};
+
+// =============================================================================
+// State I/O Interface
+// =============================================================================
+
+/**
+ * State file I/O abstraction
+ *
+ * Enables atomic writes and testable file operations.
+ */
+export interface StateIO {
+  /**
+   * Read orchestration state from project
+   * @param projectPath - Path to project root
+   * @returns State or null if not found
+   */
+  readState(projectPath: string): Promise<OrchestrationState | null>;
+
+  /**
+   * Write orchestration state atomically
+   * Uses temp file + rename pattern for atomicity
+   * @param projectPath - Path to project root
+   * @param state - State to write
+   */
+  writeState(projectPath: string, state: OrchestrationState): Promise<void>;
+
+  /**
+   * Read orchestration execution state
+   * @param projectPath - Path to project root
+   * @param orchestrationId - UUID of the orchestration
+   * @returns Execution state or null if not found
+   */
+  readExecution(projectPath: string, orchestrationId: string): Promise<OrchestrationExecution | null>;
+
+  /**
+   * Write orchestration execution state atomically
+   * @param projectPath - Path to project root
+   * @param orchestrationId - UUID of the orchestration
+   * @param execution - Execution state to write
+   */
+  writeExecution(projectPath: string, orchestrationId: string, execution: OrchestrationExecution): Promise<void>;
+
+  /**
+   * Create backup of state file before recovery
+   * @param projectPath - Path to project root
+   * @returns Path to backup file
+   */
+  createBackup(projectPath: string): Promise<string>;
+}
+
+// =============================================================================
+// Workflow I/O Interface
+// =============================================================================
+
+/**
+ * Workflow management abstraction
+ */
+export interface WorkflowIO {
+  /**
+   * Get workflow by ID
+   * @param workflowId - Workflow UUID
+   * @param projectId - Project ID
+   * @returns Workflow execution or undefined
+   */
+  getWorkflow(workflowId: string, projectId: string): WorkflowExecution | undefined;
+
+  /**
+   * Check if orchestration has an active workflow
+   * @param projectId - Project ID
+   * @param orchestrationId - Orchestration UUID
+   * @returns True if active workflow exists
+   */
+  hasActiveWorkflow(projectId: string, orchestrationId: string): boolean;
+
+  /**
+   * Find active workflows by orchestration
+   * @param projectId - Project ID
+   * @param orchestrationId - Orchestration UUID
+   * @returns Array of active workflows
+   */
+  findActiveByOrchestration(projectId: string, orchestrationId: string): WorkflowExecution[];
+
+  /**
+   * Start a new workflow
+   * @param projectId - Project ID
+   * @param skill - Skill command to run
+   * @param timeout - Optional timeout
+   * @param resumeSessionId - Optional session ID to resume
+   * @param orchestrationId - Optional orchestration ID to link
+   * @returns Started workflow execution
+   */
+  startWorkflow(
+    projectId: string,
+    skill: string,
+    timeout?: number,
+    resumeSessionId?: string,
+    orchestrationId?: string
+  ): Promise<WorkflowExecution>;
+
+  /**
+   * Kill a running workflow
+   * @param workflowId - Workflow UUID
+   */
+  killWorkflow(workflowId: string): Promise<void>;
+}
+
+// =============================================================================
+// Orchestration Service Interface
+// =============================================================================
+
+/**
+ * Orchestration service abstraction
+ */
+export interface OrchestrationIO {
+  /**
+   * Get orchestration execution by ID
+   */
+  get(projectPath: string, orchestrationId: string): OrchestrationExecution | null;
+
+  /**
+   * Update orchestration state
+   */
+  update(projectPath: string, orchestrationId: string, updates: Partial<OrchestrationExecution>): void;
+
+  /**
+   * Transition to next phase
+   */
+  transitionToNextPhase(projectPath: string, orchestrationId: string): void;
+
+  /**
+   * Link workflow execution to orchestration
+   */
+  linkWorkflowExecution(projectPath: string, orchestrationId: string, workflowId: string): void;
+
+  /**
+   * Add cost to orchestration
+   */
+  addCost(projectPath: string, orchestrationId: string, cost: number): void;
+
+  /**
+   * Update batch tracking
+   */
+  updateBatches(projectPath: string, orchestrationId: string, batchPlan: BatchPlan): void;
+
+  /**
+   * Complete current batch
+   */
+  completeBatch(projectPath: string, orchestrationId: string): void;
+
+  /**
+   * Mark batch as healed
+   */
+  healBatch(projectPath: string, orchestrationId: string, healerSessionId: string): void;
+
+  /**
+   * Increment heal attempt counter
+   */
+  incrementHealAttempt(projectPath: string, orchestrationId: string): void;
+
+  /**
+   * Check if batch can be healed (has remaining attempts)
+   */
+  canHealBatch(projectPath: string, orchestrationId: string): boolean;
+
+  /**
+   * Set orchestration to needs_attention status
+   */
+  setNeedsAttention(
+    projectPath: string,
+    orchestrationId: string,
+    issue: string,
+    options: Array<'retry' | 'skip' | 'abort'>,
+    failedWorkflowId?: string
+  ): void;
+
+  /**
+   * Pause orchestration
+   */
+  pause(projectPath: string, orchestrationId: string): void;
+
+  /**
+   * Resume orchestration from paused state
+   */
+  resume(projectPath: string, orchestrationId: string): void;
+
+  /**
+   * Trigger merge phase
+   */
+  triggerMerge(projectPath: string, orchestrationId: string): void;
+
+  /**
+   * Mark orchestration as failed
+   */
+  fail(projectPath: string, orchestrationId: string, errorMessage: string): void;
+}
+
+// =============================================================================
+// Batch Parser Interface
+// =============================================================================
+
+/**
+ * Batch parsing abstraction
+ */
+export interface BatchParser {
+  /**
+   * Parse batches from project's tasks.md
+   * @param projectPath - Path to project root
+   * @param fallbackBatchSize - Batch size if no sections found
+   * @returns Batch plan or null if no tasks
+   */
+  parseBatches(projectPath: string, fallbackBatchSize: number): BatchPlan | null;
+}
+
+// =============================================================================
+// File Activity Interface
+// =============================================================================
+
+/**
+ * File activity tracking abstraction
+ */
+export interface FileActivityTracker {
+  /**
+   * Get last modification time of any relevant file
+   * @param projectPath - Path to project root
+   * @returns Timestamp in milliseconds
+   */
+  getLastFileChangeTime(projectPath: string): number;
+}
+
+// =============================================================================
+// Main Dependencies Interface (NFR-003)
+// =============================================================================
+
+/**
+ * All external dependencies for the orchestration runner
+ *
+ * This interface enables:
+ * - Unit testing with mocks
+ * - Separation of pure logic from I/O
+ * - Easy swapping of implementations
+ */
+export interface OrchestrationDeps {
+  /** Clock for time operations */
+  clock: Clock;
+
+  /** State file I/O */
+  stateIO: StateIO;
+
+  /** Workflow management */
+  workflowIO: WorkflowIO;
+
+  /** Orchestration service */
+  orchestrationIO: OrchestrationIO;
+
+  /** Batch parser */
+  batchParser: BatchParser;
+
+  /** File activity tracking */
+  fileActivity: FileActivityTracker;
+}
+
+// =============================================================================
+// Runner Context
+// =============================================================================
+
+/**
+ * Context passed through the orchestration runner
+ */
+export interface RunnerContext {
+  /** Project ID from registry */
+  projectId: string;
+  /** Path to project root */
+  projectPath: string;
+  /** Orchestration UUID */
+  orchestrationId: string;
+  /** Polling interval in ms */
+  pollingInterval: number;
+  /** Max polling attempts before timeout */
+  maxPollingAttempts: number;
+  /** Counter for consecutive unclear decisions */
+  consecutiveUnclearChecks: number;
+  /** Dependencies */
+  deps: OrchestrationDeps;
+}
+
+// =============================================================================
+// Spawn Intent Pattern Types (FR-006)
+// =============================================================================
+
+/**
+ * Spawn intent for preventing duplicate workflow spawns
+ */
+export interface SpawnIntent {
+  /** Skill being spawned */
+  skill: string;
+  /** Timestamp when intent was created */
+  timestamp: number;
+  /** Context for implement batches */
+  context?: string;
+}
diff --git a/packages/dashboard/src/lib/services/orchestration-validation.ts b/packages/dashboard/src/lib/services/orchestration-validation.ts
new file mode 100644
index 0000000..50e22b8
--- /dev/null
+++ b/packages/dashboard/src/lib/services/orchestration-validation.ts
@@ -0,0 +1,314 @@
+/**
+ * Orchestration State Validation - Pure Functions
+ *
+ * This module validates orchestration state files and ensures consistency
+ * between the project state file and execution state.
+ *
+ * Key validations (NFR-002):
+ * - step.index === STEP_INDEX_MAP[step.current]
+ * - step.current is valid
+ * - step.status is valid
+ * - batches.items[i].index === i
+ * - batches.current < batches.total (unless all complete)
+ * - recoveryContext exists when status === 'needs_attention'
+ * - Cross-file consistency
+ */
+
+import type { OrchestrationExecution, OrchestrationState, StepStatus } from '@specflow/shared';
+import { STEP_INDEX_MAP } from '@specflow/shared';
+
+// =============================================================================
+// Types
+// =============================================================================
+
+/**
+ * Result of state validation
+ */
+export interface ValidationResult {
+  /** Whether the state is valid */
+  valid: boolean;
+  /** List of validation issues found */
+  issues: string[];
+  /** Severity of the issues */
+  severity: 'none' | 'warning' | 'error';
+}
+
+/**
+ * Issue severity levels
+ */
+export type IssueSeverity = 'warning' | 'error';
+
+/**
+ * A single validation issue
+ */
+export interface ValidationIssue {
+  code: string;
+  message: string;
+  severity: IssueSeverity;
+  /** Suggested fix if available */
+  suggestedFix?: string;
+}
+
+// =============================================================================
+// Constants
+// =============================================================================
+
+/** Valid step names */
+const VALID_STEPS = ['design', 'analyze', 'implement', 'verify', 'merge'] as const;
+
+/** Valid step status values */
+const VALID_STATUSES: StepStatus[] = [
+  'not_started',
+  'pending',
+  'in_progress',
+  'complete',
+  'failed',
+  'blocked',
+  'skipped',
+];
+
+/** Valid batch status values */
+const VALID_BATCH_STATUSES = ['pending', 'running', 'completed', 'failed', 'healed'] as const;
+
+/** Valid orchestration status values */
+const VALID_ORCHESTRATION_STATUSES = [
+  'running',
+  'paused',
+  'waiting_merge',
+  'needs_attention',
+  'completed',
+  'failed',
+  'cancelled',
+] as const;
+
+// =============================================================================
+// Validation Functions (Pure)
+// =============================================================================
+
+/**
+ * Validate the orchestration state file
+ *
+ * Checks:
+ * - Phase exists
+ * - Step is valid
+ * - Status is valid
+ * - Step index matches step name
+ *
+ * @param state - Orchestration state from state file
+ * @returns Validation issues found
+ */
+export function validateOrchestrationState(state: OrchestrationState): ValidationIssue[] {
+  const issues: ValidationIssue[] = [];
+
+  // Check phase exists
+  if (!state.orchestration?.phase?.number) {
+    issues.push({
+      code: 'NO_ACTIVE_PHASE',
+      message: 'No active phase set in orchestration state',
+      severity: 'error',
+    });
+  }
+
+  // Check step is valid
+  const stepCurrent = state.orchestration?.step?.current;
+  if (stepCurrent && !VALID_STEPS.includes(stepCurrent as typeof VALID_STEPS[number])) {
+    issues.push({
+      code: 'INVALID_STEP',
+      message: `Invalid step: ${stepCurrent}. Must be one of: ${VALID_STEPS.join(', ')}`,
+      severity: 'error',
+      suggestedFix: 'Set step.current to a valid step name',
+    });
+  }
+
+  // Check status is valid
+  const stepStatus = state.orchestration?.step?.status;
+  if (stepStatus && !VALID_STATUSES.includes(stepStatus)) {
+    issues.push({
+      code: 'INVALID_STATUS',
+      message: `Invalid step status: ${stepStatus}. Must be one of: ${VALID_STATUSES.join(', ')}`,
+      severity: 'error',
+      suggestedFix: 'Set step.status to a valid status value',
+    });
+  }
+
+  // Check step.index matches step.current (G7.1)
+  if (stepCurrent && VALID_STEPS.includes(stepCurrent as typeof VALID_STEPS[number])) {
+    const expectedIndex = STEP_INDEX_MAP[stepCurrent as keyof typeof STEP_INDEX_MAP];
+    const actualIndex = state.orchestration?.step?.index;
+    if (expectedIndex !== undefined && actualIndex !== undefined && actualIndex !== expectedIndex) {
+      issues.push({
+        code: 'STEP_INDEX_MISMATCH',
+        message: `Step index mismatch: ${stepCurrent} should be index ${expectedIndex}, but got ${actualIndex}`,
+        severity: 'warning',
+        suggestedFix: `Set step.index to ${expectedIndex}`,
+      });
+    }
+  }
+
+  return issues;
+}
+
+/**
+ * Validate the orchestration execution state
+ *
+ * Checks:
+ * - Status is valid
+ * - Batch indices are sequential
+ * - batches.current < batches.total
+ * - recoveryContext exists when needed
+ *
+ * @param execution - Orchestration execution state
+ * @returns Validation issues found
+ */
+export function validateExecutionState(execution: OrchestrationExecution): ValidationIssue[] {
+  const issues: ValidationIssue[] = [];
+
+  // Check execution status is valid
+  if (!VALID_ORCHESTRATION_STATUSES.includes(execution.status)) {
+    issues.push({
+      code: 'INVALID_EXECUTION_STATUS',
+      message: `Invalid execution status: ${execution.status}`,
+      severity: 'error',
+    });
+  }
+
+  // Check batch indices match position (G7.4)
+  execution.batches.items.forEach((batch, index) => {
+    if (batch.index !== index) {
+      issues.push({
+        code: 'BATCH_INDEX_MISMATCH',
+        message: `Batch at position ${index} has index ${batch.index}`,
+        severity: 'error',
+        suggestedFix: `Set batch.index to ${index}`,
+      });
+    }
+
+    // Validate batch status
+    if (!VALID_BATCH_STATUSES.includes(batch.status)) {
+      issues.push({
+        code: 'INVALID_BATCH_STATUS',
+        message: `Batch ${index} has invalid status: ${batch.status}`,
+        severity: 'error',
+      });
+    }
+  });
+
+  // Check batches.current is valid (G7.5)
+  if (execution.batches.total > 0 && execution.batches.current >= execution.batches.total) {
+    // Only an issue if not all batches are complete
+    const allComplete = execution.batches.items.every(
+      (b) => b.status === 'completed' || b.status === 'healed'
+    );
+    if (!allComplete) {
+      issues.push({
+        code: 'BATCH_CURRENT_OUT_OF_BOUNDS',
+        message: `batches.current (${execution.batches.current}) >= batches.total (${execution.batches.total})`,
+        severity: 'error',
+        suggestedFix: `Set batches.current to a value less than ${execution.batches.total}`,
+      });
+    }
+  }
+
+  // Check recoveryContext exists when status is needs_attention (G7.6)
+  if (execution.status === 'needs_attention' && !execution.recoveryContext) {
+    issues.push({
+      code: 'MISSING_RECOVERY_CONTEXT',
+      message: 'needs_attention status requires recoveryContext to be set',
+      severity: 'error',
+      suggestedFix: 'Set recoveryContext with issue, options, and optionally failedWorkflowId',
+    });
+  }
+
+  // Check heal attempts are non-negative
+  execution.batches.items.forEach((batch, index) => {
+    if (batch.healAttempts < 0) {
+      issues.push({
+        code: 'INVALID_HEAL_ATTEMPTS',
+        message: `Batch ${index} has negative healAttempts: ${batch.healAttempts}`,
+        severity: 'error',
+      });
+    }
+  });
+
+  return issues;
+}
+
+/**
+ * Validate cross-file consistency between state and execution
+ *
+ * Checks:
+ * - Step in state matches currentPhase in execution
+ *
+ * @param state - Orchestration state from state file
+ * @param execution - Orchestration execution state
+ * @returns Validation issues found
+ */
+export function validateCrossFileConsistency(
+  state: OrchestrationState,
+  execution: OrchestrationExecution
+): ValidationIssue[] {
+  const issues: ValidationIssue[] = [];
+
+  // Check step/phase alignment (G7.7)
+  const stepCurrent = state.orchestration?.step?.current;
+  const execPhase = execution.currentPhase;
+
+  if (stepCurrent && execPhase && execPhase !== 'complete') {
+    if (stepCurrent !== execPhase) {
+      issues.push({
+        code: 'STEP_PHASE_MISMATCH',
+        message: `State has step '${stepCurrent}' but execution has phase '${execPhase}'`,
+        severity: 'warning',
+        suggestedFix: `Align state.orchestration.step.current with execution.currentPhase`,
+      });
+    }
+  }
+
+  return issues;
+}
+
+/**
+ * Validate both state files and their consistency
+ *
+ * This is the main validation entry point that runs all checks.
+ *
+ * @param state - Orchestration state from state file
+ * @param execution - Orchestration execution state
+ * @returns Combined validation result
+ */
+export function validateState(
+  state: OrchestrationState,
+  execution: OrchestrationExecution
+): ValidationResult {
+  const stateIssues = validateOrchestrationState(state);
+  const executionIssues = validateExecutionState(execution);
+  const crossFileIssues = validateCrossFileConsistency(state, execution);
+
+  const allIssues = [...stateIssues, ...executionIssues, ...crossFileIssues];
+  const hasErrors = allIssues.some((i) => i.severity === 'error');
+  const hasWarnings = allIssues.some((i) => i.severity === 'warning');
+
+  return {
+    valid: allIssues.length === 0,
+    issues: allIssues.map((i) => i.message),
+    severity: hasErrors ? 'error' : hasWarnings ? 'warning' : 'none',
+  };
+}
+
+/**
+ * Get detailed validation issues with codes and suggested fixes
+ *
+ * @param state - Orchestration state from state file
+ * @param execution - Orchestration execution state
+ * @returns Detailed validation issues
+ */
+export function getDetailedValidationIssues(
+  state: OrchestrationState,
+  execution: OrchestrationExecution
+): ValidationIssue[] {
+  const stateIssues = validateOrchestrationState(state);
+  const executionIssues = validateExecutionState(execution);
+  const crossFileIssues = validateCrossFileConsistency(state, execution);
+
+  return [...stateIssues, ...executionIssues, ...crossFileIssues];
+}
diff --git a/packages/dashboard/src/lib/services/workflow-service.ts b/packages/dashboard/src/lib/services/workflow-service.ts
index 780a2bf..cba408a 100644
--- a/packages/dashboard/src/lib/services/workflow-service.ts
+++ b/packages/dashboard/src/lib/services/workflow-service.ts
@@ -1303,6 +1303,16 @@ ${claudePath} -p --output-format json --dangerously-skip-permissions --disallowe
           exec.logs.push(
             `[WAITING] ${cliResult.structured_output.questions?.length || 0} questions`
           );
+
+          // Broadcast questions via SSE so the UI can display them
+          if (cliResult.structured_output.questions && exec.sessionId) {
+            const { broadcastWorkflowQuestions } = require('../watcher');
+            broadcastWorkflowQuestions(
+              exec.sessionId,
+              exec.projectId,
+              cliResult.structured_output.questions
+            );
+          }
         } else if (cliResult.structured_output.status === 'completed') {
           exec.status = 'completed';
           exec.logs.push('[COMPLETE] Workflow finished!');
diff --git a/packages/dashboard/src/lib/session-parser.ts b/packages/dashboard/src/lib/session-parser.ts
index 8545c6c..d645ee5 100644
--- a/packages/dashboard/src/lib/session-parser.ts
+++ b/packages/dashboard/src/lib/session-parser.ts
@@ -1,3 +1,32 @@
+/**
+ * Question option from AskUserQuestion tool call.
+ */
+export interface QuestionOption {
+  label: string;
+  description?: string;
+}
+
+/**
+ * Question from AskUserQuestion tool call.
+ */
+export interface QuestionInfo {
+  question: string;
+  header?: string;
+  options: QuestionOption[];
+  multiSelect?: boolean;
+}
+
+/**
+ * Structured output from workflow completion (StructuredOutput tool call).
+ */
+export interface WorkflowOutput {
+  status: 'completed' | 'error' | 'needs_input' | 'cancelled' | string;
+  phase?: string;
+  message?: string;
+  artifacts?: Array<{ path: string; action: string }>;
+  questions?: QuestionInfo[];
+}
+
 /**
  * Session message from Claude JSONL files.
  * Only user and assistant messages are displayed; tool calls are parsed for metrics.
@@ -14,6 +43,10 @@ export interface SessionMessage {
   commandName?: string;
   /** Whether this is a session end indicator */
   isSessionEnd?: boolean;
+  /** Questions from AskUserQuestion tool call (for assistant messages) */
+  questions?: QuestionInfo[];
+  /** Agent tasks launched from this message */
+  agentTasks?: AgentTaskInfo[];
 }
 
 /**
@@ -29,11 +62,21 @@ export interface ToolCallMetrics {
  */
 export interface ToolCallInfo {
   name: string;
-  operation: 'read' | 'write' | 'edit' | 'search' | 'execute' | 'todo';
+  operation: 'read' | 'write' | 'edit' | 'search' | 'execute' | 'todo' | 'agent';
   files: string[];
   input?: Record<string, unknown>;
 }
 
+/**
+ * Agent task information from Task tool calls.
+ */
+export interface AgentTaskInfo {
+  id: string;
+  description: string;
+  subagentType: string;
+  status: 'running' | 'completed';
+}
+
 /**
  * Todo item from TodoWrite tool calls.
  */
@@ -51,6 +94,10 @@ export interface ParseResult {
   toolCall?: ToolCallMetrics;
   toolCalls?: ToolCallInfo[];
   todos?: TodoItem[];
+  workflowOutput?: WorkflowOutput;
+  agentTasks?: AgentTaskInfo[];
+  /** Tool IDs that received results (to mark agents as completed) */
+  completedToolIds?: string[];
 }
 
 /**
@@ -62,6 +109,10 @@ export interface SessionData {
   startTime?: string;
   toolCalls: ToolCallInfo[];
   currentTodos: TodoItem[];
+  /** Final structured output from workflow completion (if any) */
+  workflowOutput?: WorkflowOutput;
+  /** Currently running or recently completed agent tasks */
+  agentTasks: AgentTaskInfo[];
 }
 
 /**
@@ -148,6 +199,8 @@ function getToolOperation(name: string): ToolCallInfo['operation'] {
       return 'search';
     case 'TodoWrite':
       return 'todo';
+    case 'Task':
+      return 'agent';
     case 'Bash':
     default:
       return 'execute';
@@ -157,12 +210,21 @@ function getToolOperation(name: string): ToolCallInfo['operation'] {
 /**
  * Extract detailed tool call information for UI display.
  */
-function extractToolCallInfos(content: unknown): { toolCalls: ToolCallInfo[]; todos: TodoItem[] } {
+function extractToolCallInfos(content: unknown): {
+  toolCalls: ToolCallInfo[];
+  todos: TodoItem[];
+  questions: QuestionInfo[];
+  workflowOutput?: WorkflowOutput;
+  agentTasks: AgentTaskInfo[];
+} {
   const toolCalls: ToolCallInfo[] = [];
   let todos: TodoItem[] = [];
+  const questions: QuestionInfo[] = [];
+  let workflowOutput: WorkflowOutput | undefined;
+  const agentTasks: AgentTaskInfo[] = [];
 
   if (!Array.isArray(content)) {
-    return { toolCalls, todos };
+    return { toolCalls, todos, questions, agentTasks };
   }
 
   for (const block of content) {
@@ -221,6 +283,100 @@ function extractToolCallInfos(content: unknown): { toolCalls: ToolCallInfo[]; to
             }
             break;
           }
+          case 'AskUserQuestion': {
+            // Extract questions from AskUserQuestion calls
+            const questionItems = input?.questions;
+            if (Array.isArray(questionItems)) {
+              for (const q of questionItems) {
+                if (typeof q === 'object' && q !== null && typeof q.question === 'string') {
+                  const questionInfo: QuestionInfo = {
+                    question: q.question,
+                    header: typeof q.header === 'string' ? q.header : undefined,
+                    options: [],
+                    multiSelect: typeof q.multiSelect === 'boolean' ? q.multiSelect : false,
+                  };
+                  // Extract options
+                  if (Array.isArray(q.options)) {
+                    for (const opt of q.options) {
+                      if (typeof opt === 'object' && opt !== null && typeof opt.label === 'string') {
+                        questionInfo.options.push({
+                          label: opt.label,
+                          description: typeof opt.description === 'string' ? opt.description : undefined,
+                        });
+                      }
+                    }
+                  }
+                  questions.push(questionInfo);
+                }
+              }
+            }
+            break;
+          }
+          case 'StructuredOutput': {
+            // Extract structured output from workflow completion
+            if (input && typeof input.status === 'string') {
+              workflowOutput = {
+                status: input.status as WorkflowOutput['status'],
+                phase: typeof input.phase === 'string' ? input.phase : undefined,
+                message: typeof input.message === 'string' ? input.message : undefined,
+              };
+              // Extract artifacts if present
+              if (Array.isArray(input.artifacts)) {
+                workflowOutput.artifacts = input.artifacts
+                  .filter(
+                    (a): a is { path: string; action: string } =>
+                      typeof a === 'object' &&
+                      a !== null &&
+                      typeof a.path === 'string' &&
+                      typeof a.action === 'string'
+                  );
+              }
+              // Extract questions if present (for needs_input status)
+              if (Array.isArray(input.questions)) {
+                workflowOutput.questions = input.questions
+                  .filter(
+                    (q): q is { question: string } =>
+                      typeof q === 'object' && q !== null && typeof q.question === 'string'
+                  )
+                  .map((q) => ({
+                    question: q.question,
+                    header: typeof (q as Record<string, unknown>).header === 'string'
+                      ? (q as Record<string, unknown>).header as string
+                      : undefined,
+                    options: Array.isArray((q as Record<string, unknown>).options)
+                      ? ((q as Record<string, unknown>).options as unknown[])
+                          .filter(
+                            (o): o is { label: string } =>
+                              typeof o === 'object' && o !== null && typeof (o as Record<string, unknown>).label === 'string'
+                          )
+                          .map((o) => ({
+                            label: (o as Record<string, unknown>).label as string,
+                            description: typeof (o as Record<string, unknown>).description === 'string'
+                              ? (o as Record<string, unknown>).description as string
+                              : undefined,
+                          }))
+                      : [],
+                    multiSelect: typeof (q as Record<string, unknown>).multiSelect === 'boolean'
+                      ? (q as Record<string, unknown>).multiSelect as boolean
+                      : false,
+                  }));
+              }
+            }
+            break;
+          }
+          case 'Task': {
+            // Extract agent task information
+            const id = 'id' in block ? String(block.id) : '';
+            const description = typeof input?.description === 'string' ? input.description : 'Running task...';
+            const subagentType = typeof input?.subagent_type === 'string' ? input.subagent_type : 'general-purpose';
+            agentTasks.push({
+              id,
+              description,
+              subagentType,
+              status: 'running', // Will be updated to 'completed' when result is found
+            });
+            break;
+          }
         }
 
         toolCalls.push({
@@ -233,7 +389,7 @@ function extractToolCallInfos(content: unknown): { toolCalls: ToolCallInfo[]; to
     }
   }
 
-  return { toolCalls, todos };
+  return { toolCalls, todos, questions, workflowOutput, agentTasks };
 }
 
 /**
@@ -337,18 +493,32 @@ export function parseSessionLine(line: string): ParseResult {
       const textContent = extractTextContent(messageContent);
 
       // Extract detailed tool call info (for assistant messages)
-      const { toolCalls: detailedToolCalls, todos } = extractToolCallInfos(messageContent);
+      const { toolCalls: detailedToolCalls, todos, questions, workflowOutput, agentTasks } = extractToolCallInfos(messageContent);
+
+      // Extract completed tool IDs from tool_result blocks (user messages contain these)
+      const completedToolIds: string[] = [];
+      if (Array.isArray(messageContent)) {
+        for (const block of messageContent) {
+          if (typeof block === 'object' && block !== null && 'type' in block && block.type === 'tool_result' && 'tool_use_id' in block) {
+            completedToolIds.push(String(block.tool_use_id));
+          }
+        }
+      }
 
       // Skip messages that are only tool calls (no text content)
-      if (!textContent) {
+      // BUT: If there are questions, workflowOutput, or agentTasks, we still want to capture them
+      if (!textContent && questions.length === 0 && !workflowOutput && agentTasks.length === 0) {
         // But still extract tool call metrics
         const toolCallMetrics = extractToolCallMetrics(messageContent);
-        if (toolCallMetrics.length > 0 || detailedToolCalls.length > 0) {
+        if (toolCallMetrics.length > 0 || detailedToolCalls.length > 0 || completedToolIds.length > 0) {
           return {
             message: null,
             toolCall: toolCallMetrics[0],
             toolCalls: detailedToolCalls.length > 0 ? detailedToolCalls : undefined,
             todos: todos.length > 0 ? todos : undefined,
+            workflowOutput,
+            agentTasks: agentTasks.length > 0 ? agentTasks : undefined,
+            completedToolIds: completedToolIds.length > 0 ? completedToolIds : undefined,
           };
         }
         return { message: null };
@@ -364,15 +534,20 @@ export function parseSessionLine(line: string): ParseResult {
       return {
         message: {
           role: data.type,
-          content: textContent,
+          content: textContent || '', // May be empty if only questions
           timestamp: data.timestamp,
           toolCalls: detailedToolCalls.length > 0 ? detailedToolCalls : undefined,
           isCommandInjection: commandInfo?.isCommand,
           commandName: commandInfo?.commandName ?? undefined,
+          questions: questions.length > 0 ? questions : undefined,
+          agentTasks: agentTasks.length > 0 ? agentTasks : undefined,
         },
         toolCall: toolCallMetrics.length > 0 ? toolCallMetrics[0] : undefined,
         toolCalls: detailedToolCalls.length > 0 ? detailedToolCalls : undefined,
         todos: todos.length > 0 ? todos : undefined,
+        workflowOutput,
+        agentTasks: agentTasks.length > 0 ? agentTasks : undefined,
+        completedToolIds: completedToolIds.length > 0 ? completedToolIds : undefined,
       };
     }
 
@@ -398,6 +573,9 @@ export function parseSessionLines(lines: string[]): SessionData {
   const allToolCalls: ToolCallInfo[] = [];
   let currentTodos: TodoItem[] = [];
   let startTime: string | undefined;
+  let workflowOutput: WorkflowOutput | undefined;
+  // Track agent tasks by ID for status updates
+  const agentTasksMap = new Map<string, AgentTaskInfo>();
 
   for (const line of lines) {
     const result = parseSessionLine(line);
@@ -416,6 +594,36 @@ export function parseSessionLines(lines: string[]): SessionData {
       }
     }
 
+    // Track agent tasks
+    if (result.agentTasks && result.agentTasks.length > 0) {
+      for (const task of result.agentTasks) {
+        agentTasksMap.set(task.id, task);
+      }
+      // Also associate with the message that launched them
+      if (result.message) {
+        result.message.agentTasks = result.agentTasks;
+      } else {
+        // Associate with last assistant message
+        const lastAssistantMessage = [...messages].reverse().find((m) => m.role === 'assistant');
+        if (lastAssistantMessage) {
+          lastAssistantMessage.agentTasks = [
+            ...(lastAssistantMessage.agentTasks ?? []),
+            ...result.agentTasks,
+          ];
+        }
+      }
+    }
+
+    // Mark agent tasks as completed when we see their tool_result
+    if (result.completedToolIds && result.completedToolIds.length > 0) {
+      for (const toolId of result.completedToolIds) {
+        const task = agentTasksMap.get(toolId);
+        if (task) {
+          task.status = 'completed';
+        }
+      }
+    }
+
     // Aggregate tool calls and associate with preceding assistant message
     if (result.toolCalls && result.toolCalls.length > 0) {
       allToolCalls.push(...result.toolCalls);
@@ -446,9 +654,17 @@ export function parseSessionLines(lines: string[]): SessionData {
     if (result.todos && result.todos.length > 0) {
       currentTodos = result.todos;
     }
+
+    // Track workflow output (last StructuredOutput wins)
+    if (result.workflowOutput) {
+      workflowOutput = result.workflowOutput;
+    }
   }
 
-  return { messages, filesModified, startTime, toolCalls: allToolCalls, currentTodos };
+  // Convert agent tasks map to array (preserves status updates)
+  const agentTasks = Array.from(agentTasksMap.values());
+
+  return { messages, filesModified, startTime, toolCalls: allToolCalls, currentTodos, workflowOutput, agentTasks };
 }
 
 /**
diff --git a/packages/dashboard/src/lib/session-polling-manager.ts b/packages/dashboard/src/lib/session-polling-manager.ts
deleted file mode 100644
index 1ccf426..0000000
--- a/packages/dashboard/src/lib/session-polling-manager.ts
+++ /dev/null
@@ -1,333 +0,0 @@
-/**
- * SINGLE SOURCE OF TRUTH for session content polling.
- *
- * Why polling? Session JSONL files live in ~/.claude/projects/{hash}/
- * which is outside project directories and cannot be file-watched.
- *
- * Key behaviors:
- * - Single 3-second poll loop (not per-subscription)
- * - Auto-detects session end from JSONL content
- * - Stops polling when no active subscriptions
- * - Emits updates via listener pattern (like watcher.ts)
- *
- * Usage:
- *   import { sessionPollingManager } from '@/lib/session-polling-manager';
- *
- *   // Subscribe to session updates
- *   sessionPollingManager.subscribe(sessionId, projectPath);
- *
- *   // Listen for updates
- *   const unsubscribe = sessionPollingManager.addListener((event) => {
- *     if (event.sessionId === mySessionId) {
- *       setContent(event.content);
- *     }
- *   });
- *
- *   // Cleanup
- *   sessionPollingManager.unsubscribe(sessionId);
- *   unsubscribe();
- */
-
-import type { SessionMessage, ToolCallInfo, TodoItem } from './session-parser';
-
-const POLL_INTERVAL_MS = 5000; // 5 seconds - balanced between responsiveness and efficiency
-const DEFAULT_TAIL_LIMIT = 100;
-
-/**
- * Session content returned from polling
- */
-export interface SessionContent {
-  messages: SessionMessage[];
-  filesModified: number;
-  elapsed: number;
-  sessionId: string;
-  toolCalls?: ToolCallInfo[];
-  currentTodos?: TodoItem[];
-  /** True if session has ended (detected from JSONL) */
-  hasEnded?: boolean;
-}
-
-/**
- * Update event emitted when session content changes
- */
-export interface SessionUpdateEvent {
-  sessionId: string;
-  projectPath: string;
-  content: SessionContent;
-  error?: string;
-}
-
-/**
- * Internal subscription tracking
- */
-interface SessionSubscription {
-  sessionId: string;
-  projectPath: string;
-  /** Last known content hash to detect changes */
-  lastHash: string;
-  /** Whether this subscription is still active */
-  active: boolean;
-}
-
-/**
- * Fetch session content from API
- */
-async function fetchSessionContent(
-  projectPath: string,
-  sessionId: string,
-  tail: number = DEFAULT_TAIL_LIMIT
-): Promise<SessionContent> {
-  const params = new URLSearchParams({
-    projectPath,
-    sessionId,
-    tail: String(tail),
-  });
-
-  const res = await fetch(`/api/session/content?${params}`);
-  const data = await res.json();
-
-  if (!res.ok) {
-    throw new Error(data.error || `Failed to fetch session: ${res.status}`);
-  }
-
-  return data as SessionContent;
-}
-
-/**
- * Simple hash function for content comparison
- */
-function hashContent(content: SessionContent): string {
-  return `${content.messages.length}:${content.elapsed}:${content.hasEnded}`;
-}
-
-/**
- * Session Polling Manager - Singleton
- *
- * Centralizes all session content polling into a single coordinated loop.
- */
-class SessionPollingManager {
-  private subscriptions = new Map<string, SessionSubscription>();
-  private pollInterval: NodeJS.Timeout | null = null;
-  private listeners = new Set<(event: SessionUpdateEvent) => void>();
-  private cache = new Map<string, SessionContent>();
-  private isPolling = false;
-
-  /**
-   * Subscribe to session updates
-   * Starts polling if this is the first subscription
-   */
-  subscribe(sessionId: string, projectPath: string): void {
-    const existing = this.subscriptions.get(sessionId);
-    if (existing) {
-      // Reactivate if was inactive
-      existing.active = true;
-      existing.projectPath = projectPath;
-      return;
-    }
-
-    this.subscriptions.set(sessionId, {
-      sessionId,
-      projectPath,
-      lastHash: '',
-      active: true,
-    });
-
-    console.log(`[SessionPolling] Subscribed: ${sessionId}`);
-
-    // Start polling if not already running
-    if (!this.isPolling) {
-      this.startPolling();
-    }
-
-    // Immediately poll this session for initial data
-    this.pollSession(sessionId, projectPath).catch(console.error);
-  }
-
-  /**
-   * Unsubscribe from session updates
-   * Stops polling if this was the last subscription
-   */
-  unsubscribe(sessionId: string): void {
-    const subscription = this.subscriptions.get(sessionId);
-    if (subscription) {
-      subscription.active = false;
-      console.log(`[SessionPolling] Unsubscribed: ${sessionId}`);
-
-      // Check if any active subscriptions remain
-      const hasActive = Array.from(this.subscriptions.values()).some(s => s.active);
-      if (!hasActive) {
-        this.stopPolling();
-      }
-    }
-  }
-
-  /**
-   * Add listener for session updates
-   * Returns cleanup function
-   */
-  addListener(fn: (event: SessionUpdateEvent) => void): () => void {
-    this.listeners.add(fn);
-    return () => {
-      this.listeners.delete(fn);
-    };
-  }
-
-  /**
-   * Get cached content for a session (for initial render)
-   */
-  getCache(sessionId: string): SessionContent | null {
-    return this.cache.get(sessionId) ?? null;
-  }
-
-  /**
-   * Clear all subscriptions and stop polling
-   */
-  clear(): void {
-    this.stopPolling();
-    this.subscriptions.clear();
-    this.cache.clear();
-    this.listeners.clear();
-  }
-
-  /**
-   * Start the polling loop
-   */
-  private startPolling(): void {
-    if (this.isPolling) return;
-
-    this.isPolling = true;
-    console.log('[SessionPolling] Starting poll loop');
-
-    this.pollInterval = setInterval(() => {
-      this.pollAll();
-    }, POLL_INTERVAL_MS);
-  }
-
-  /**
-   * Stop the polling loop
-   */
-  private stopPolling(): void {
-    if (this.pollInterval) {
-      clearInterval(this.pollInterval);
-      this.pollInterval = null;
-    }
-    this.isPolling = false;
-    console.log('[SessionPolling] Stopped poll loop');
-  }
-
-  /**
-   * Poll all active subscriptions
-   */
-  private async pollAll(): Promise<void> {
-    const activeSubscriptions = Array.from(this.subscriptions.values()).filter(
-      s => s.active
-    );
-
-    // Poll in parallel but don't fail on individual errors
-    await Promise.allSettled(
-      activeSubscriptions.map(sub =>
-        this.pollSession(sub.sessionId, sub.projectPath)
-      )
-    );
-  }
-
-  /**
-   * Poll a single session and emit update if changed
-   */
-  private async pollSession(
-    sessionId: string,
-    projectPath: string
-  ): Promise<void> {
-    const subscription = this.subscriptions.get(sessionId);
-    if (!subscription || !subscription.active) return;
-
-    try {
-      const content = await fetchSessionContent(projectPath, sessionId);
-
-      // Check if content changed
-      const hash = hashContent(content);
-      if (hash === subscription.lastHash) {
-        return; // No change
-      }
-
-      subscription.lastHash = hash;
-      this.cache.set(sessionId, content);
-
-      // Emit update to listeners
-      const event: SessionUpdateEvent = {
-        sessionId,
-        projectPath,
-        content,
-      };
-
-      this.listeners.forEach(listener => {
-        try {
-          listener(event);
-        } catch (err) {
-          console.error('[SessionPolling] Listener error:', err);
-        }
-      });
-
-      // If session has ended, mark subscription inactive
-      if (content.hasEnded) {
-        subscription.active = false;
-        console.log(`[SessionPolling] Session ended: ${sessionId}`);
-
-        // Check if any active subscriptions remain
-        const hasActive = Array.from(this.subscriptions.values()).some(s => s.active);
-        if (!hasActive) {
-          this.stopPolling();
-        }
-      }
-    } catch (err) {
-      const errorMessage = err instanceof Error ? err.message : 'Unknown error';
-      console.error(`[SessionPolling] Error polling ${sessionId}:`, errorMessage);
-
-      // Emit error event
-      const event: SessionUpdateEvent = {
-        sessionId,
-        projectPath,
-        content: this.cache.get(sessionId) ?? {
-          messages: [],
-          filesModified: 0,
-          elapsed: 0,
-          sessionId,
-        },
-        error: errorMessage,
-      };
-
-      this.listeners.forEach(listener => {
-        try {
-          listener(event);
-        } catch (listenerErr) {
-          console.error('[SessionPolling] Listener error:', listenerErr);
-        }
-      });
-    }
-  }
-
-  /**
-   * Force an immediate poll for a session
-   */
-  async forcePoll(sessionId: string): Promise<SessionContent | null> {
-    const subscription = this.subscriptions.get(sessionId);
-    if (!subscription) return null;
-
-    await this.pollSession(sessionId, subscription.projectPath);
-    return this.cache.get(sessionId) ?? null;
-  }
-
-  /**
-   * Get subscription count (for debugging)
-   */
-  getSubscriptionCount(): { total: number; active: number } {
-    const all = Array.from(this.subscriptions.values());
-    return {
-      total: all.length,
-      active: all.filter(s => s.active).length,
-    };
-  }
-}
-
-// Export singleton instance
-export const sessionPollingManager = new SessionPollingManager();
diff --git a/packages/dashboard/src/lib/watcher.ts b/packages/dashboard/src/lib/watcher.ts
index 4732aae..87a1ff3 100644
--- a/packages/dashboard/src/lib/watcher.ts
+++ b/packages/dashboard/src/lib/watcher.ts
@@ -11,9 +11,14 @@ import {
   type SSEEvent,
   type TasksData,
   type WorkflowIndex,
+  type WorkflowIndexEntry,
   type WorkflowData,
   type PhasesData,
+  type SessionContent,
+  type SessionQuestion,
 } from '@specflow/shared';
+import { readdirSync, statSync, existsSync, readFileSync } from 'fs';
+import { v4 as uuidv4 } from 'uuid';
 import { parseTasks, type ParseTasksOptions } from './task-parser';
 import { parseRoadmapToPhasesData } from './roadmap-parser';
 import {
@@ -21,6 +26,9 @@ import {
   getStateFilePathSync,
   migrateStateFiles,
 } from './state-paths';
+import { getProjectSessionDir, getClaudeProjectsDir } from './project-hash';
+import { reconcileRunners } from './services/orchestration-runner';
+import { orchestrationService } from './services/orchestration-service';
 
 // Debounce delay in milliseconds
 const DEBOUNCE_MS = 200;
@@ -30,12 +38,14 @@ const HEARTBEAT_MS = 30000;
 
 // Global state for the watcher singleton
 let watcher: FSWatcher | null = null;
+let sessionWatcher: FSWatcher | null = null;
 let registryPath: string;
 let currentRegistry: Registry | null = null;
 let watchedStatePaths: Set<string> = new Set();
 let watchedTasksPaths: Set<string> = new Set();
 let watchedWorkflowPaths: Set<string> = new Set();
 let watchedPhasesPaths: Set<string> = new Set();
+let watchedSessionDirs: Set<string> = new Set();
 
 // Cache workflow data to detect actual changes
 const workflowCache: Map<string, string> = new Map(); // projectId -> JSON string
@@ -43,6 +53,12 @@ const workflowCache: Map<string, string> = new Map(); // projectId -> JSON strin
 // Cache phases data to detect actual changes
 const phasesCache: Map<string, string> = new Map(); // projectId -> JSON string
 
+// Cache session content to detect actual changes
+const sessionCache: Map<string, string> = new Map(); // sessionId -> JSON string
+
+// Session debounce (faster for real-time feel)
+const SESSION_DEBOUNCE_MS = 100;
+
 // Event listeners (SSE connections)
 type EventListener = (event: SSEEvent) => void;
 const listeners: Set<EventListener> = new Set();
@@ -54,7 +70,7 @@ const debounceTimers: Map<string, NodeJS.Timeout> = new Map();
 /**
  * Broadcast event to all connected listeners
  */
-function broadcast(event: SSEEvent): void {
+export function broadcast(event: SSEEvent): void {
   listeners.forEach((listener) => {
     try {
       listener(event);
@@ -64,6 +80,43 @@ function broadcast(event: SSEEvent): void {
   });
 }
 
+/**
+ * Broadcast a session:question event for workflow-mode questions
+ * Called by workflow-service when structured_output has questions
+ */
+export function broadcastWorkflowQuestions(
+  sessionId: string,
+  projectId: string,
+  questions: Array<{
+    question: string;
+    header?: string;
+    options?: Array<{ label: string; description?: string }>;
+    multiSelect?: boolean;
+  }>
+): void {
+  if (!questions || questions.length === 0) return;
+
+  const mappedQuestions = questions.map((q) => ({
+    question: q.question,
+    header: q.header,
+    options: (q.options || []).map((opt) => ({
+      label: opt.label,
+      description: opt.description ?? '',
+    })),
+    multiSelect: q.multiSelect,
+  }));
+
+  broadcast({
+    type: 'session:question',
+    timestamp: new Date().toISOString(),
+    projectId,
+    sessionId,
+    data: {
+      questions: mappedQuestions,
+    },
+  });
+}
+
 /**
  * Debounced file change handler
  */
@@ -112,18 +165,28 @@ async function readState(projectId: string, statePath: string): Promise<Orchestr
       fs.readFile(statePath, 'utf-8'),
       fs.stat(statePath),
     ]);
-    const parsed = OrchestrationStateSchema.parse(JSON.parse(content));
+    // Use safeParse to gracefully handle older/incompatible state file formats
+    // from other projects without spamming logs
+    const result = OrchestrationStateSchema.safeParse(JSON.parse(content));
+    if (!result.success) {
+      // Silently skip projects with incompatible state schemas
+      // These are typically older projects that haven't been updated
+      return null;
+    }
     // Add file mtime for activity tracking (more reliable than last_updated field)
     return {
-      ...parsed,
+      ...result.data,
       _fileMtime: stats.mtime.toISOString(),
     };
   } catch (error) {
-    // Silently return null for missing files (ENOENT)
-    // Only log actual errors
+    // Silently return null for missing files (ENOENT) or JSON parse errors
     if (error && typeof error === 'object' && 'code' in error && error.code === 'ENOENT') {
       return null;
     }
+    // Also silently handle JSON parse errors (corrupted files)
+    if (error instanceof SyntaxError) {
+      return null;
+    }
     console.error(`[Watcher] Error reading state for ${projectId}:`, error);
     return null;
   }
@@ -146,6 +209,9 @@ async function handleRegistryChange(): Promise<void> {
   // Update watched state paths
   await updateWatchedPaths(newRegistry);
   currentRegistry = newRegistry;
+
+  // Update project path map for session watching
+  updateProjectPathMap();
 }
 
 /**
@@ -245,13 +311,148 @@ function buildWorkflowData(index: WorkflowIndex): WorkflowData {
 }
 
 /**
- * Handle workflow index file change
+ * Discover CLI sessions from Claude projects directory.
+ * Scans ~/.claude/projects/{hash}/ for .jsonl files and creates WorkflowIndexEntry objects.
+ * These are sessions started from CLI that weren't tracked by the dashboard.
+ *
+ * @param projectPath - Absolute path to the project
+ * @param trackedSessionIds - Set of session IDs already tracked by dashboard (to avoid duplicates)
+ * @param limit - Maximum number of sessions to return (default 50)
+ */
+function discoverCliSessions(
+  projectPath: string,
+  trackedSessionIds: Set<string>,
+  limit: number = 50
+): WorkflowIndexEntry[] {
+  const sessionDir = getProjectSessionDir(projectPath);
+
+  if (!existsSync(sessionDir)) {
+    return [];
+  }
+
+  try {
+    const files = readdirSync(sessionDir);
+    const jsonlFiles = files.filter(f => f.endsWith('.jsonl'));
+
+    // Get file stats and create entries
+    const entries: WorkflowIndexEntry[] = [];
+
+    for (const file of jsonlFiles) {
+      const sessionId = file.replace('.jsonl', '');
+
+      // Skip if already tracked by dashboard
+      if (trackedSessionIds.has(sessionId)) {
+        continue;
+      }
+
+      const fullPath = path.join(sessionDir, file);
+      try {
+        const stats = statSync(fullPath);
+
+        // Try to extract skill from first line of JSONL (lazy - only read if needed)
+        let skill = 'CLI Session';
+        try {
+          // Read just the first few KB to find skill info
+          const fd = require('fs').openSync(fullPath, 'r');
+          const buffer = Buffer.alloc(4096);
+          require('fs').readSync(fd, buffer, 0, 4096, 0);
+          require('fs').closeSync(fd);
+
+          const firstLines = buffer.toString('utf-8').split('\n').slice(0, 5);
+          for (const line of firstLines) {
+            if (!line.trim()) continue;
+            try {
+              const msg = JSON.parse(line);
+              // Look for skill in various places
+              if (msg.skill) {
+                skill = msg.skill;
+                break;
+              }
+              if (msg.message?.content && typeof msg.message.content === 'string') {
+                // Check for /flow.* commands in first user message
+                const flowMatch = msg.message.content.match(/\/flow\.(\w+)/);
+                if (flowMatch) {
+                  skill = `flow.${flowMatch[1]}`;
+                  break;
+                }
+              }
+            } catch {
+              // Invalid JSON line, continue
+            }
+          }
+        } catch {
+          // Could not read file content, use default skill
+        }
+
+        // Determine status based on file age
+        const fileAgeMs = Date.now() - stats.mtime.getTime();
+        const isRecent = fileAgeMs < 30 * 60 * 1000; // 30 minutes
+        const status: WorkflowIndexEntry['status'] = isRecent ? 'detached' : 'completed';
+
+        entries.push({
+          sessionId,
+          executionId: uuidv4(), // Generate placeholder ID for CLI sessions
+          skill,
+          status,
+          startedAt: stats.birthtime.toISOString(),
+          updatedAt: stats.mtime.toISOString(),
+          costUsd: 0, // Unknown for CLI sessions
+        });
+      } catch {
+        // Could not stat file, skip
+      }
+    }
+
+    // Sort by updatedAt descending (newest first)
+    entries.sort((a, b) => new Date(b.updatedAt).getTime() - new Date(a.updatedAt).getTime());
+
+    // Return limited number
+    return entries.slice(0, limit);
+  } catch {
+    return [];
+  }
+}
+
+/**
+ * Handle workflow index file change.
+ * Merges dashboard-tracked sessions with discovered CLI sessions.
  */
 async function handleWorkflowChange(projectId: string, indexPath: string): Promise<void> {
   const index = await readWorkflowIndex(indexPath);
   if (!index) return;
 
-  const data = buildWorkflowData(index);
+  // Get project path for CLI session discovery
+  const projectPath = projectPathMap.get(projectId);
+
+  // Get tracked session IDs to avoid duplicates
+  const trackedSessionIds = new Set<string>(
+    index.sessions.map(s => s.sessionId)
+  );
+
+  // Discover CLI sessions that aren't tracked by dashboard
+  const cliSessions = projectPath
+    ? discoverCliSessions(projectPath, trackedSessionIds, 50)
+    : [];
+
+  // Merge sessions: dashboard-tracked first, then CLI-discovered
+  const allSessions = [
+    ...index.sessions,
+    ...cliSessions,
+  ];
+
+  // Sort all sessions by updatedAt (newest first)
+  allSessions.sort((a, b) =>
+    new Date(b.updatedAt).getTime() - new Date(a.updatedAt).getTime()
+  );
+
+  // Build workflow data with merged sessions
+  const activeStates = ['running', 'waiting_for_input', 'detached', 'stale'];
+  const currentExecution = allSessions.find(s => activeStates.includes(s.status)) ?? null;
+
+  const data: WorkflowData = {
+    currentExecution,
+    sessions: allSessions.slice(0, 100), // Limit to 100 total sessions
+  };
 
   // Check if data actually changed (avoid duplicate broadcasts)
   const dataJson = JSON.stringify(data);
@@ -430,10 +631,32 @@ async function updateWatchedPaths(registry: Registry): Promise<void> {
       watcher.add(workflowIndexPath);
       console.log(`[Watcher] Added workflow index: ${workflowIndexPath}`);
 
-      // Broadcast initial workflow data
+      // Broadcast initial workflow data (including CLI sessions)
       const index = await readWorkflowIndex(workflowIndexPath);
       if (index) {
-        const data = buildWorkflowData(index);
+        // Get tracked session IDs to avoid duplicates
+        const trackedSessionIds = new Set<string>(
+          index.sessions.map(s => s.sessionId)
+        );
+
+        // Discover CLI sessions
+        const cliSessions = discoverCliSessions(project.path, trackedSessionIds, 50);
+
+        // Merge sessions
+        const allSessions = [...index.sessions, ...cliSessions];
+        allSessions.sort((a, b) =>
+          new Date(b.updatedAt).getTime() - new Date(a.updatedAt).getTime()
+        );
+
+        // Build workflow data with merged sessions
+        const activeStates = ['running', 'waiting_for_input', 'detached', 'stale'];
+        const currentExecution = allSessions.find(s => activeStates.includes(s.status)) ?? null;
+
+        const data: WorkflowData = {
+          currentExecution,
+          sessions: allSessions.slice(0, 100),
+        };
+
         workflowCache.set(projectId, JSON.stringify(data));
         broadcast({
           type: 'workflow',
@@ -603,8 +826,22 @@ export async function initWatcher(): Promise<void> {
   currentRegistry = await readRegistry();
   if (currentRegistry) {
     await updateWatchedPaths(currentRegistry);
+    updateProjectPathMap(); // For session watching
+
+    // G5.10: Reconcile runners for all registered projects on startup
+    // This detects orphaned runner state files from crashed processes
+    for (const [projectId, project] of Object.entries(currentRegistry.projects)) {
+      try {
+        reconcileRunners(project.path);
+      } catch (error) {
+        console.error(`[Watcher] Error reconciling runners for ${projectId}:`, error);
+      }
+    }
   }
 
+  // Initialize session file watcher
+  await initSessionWatcher();
+
   console.log('[Watcher] Initialized successfully');
 }
 
@@ -676,7 +913,8 @@ export async function getAllTasks(): Promise<Map<string, TasksData>> {
 }
 
 /**
- * Get all current workflow data for registered projects
+ * Get all current workflow data for registered projects.
+ * Includes both dashboard-tracked sessions AND discovered CLI sessions.
  */
 export async function getAllWorkflows(): Promise<Map<string, WorkflowData>> {
   const workflows = new Map<string, WorkflowData>();
@@ -686,12 +924,38 @@ export async function getAllWorkflows(): Promise<Map<string, WorkflowData>> {
   for (const [projectId, project] of Object.entries(currentRegistry.projects)) {
     const workflowIndexPath = path.join(project.path, '.specflow', 'workflows', 'index.json');
     const index = await readWorkflowIndex(workflowIndexPath);
-    if (index) {
-      const data = buildWorkflowData(index);
-      workflows.set(projectId, data);
-      // Update cache
-      workflowCache.set(projectId, JSON.stringify(data));
-    }
+
+    // Get tracked session IDs to avoid duplicates
+    const trackedSessionIds = new Set<string>(
+      index?.sessions.map(s => s.sessionId) ?? []
+    );
+
+    // Discover CLI sessions that aren't tracked by dashboard
+    const cliSessions = discoverCliSessions(project.path, trackedSessionIds, 50);
+
+    // Merge sessions: dashboard-tracked first, then CLI-discovered
+    const allSessions = [
+      ...(index?.sessions ?? []),
+      ...cliSessions,
+    ];
+
+    // Sort all sessions by updatedAt (newest first)
+    allSessions.sort((a, b) =>
+      new Date(b.updatedAt).getTime() - new Date(a.updatedAt).getTime()
+    );
+
+    // Build workflow data with merged sessions
+    const activeStates = ['running', 'waiting_for_input', 'detached', 'stale'];
+    const currentExecution = allSessions.find(s => activeStates.includes(s.status)) ?? null;
+
+    const data: WorkflowData = {
+      currentExecution,
+      sessions: allSessions.slice(0, 100), // Limit to 100 total sessions
+    };
+
+    workflows.set(projectId, data);
+    // Update cache
+    workflowCache.set(projectId, JSON.stringify(data));
   }
 
   return workflows;
@@ -718,6 +982,416 @@ export async function getAllPhases(): Promise<Map<string, PhasesData>> {
   return phases;
 }
 
+/**
+ * Session data with project context for initial load
+ */
+export interface SessionWithProject {
+  projectId: string;
+  sessionId: string;
+  content: SessionContent;
+}
+
+// Staleness threshold - sessions not modified in 30 minutes are considered stale
+const SESSION_STALE_MS = 30 * 60 * 1000;
+
+/**
+ * Check if a session file is stale (not modified recently)
+ */
+async function isSessionStale(sessionPath: string): Promise<boolean> {
+  try {
+    const stat = await fs.stat(sessionPath);
+    const age = Date.now() - stat.mtimeMs;
+    return age > SESSION_STALE_MS;
+  } catch {
+    return true; // File doesn't exist or can't be accessed
+  }
+}
+
+/**
+ * Get all current session content for active sessions
+ * Called on SSE connect to send initial session data
+ */
+export async function getAllSessions(): Promise<SessionWithProject[]> {
+  const sessions: SessionWithProject[] = [];
+
+  if (!currentRegistry) return sessions;
+
+  // Get workflow data to find active sessions
+  const workflows = await getAllWorkflows();
+
+  for (const [projectId, project] of Object.entries(currentRegistry.projects)) {
+    const workflowData = workflows.get(projectId);
+    if (!workflowData) continue;
+
+    // Collect session IDs to load - current execution and recent active sessions
+    const sessionIdsToLoad: string[] = [];
+
+    // Add current execution's session if it's active
+    if (workflowData.currentExecution) {
+      const status = workflowData.currentExecution.status;
+      if (status === 'running' || status === 'waiting_for_input' || status === 'detached') {
+        sessionIdsToLoad.push(workflowData.currentExecution.sessionId);
+      }
+    }
+
+    // Also check recent sessions that might be active
+    for (const session of workflowData.sessions) {
+      const status = session.status;
+      if ((status === 'running' || status === 'waiting_for_input' || status === 'detached') &&
+          !sessionIdsToLoad.includes(session.sessionId)) {
+        sessionIdsToLoad.push(session.sessionId);
+      }
+    }
+
+    // Load content for each session (skip stale sessions)
+    const sessionDir = getSessionDirectory(project.path);
+    for (const sessionId of sessionIdsToLoad) {
+      const sessionPath = path.join(sessionDir, `${sessionId}.jsonl`);
+      try {
+        // Skip stale sessions - they're marked as "running" but haven't been modified recently
+        if (await isSessionStale(sessionPath)) {
+          console.log(`[Watcher] Skipping stale session ${sessionId} (not modified in 30+ minutes)`);
+          continue;
+        }
+
+        const content = await parseSessionContent(sessionPath);
+        if (content) {
+          // Update caches for future change detection
+          sessionProjectMap.set(sessionId, projectId);
+          sessionCache.set(sessionId, JSON.stringify(content));
+
+          sessions.push({ projectId, sessionId, content });
+        }
+      } catch (error) {
+        // Session file might not exist yet or is inaccessible
+        console.log(`[Watcher] Could not load session ${sessionId} for project ${projectId}:`, error);
+      }
+    }
+  }
+
+  return sessions;
+}
+
+// ============================================================================
+// Session File Watching (T011-T015)
+// ============================================================================
+
+import { parseSessionLines, type SessionData } from './session-parser';
+
+/**
+ * Map of projectId to projectPath for session directory lookup
+ */
+const projectPathMap: Map<string, string> = new Map();
+
+/**
+ * Map of sessionId to projectId for event broadcasting
+ */
+const sessionProjectMap: Map<string, string> = new Map();
+
+/**
+ * Get session directory path for a project
+ * T011: Uses getProjectSessionDir from project-hash.ts
+ */
+function getSessionDirectory(projectPath: string): string {
+  return getProjectSessionDir(projectPath);
+}
+
+/**
+ * Parse session JSONL file and return SessionContent for SSE
+ * T013/T014: Parse JSONL and extract messages
+ */
+async function parseSessionContent(sessionPath: string): Promise<SessionContent | null> {
+  try {
+    const content = await fs.readFile(sessionPath, 'utf-8');
+    const lines = content.split('\n').filter(line => line.trim());
+    const sessionData = parseSessionLines(lines);
+
+    if (!sessionData || sessionData.messages.length === 0) {
+      return null;
+    }
+
+    return {
+      messages: sessionData.messages,
+      filesModified: Array.from(sessionData.filesModified),
+      elapsedMs: calculateElapsedMs(sessionData.startTime),
+      currentTodos: sessionData.currentTodos,
+      workflowOutput: sessionData.workflowOutput,
+      agentTasks: sessionData.agentTasks,
+    };
+  } catch (error) {
+    console.error(`[Watcher] Error parsing session file ${sessionPath}:`, error);
+    return null;
+  }
+}
+
+/**
+ * Calculate elapsed time from start time
+ */
+function calculateElapsedMs(startTime?: string): number {
+  if (!startTime) return 0;
+  try {
+    return Date.now() - new Date(startTime).getTime();
+  } catch {
+    return 0;
+  }
+}
+
+/**
+ * Extract questions from session content for session:question events
+ * T015: Detect AskUserQuestion tool calls AND structured_output questions (CLI mode)
+ */
+function extractPendingQuestions(content: SessionContent): SessionQuestion[] {
+  const questions: SessionQuestion[] = [];
+
+  // Helper to process a questions array
+  const processQuestions = (questionList: unknown[]) => {
+    for (const q of questionList) {
+      if (typeof q === 'object' && q !== null && 'question' in q) {
+        const qObj = q as Record<string, unknown>;
+        // Map to SessionQuestion format, ensuring description has a default value
+        const options = Array.isArray(qObj.options)
+          ? qObj.options.map((opt: { label: string; description?: string }) => ({
+              label: opt.label,
+              description: opt.description ?? '', // Default to empty string
+            }))
+          : [];
+
+        questions.push({
+          question: String(qObj.question),
+          header: typeof qObj.header === 'string' ? qObj.header : undefined,
+          options,
+          multiSelect: typeof qObj.multiSelect === 'boolean' ? qObj.multiSelect : undefined,
+        });
+      }
+    }
+  };
+
+  for (const message of content.messages) {
+    // Check for AskUserQuestion tool calls (interactive mode)
+    if (message.role === 'assistant' && message.toolCalls) {
+      for (const toolCall of message.toolCalls) {
+        if (toolCall.name === 'AskUserQuestion' && toolCall.input) {
+          const input = toolCall.input as Record<string, unknown>;
+          const questionList = input?.questions;
+          if (Array.isArray(questionList)) {
+            processQuestions(questionList);
+          }
+        }
+      }
+    }
+
+    // Check for structured_output questions (CLI/workflow mode)
+    // In CLI mode, questions are in the result's structured_output when status is 'needs_input'
+    const msgAny = message as Record<string, unknown>;
+    if (msgAny.type === 'result' && msgAny.structured_output) {
+      const structured = msgAny.structured_output as Record<string, unknown>;
+      if (structured.status === 'needs_input' && Array.isArray(structured.questions)) {
+        processQuestions(structured.questions);
+      }
+    }
+  }
+
+  return questions;
+}
+
+/**
+ * Handle session file change
+ * T013: Called when JSONL file changes, parses and broadcasts events
+ */
+async function handleSessionFileChange(sessionPath: string): Promise<void> {
+  const sessionId = path.basename(sessionPath, '.jsonl');
+  const projectId = sessionProjectMap.get(sessionId);
+
+  console.log(`[Watcher] Session file change: ${sessionId}, cached projectId: ${projectId || 'none'}`);
+
+  if (!projectId) {
+    // Try to find project from path
+    const claudeProjectsDir = getClaudeProjectsDir();
+    const relativePath = sessionPath.replace(claudeProjectsDir + path.sep, '');
+    const dirName = relativePath.split(path.sep)[0];
+
+    console.log(`[Watcher] Looking up project for session ${sessionId}: dir=${dirName}, projectPathMap size=${projectPathMap.size}`);
+
+    // Find project with matching hash
+    for (const [id, projectPath] of projectPathMap.entries()) {
+      const expectedDir = path.basename(getSessionDirectory(projectPath));
+      console.log(`[Watcher]   Checking project ${id}: expectedDir=${expectedDir}, match=${dirName === expectedDir}`);
+      if (dirName === expectedDir) {
+        sessionProjectMap.set(sessionId, id);
+        console.log(`[Watcher]   Matched! Setting sessionProjectMap[${sessionId}] = ${id}`);
+        break;
+      }
+    }
+  }
+
+  const resolvedProjectId = sessionProjectMap.get(sessionId);
+  if (!resolvedProjectId) {
+    // Session from external CLI not registered with dashboard - this is expected
+    console.log(`[Watcher] Could not resolve projectId for session ${sessionId}, skipping`);
+    return;
+  }
+
+  console.log(`[Watcher] Processing session ${sessionId} for project ${resolvedProjectId}`);
+
+  const content = await parseSessionContent(sessionPath);
+  if (!content) return;
+
+  // Check if content actually changed
+  const cacheKey = sessionId;
+  const contentJson = JSON.stringify(content);
+  if (sessionCache.get(cacheKey) === contentJson) {
+    return; // No actual change
+  }
+  sessionCache.set(cacheKey, contentJson);
+
+  // G6.6: Update orchestration activity when external session activity is detected
+  const projectPath = projectPathMap.get(resolvedProjectId);
+  if (projectPath) {
+    const activeOrchestration = orchestrationService.getActive(projectPath);
+    if (activeOrchestration) {
+      orchestrationService.touchActivity(projectPath, activeOrchestration.id);
+    }
+  }
+
+  // Broadcast session:message event
+  console.log(`[Watcher] Broadcasting session:message for ${sessionId} (${content.messages.length} messages)`);
+  broadcast({
+    type: 'session:message',
+    timestamp: new Date().toISOString(),
+    projectId: resolvedProjectId,
+    sessionId,
+    data: content,
+  });
+
+  // Check for pending questions
+  const questions = extractPendingQuestions(content);
+  if (questions.length > 0) {
+    broadcast({
+      type: 'session:question',
+      timestamp: new Date().toISOString(),
+      projectId: resolvedProjectId,
+      sessionId,
+      data: { questions },
+    });
+  }
+
+  // Check for session end
+  if (content.messages.some(m => m.isSessionEnd)) {
+    broadcast({
+      type: 'session:end',
+      timestamp: new Date().toISOString(),
+      projectId: resolvedProjectId,
+      sessionId,
+    });
+  }
+}
+
+/**
+ * Find project ID for a session file path
+ * Used for emitting session:created and session:activity events (G6.4, G6.5)
+ */
+function findProjectIdForSession(sessionPath: string): string | undefined {
+  const claudeProjectsDir = getClaudeProjectsDir();
+  const relativePath = sessionPath.replace(claudeProjectsDir + path.sep, '');
+  const dirName = relativePath.split(path.sep)[0];
+
+  // Find project with matching hash
+  for (const [id, projectPath] of projectPathMap.entries()) {
+    const expectedDir = path.basename(getSessionDirectory(projectPath));
+    if (dirName === expectedDir) {
+      return id;
+    }
+  }
+  return undefined;
+}
+
+/**
+ * Initialize session file watcher
+ * T012: Watch ~/.claude/projects/{hash}/*.jsonl files
+ */
+async function initSessionWatcher(): Promise<void> {
+  if (sessionWatcher) return; // Already initialized
+
+  const claudeProjectsDir = getClaudeProjectsDir();
+  console.log(`[Watcher] Initializing session watcher for ${claudeProjectsDir}`);
+
+  // Build mapping of project paths
+  if (currentRegistry) {
+    for (const [projectId, project] of Object.entries(currentRegistry.projects)) {
+      projectPathMap.set(projectId, project.path);
+    }
+  }
+
+  // Watch all JSONL files in the Claude projects directory
+  sessionWatcher = chokidar.watch(`${claudeProjectsDir}/**/*.jsonl`, {
+    persistent: true,
+    ignoreInitial: true, // Don't emit events for existing files
+    awaitWriteFinish: {
+      stabilityThreshold: SESSION_DEBOUNCE_MS,
+      pollInterval: 50,
+    },
+    depth: 2, // Only go 2 levels deep (project dir -> session file)
+  });
+
+  // Handle session file changes (G6.5: session:activity)
+  sessionWatcher.on('change', (filePath) => {
+    debouncedChange(filePath, async () => {
+      await handleSessionFileChange(filePath);
+      // G6.5: Emit session:activity for file modifications
+      const sessionId = path.basename(filePath, '.jsonl');
+      const projectId = sessionProjectMap.get(sessionId) || findProjectIdForSession(filePath);
+      if (projectId) {
+        broadcast({
+          type: 'session:activity',
+          timestamp: new Date().toISOString(),
+          projectId,
+          sessionId,
+        });
+      }
+    });
+  });
+
+  // Handle new session files (G6.4: session:created)
+  sessionWatcher.on('add', (filePath) => {
+    debouncedChange(filePath, async () => {
+      await handleSessionFileChange(filePath);
+      // G6.4: Emit session:created for new files
+      const sessionId = path.basename(filePath, '.jsonl');
+      const projectId = sessionProjectMap.get(sessionId) || findProjectIdForSession(filePath);
+      if (projectId) {
+        broadcast({
+          type: 'session:created',
+          timestamp: new Date().toISOString(),
+          projectId,
+          sessionId,
+        });
+      }
+    });
+  });
+
+  sessionWatcher.on('error', (error) => {
+    console.error('[Watcher] Session watcher error:', error);
+  });
+
+  console.log('[Watcher] Session watcher initialized');
+}
+
+/**
+ * Update project path mapping when registry changes
+ */
+function updateProjectPathMap(): void {
+  projectPathMap.clear();
+  if (currentRegistry) {
+    for (const [projectId, project] of Object.entries(currentRegistry.projects)) {
+      projectPathMap.set(projectId, project.path);
+    }
+  }
+}
+
+// ============================================================================
+// End Session File Watching
+// ============================================================================
+
 /**
  * Start heartbeat timer for a listener
  */
@@ -742,12 +1416,23 @@ export async function closeWatcher(): Promise<void> {
     watchedTasksPaths.clear();
     watchedWorkflowPaths.clear();
     watchedPhasesPaths.clear();
+    watchedSessionDirs.clear();
     projectTasksPaths.clear();
     workflowCache.clear();
     phasesCache.clear();
+    sessionCache.clear();
+    projectPathMap.clear();
+    sessionProjectMap.clear();
     currentRegistry = null;
     debounceTimers.forEach((timer) => clearTimeout(timer));
     debounceTimers.clear();
     console.log('[Watcher] Closed');
   }
+
+  // Close session watcher
+  if (sessionWatcher) {
+    await sessionWatcher.close();
+    sessionWatcher = null;
+    console.log('[Watcher] Session watcher closed');
+  }
 }
diff --git a/packages/dashboard/tests/e2e/orchestration-harness.test.ts b/packages/dashboard/tests/e2e/orchestration-harness.test.ts
new file mode 100644
index 0000000..cc0e974
--- /dev/null
+++ b/packages/dashboard/tests/e2e/orchestration-harness.test.ts
@@ -0,0 +1,245 @@
+/**
+ * E2E Test Harness for Orchestration
+ * T123/G12.29-35: End-to-end orchestration testing
+ *
+ * This harness allows running orchestration flows in a controlled test environment
+ * with mock services and filesystem isolation.
+ *
+ * Usage:
+ *   pnpm test:e2e:orchestration
+ *   pnpm test:e2e:orchestration --scenario design-only
+ *   pnpm test:e2e:orchestration --scenario full-flow
+ */
+
+import { describe, it, expect, beforeAll, afterAll, vi } from 'vitest';
+import { mkdtempSync, rmSync, mkdirSync, writeFileSync } from 'fs';
+import { join } from 'path';
+import { tmpdir } from 'os';
+
+// =============================================================================
+// Test Environment Setup
+// =============================================================================
+
+interface TestEnvironment {
+  projectPath: string;
+  projectId: string;
+  cleanup: () => void;
+}
+
+/**
+ * Create an isolated test project directory
+ */
+function createTestProject(name: string = 'e2e-test'): TestEnvironment {
+  const projectPath = mkdtempSync(join(tmpdir(), `specflow-e2e-${name}-`));
+  const projectId = `e2e-${name}-${Date.now()}`;
+
+  // Create required directories
+  mkdirSync(join(projectPath, '.specflow', 'workflows'), { recursive: true });
+  mkdirSync(join(projectPath, 'specs', '0001-test-phase'), { recursive: true });
+
+  // Create minimal spec.md
+  writeFileSync(
+    join(projectPath, 'specs', '0001-test-phase', 'spec.md'),
+    `# Test Phase Specification\n\n## Requirements\n- REQ-001: Test requirement\n`
+  );
+
+  // Create minimal plan.md
+  writeFileSync(
+    join(projectPath, 'specs', '0001-test-phase', 'plan.md'),
+    `# Test Phase Plan\n\n## Architecture\nSimple test implementation\n`
+  );
+
+  // Create minimal tasks.md
+  writeFileSync(
+    join(projectPath, 'specs', '0001-test-phase', 'tasks.md'),
+    `# Tasks: 0001 Test Phase\n\n## Phase 1: Setup\n- [ ] T001 Create test file\n- [ ] T002 Add configuration\n`
+  );
+
+  return {
+    projectPath,
+    projectId,
+    cleanup: () => rmSync(projectPath, { recursive: true, force: true }),
+  };
+}
+
+// =============================================================================
+// Mock Service Factory
+// =============================================================================
+
+interface MockServices {
+  orchestrationService: {
+    get: ReturnType<typeof vi.fn>;
+    start: ReturnType<typeof vi.fn>;
+    transitionToNextPhase: ReturnType<typeof vi.fn>;
+    linkWorkflowExecution: ReturnType<typeof vi.fn>;
+    completeBatch: ReturnType<typeof vi.fn>;
+    failBatch: ReturnType<typeof vi.fn>;
+    fail: ReturnType<typeof vi.fn>;
+    pause: ReturnType<typeof vi.fn>;
+    resume: ReturnType<typeof vi.fn>;
+  };
+  workflowService: {
+    get: ReturnType<typeof vi.fn>;
+    start: ReturnType<typeof vi.fn>;
+    findActiveByOrchestration: ReturnType<typeof vi.fn>;
+    hasActiveWorkflow: ReturnType<typeof vi.fn>;
+  };
+}
+
+/**
+ * Create mock services for E2E testing
+ */
+function createMockServices(): MockServices {
+  return {
+    orchestrationService: {
+      get: vi.fn(),
+      start: vi.fn(),
+      transitionToNextPhase: vi.fn(),
+      linkWorkflowExecution: vi.fn(),
+      completeBatch: vi.fn(),
+      failBatch: vi.fn(),
+      fail: vi.fn(),
+      pause: vi.fn(),
+      resume: vi.fn(),
+    },
+    workflowService: {
+      get: vi.fn(),
+      start: vi.fn(() => Promise.resolve({ id: 'wf-e2e-001', status: 'running' })),
+      findActiveByOrchestration: vi.fn(() => []),
+      hasActiveWorkflow: vi.fn(() => false),
+    },
+  };
+}
+
+// =============================================================================
+// Test Scenarios
+// =============================================================================
+
+/**
+ * Scenario: Design phase only (skipAnalyze, skipImplement)
+ */
+async function runDesignOnlyScenario(env: TestEnvironment, services: MockServices) {
+  // Setup: Orchestration starts at design
+  const orchestration = {
+    id: 'orch-e2e-001',
+    projectId: env.projectId,
+    status: 'running' as const,
+    currentPhase: 'design' as const,
+    config: {
+      skipDesign: false,
+      skipAnalyze: true,
+      autoMerge: false,
+      autoHealEnabled: false,
+      maxHealAttempts: 0,
+      batchSizeFallback: 15,
+      pauseBetweenBatches: false,
+      additionalContext: '',
+      budget: { maxPerBatch: 5, maxTotal: 50, healingBudget: 2, decisionBudget: 0.5 },
+    },
+    batches: { total: 0, current: 0, items: [] },
+    executions: { implement: [], healers: [] },
+    startedAt: new Date().toISOString(),
+    updatedAt: new Date().toISOString(),
+    decisionLog: [],
+    totalCostUsd: 0,
+  };
+
+  services.orchestrationService.get.mockReturnValue(orchestration);
+
+  // Simulate workflow completion
+  services.workflowService.get.mockReturnValue({ id: 'wf-design', status: 'completed' });
+
+  return { orchestration, services };
+}
+
+/**
+ * Scenario: Full orchestration flow
+ */
+async function runFullFlowScenario(env: TestEnvironment, services: MockServices) {
+  const orchestration = {
+    id: 'orch-e2e-full',
+    projectId: env.projectId,
+    status: 'running' as const,
+    currentPhase: 'design' as const,
+    config: {
+      skipDesign: false,
+      skipAnalyze: false,
+      autoMerge: true,
+      autoHealEnabled: true,
+      maxHealAttempts: 2,
+      batchSizeFallback: 15,
+      pauseBetweenBatches: false,
+      additionalContext: '',
+      budget: { maxPerBatch: 5, maxTotal: 50, healingBudget: 2, decisionBudget: 0.5 },
+    },
+    batches: {
+      total: 1,
+      current: 0,
+      items: [{ index: 0, section: 'Setup', taskIds: ['T001', 'T002'], status: 'pending' as const, healAttempts: 0 }],
+    },
+    executions: { implement: [], healers: [] },
+    startedAt: new Date().toISOString(),
+    updatedAt: new Date().toISOString(),
+    decisionLog: [],
+    totalCostUsd: 0,
+  };
+
+  services.orchestrationService.get.mockReturnValue(orchestration);
+
+  return { orchestration, services };
+}
+
+// =============================================================================
+// E2E Test Suite
+// =============================================================================
+
+describe('Orchestration E2E', () => {
+  let env: TestEnvironment;
+  let services: MockServices;
+
+  beforeAll(() => {
+    env = createTestProject();
+    services = createMockServices();
+  });
+
+  afterAll(() => {
+    env.cleanup();
+  });
+
+  describe('Test Environment', () => {
+    it('should create isolated test project', () => {
+      expect(env.projectPath).toBeDefined();
+      expect(env.projectId).toContain('e2e');
+    });
+
+    it('should have required project structure', async () => {
+      const { existsSync } = await import('fs');
+      expect(existsSync(join(env.projectPath, '.specflow'))).toBe(true);
+      expect(existsSync(join(env.projectPath, 'specs', '0001-test-phase', 'spec.md'))).toBe(true);
+      expect(existsSync(join(env.projectPath, 'specs', '0001-test-phase', 'tasks.md'))).toBe(true);
+    });
+  });
+
+  describe('Design Only Scenario', () => {
+    it('should setup design-only orchestration', async () => {
+      const { orchestration } = await runDesignOnlyScenario(env, services);
+      expect(orchestration.currentPhase).toBe('design');
+      expect(orchestration.config.skipAnalyze).toBe(true);
+    });
+  });
+
+  describe('Full Flow Scenario', () => {
+    it('should setup full flow orchestration', async () => {
+      const { orchestration } = await runFullFlowScenario(env, services);
+      expect(orchestration.currentPhase).toBe('design');
+      expect(orchestration.config.autoMerge).toBe(true);
+      expect(orchestration.batches.total).toBe(1);
+    });
+  });
+});
+
+// =============================================================================
+// CLI Runner (for standalone execution)
+// =============================================================================
+
+export { createTestProject, createMockServices, runDesignOnlyScenario, runFullFlowScenario };
diff --git a/packages/dashboard/tests/fixtures/jsonl/helpers.ts b/packages/dashboard/tests/fixtures/jsonl/helpers.ts
new file mode 100644
index 0000000..d6d337d
--- /dev/null
+++ b/packages/dashboard/tests/fixtures/jsonl/helpers.ts
@@ -0,0 +1,63 @@
+/**
+ * JSONL test fixture helpers
+ * T122/G12.8: Utilities for loading and parsing JSONL test data
+ */
+
+import { readFileSync } from 'fs';
+import { join, dirname } from 'path';
+import { fileURLToPath } from 'url';
+
+// Get fixtures directory path
+const __dirname = dirname(fileURLToPath(import.meta.url));
+
+/**
+ * Load a JSONL fixture file and parse each line
+ */
+export function loadJsonlFixture<T = unknown>(filename: string): T[] {
+  const filepath = join(__dirname, filename);
+  const content = readFileSync(filepath, 'utf-8');
+  return content
+    .split('\n')
+    .filter((line) => line.trim())
+    .map((line) => JSON.parse(line) as T);
+}
+
+/**
+ * Load the sample session fixture
+ */
+export function loadSampleSession() {
+  return loadJsonlFixture('sample-session.jsonl');
+}
+
+/**
+ * Load the workflow events fixture
+ */
+export function loadWorkflowEvents() {
+  return loadJsonlFixture('workflow-events.jsonl');
+}
+
+/**
+ * Create a temporary JSONL file for testing
+ */
+export function createTempJsonlContent(events: unknown[]): string {
+  return events.map((e) => JSON.stringify(e)).join('\n');
+}
+
+/**
+ * Sample session event types
+ */
+export interface SessionEvent {
+  type: 'init' | 'user' | 'assistant' | 'tool_use' | 'tool_result' | 'end';
+  timestamp: string;
+  [key: string]: unknown;
+}
+
+/**
+ * Sample workflow event types
+ */
+export interface WorkflowEvent {
+  type: 'workflow_start' | 'workflow_progress' | 'workflow_complete';
+  timestamp: string;
+  workflowId: string;
+  [key: string]: unknown;
+}
diff --git a/packages/dashboard/tests/fixtures/jsonl/sample-session.jsonl b/packages/dashboard/tests/fixtures/jsonl/sample-session.jsonl
new file mode 100644
index 0000000..249948a
--- /dev/null
+++ b/packages/dashboard/tests/fixtures/jsonl/sample-session.jsonl
@@ -0,0 +1,10 @@
+{"type":"init","timestamp":"2026-01-24T10:00:00.000Z","sessionId":"test-session-001","projectPath":"/test/project"}
+{"type":"user","timestamp":"2026-01-24T10:00:01.000Z","message":"Help me implement feature X"}
+{"type":"assistant","timestamp":"2026-01-24T10:00:02.000Z","message":"I'll help you implement feature X. Let me start by..."}
+{"type":"tool_use","timestamp":"2026-01-24T10:00:03.000Z","tool":"Read","input":{"file_path":"/test/project/src/index.ts"}}
+{"type":"tool_result","timestamp":"2026-01-24T10:00:04.000Z","tool":"Read","output":"export function main() { ... }"}
+{"type":"assistant","timestamp":"2026-01-24T10:00:05.000Z","message":"I can see the main function. Now let me add the feature..."}
+{"type":"tool_use","timestamp":"2026-01-24T10:00:06.000Z","tool":"Edit","input":{"file_path":"/test/project/src/index.ts","old_string":"export function main()","new_string":"export function main(options: Options)"}}
+{"type":"tool_result","timestamp":"2026-01-24T10:00:07.000Z","tool":"Edit","output":"File updated successfully"}
+{"type":"assistant","timestamp":"2026-01-24T10:00:08.000Z","message":"I've added the options parameter. The feature is now implemented."}
+{"type":"end","timestamp":"2026-01-24T10:00:09.000Z","reason":"completed"}
diff --git a/packages/dashboard/tests/fixtures/jsonl/workflow-events.jsonl b/packages/dashboard/tests/fixtures/jsonl/workflow-events.jsonl
new file mode 100644
index 0000000..5702931
--- /dev/null
+++ b/packages/dashboard/tests/fixtures/jsonl/workflow-events.jsonl
@@ -0,0 +1,5 @@
+{"type":"workflow_start","timestamp":"2026-01-24T10:00:00.000Z","workflowId":"wf-001","skill":"flow.design","orchestrationId":"orch-001"}
+{"type":"workflow_progress","timestamp":"2026-01-24T10:00:30.000Z","workflowId":"wf-001","phase":"discovery","progress":25}
+{"type":"workflow_progress","timestamp":"2026-01-24T10:01:00.000Z","workflowId":"wf-001","phase":"specification","progress":50}
+{"type":"workflow_progress","timestamp":"2026-01-24T10:01:30.000Z","workflowId":"wf-001","phase":"planning","progress":75}
+{"type":"workflow_complete","timestamp":"2026-01-24T10:02:00.000Z","workflowId":"wf-001","status":"completed","costUsd":0.15}
diff --git a/packages/dashboard/tests/fixtures/orchestration/helpers.ts b/packages/dashboard/tests/fixtures/orchestration/helpers.ts
new file mode 100644
index 0000000..f40f217
--- /dev/null
+++ b/packages/dashboard/tests/fixtures/orchestration/helpers.ts
@@ -0,0 +1,357 @@
+/**
+ * Shared test fixtures and helpers for orchestration tests
+ * T121/G12.5-9: Centralized test utilities
+ */
+
+import { vi } from 'vitest';
+import type {
+  OrchestrationExecution,
+  OrchestrationConfig,
+  OrchestrationPhase,
+  BatchTracking,
+  BatchItem,
+} from '@specflow/shared';
+import type { OrchestrationDeps } from '../../../src/lib/services/orchestration-runner';
+
+// =============================================================================
+// Default Configurations
+// =============================================================================
+
+/**
+ * Default orchestration config for tests
+ */
+export const defaultConfig: OrchestrationConfig = {
+  autoMerge: false,
+  additionalContext: '',
+  skipDesign: false,
+  skipAnalyze: false,
+  skipImplement: false,
+  skipVerify: false,
+  autoHealEnabled: true,
+  maxHealAttempts: 2,
+  batchSizeFallback: 15,
+  pauseBetweenBatches: false,
+  budget: {
+    maxPerBatch: 5,
+    maxTotal: 50,
+    healingBudget: 2,
+    decisionBudget: 0.5,
+  },
+};
+
+/**
+ * Config with all skips enabled (fast path)
+ */
+export const skipAllConfig: OrchestrationConfig = {
+  ...defaultConfig,
+  skipDesign: true,
+  skipAnalyze: true,
+  skipImplement: true,
+  skipVerify: true,
+};
+
+// =============================================================================
+// Batch Fixtures
+// =============================================================================
+
+/**
+ * Create a batch item with defaults
+ */
+export function createBatchItem(overrides: Partial<BatchItem> = {}): BatchItem {
+  return {
+    index: 0,
+    section: 'Test Section',
+    taskIds: ['T001', 'T002'],
+    status: 'pending',
+    healAttempts: 0,
+    ...overrides,
+  };
+}
+
+/**
+ * Create batch tracking with defaults
+ */
+export function createBatchTracking(overrides: Partial<BatchTracking> = {}): BatchTracking {
+  return {
+    total: 2,
+    current: 0,
+    items: [
+      createBatchItem({ index: 0, section: 'Phase 1', taskIds: ['T001', 'T002', 'T003'] }),
+      createBatchItem({ index: 1, section: 'Phase 2', taskIds: ['T004', 'T005'] }),
+    ],
+    ...overrides,
+  };
+}
+
+// =============================================================================
+// Execution Fixtures
+// =============================================================================
+
+/**
+ * Create an orchestration execution with defaults
+ */
+export function createOrchestration(
+  overrides: Partial<OrchestrationExecution> = {}
+): OrchestrationExecution {
+  const id = overrides.id || 'orch-test-123';
+  const projectId = overrides.projectId || 'project-test';
+
+  return {
+    id,
+    projectId,
+    status: 'running',
+    config: defaultConfig,
+    currentPhase: 'design',
+    batches: createBatchTracking(),
+    executions: {
+      implement: [],
+      healers: [],
+    },
+    startedAt: new Date().toISOString(),
+    updatedAt: new Date().toISOString(),
+    decisionLog: [],
+    totalCostUsd: 0,
+    ...overrides,
+  };
+}
+
+/**
+ * Create an orchestration at a specific phase
+ */
+export function createOrchestrationAtPhase(
+  phase: OrchestrationPhase,
+  overrides: Partial<OrchestrationExecution> = {}
+): OrchestrationExecution {
+  const executions: OrchestrationExecution['executions'] = {
+    implement: [],
+    healers: [],
+  };
+
+  // Add workflow IDs for completed phases
+  if (['analyze', 'implement', 'verify', 'merge', 'complete'].includes(phase)) {
+    executions.design = 'wf-design-done';
+  }
+  if (['implement', 'verify', 'merge', 'complete'].includes(phase)) {
+    executions.analyze = 'wf-analyze-done';
+  }
+  if (['verify', 'merge', 'complete'].includes(phase)) {
+    executions.implement = ['wf-impl-1', 'wf-impl-2'];
+  }
+  if (['merge', 'complete'].includes(phase)) {
+    executions.verify = 'wf-verify-done';
+  }
+
+  return createOrchestration({
+    currentPhase: phase,
+    executions,
+    ...overrides,
+  });
+}
+
+// =============================================================================
+// Workflow Fixtures
+// =============================================================================
+
+export interface MockWorkflow {
+  id: string;
+  status: 'running' | 'completed' | 'failed' | 'cancelled' | 'waiting_for_input';
+  error?: string;
+  costUsd?: number;
+}
+
+/**
+ * Create a mock workflow
+ */
+export function createWorkflow(overrides: Partial<MockWorkflow> = {}): MockWorkflow {
+  return {
+    id: 'wf-test-123',
+    status: 'running',
+    ...overrides,
+  };
+}
+
+// =============================================================================
+// Specflow Status Fixtures
+// =============================================================================
+
+export interface MockSpecflowStatus {
+  context?: {
+    hasSpec?: boolean;
+    hasPlan?: boolean;
+    hasTasks?: boolean;
+  };
+  progress?: {
+    tasksTotal?: number;
+    tasksComplete?: number;
+    percentage?: number;
+  };
+  orchestration?: {
+    step?: {
+      current?: string;
+      status?: string;
+    };
+  };
+}
+
+/**
+ * Create a mock specflow status
+ */
+export function createSpecflowStatus(overrides: Partial<MockSpecflowStatus> = {}): MockSpecflowStatus {
+  return {
+    context: {
+      hasSpec: true,
+      hasPlan: true,
+      hasTasks: true,
+      ...overrides.context,
+    },
+    progress: {
+      tasksTotal: 10,
+      tasksComplete: 0,
+      percentage: 0,
+      ...overrides.progress,
+    },
+    orchestration: {
+      step: {
+        current: 'design',
+        status: 'in_progress',
+        ...overrides.orchestration?.step,
+      },
+      ...overrides.orchestration,
+    },
+  };
+}
+
+/**
+ * Create status showing design phase complete
+ */
+export function createDesignCompleteStatus(): MockSpecflowStatus {
+  return createSpecflowStatus({
+    context: { hasSpec: true, hasPlan: true, hasTasks: true },
+  });
+}
+
+/**
+ * Create status showing all tasks complete
+ */
+export function createAllTasksCompleteStatus(): MockSpecflowStatus {
+  return createSpecflowStatus({
+    progress: { tasksTotal: 10, tasksComplete: 10, percentage: 100 },
+  });
+}
+
+// =============================================================================
+// Decision Input Fixtures
+// =============================================================================
+
+export interface MockDecisionInput {
+  step: { current: string; status: string };
+  phase: { hasUserGate?: boolean; userGateStatus?: string };
+  execution: OrchestrationExecution;
+  workflow?: MockWorkflow;
+  lastFileChangeTime?: number;
+  lookupFailures?: number;
+  currentTime?: number;
+}
+
+/**
+ * Create a decision input for testing makeDecision
+ */
+export function createDecisionInput(overrides: Partial<MockDecisionInput> = {}): MockDecisionInput {
+  return {
+    step: { current: 'design', status: 'in_progress' },
+    phase: {},
+    execution: createOrchestration(),
+    ...overrides,
+  };
+}
+
+// =============================================================================
+// Mock Dependencies (G12.9)
+// =============================================================================
+
+/**
+ * Create a complete mock of OrchestrationDeps for testing
+ *
+ * @param overrides - Optional overrides to customize specific mock functions
+ * @returns A fully mocked OrchestrationDeps object
+ *
+ * @example
+ * ```typescript
+ * const deps = createMockDeps({
+ *   readState: vi.fn().mockResolvedValue(customState),
+ * });
+ * ```
+ */
+export function createMockDeps(
+  overrides: Partial<OrchestrationDeps> = {}
+): OrchestrationDeps {
+  // Default mock orchestration service with all methods
+  const mockOrchestrationService = {
+    get: vi.fn().mockReturnValue(createOrchestration()),
+    create: vi.fn().mockReturnValue(createOrchestration()),
+    update: vi.fn(),
+    updateBatches: vi.fn(),
+    completeBatch: vi.fn(),
+    incrementHealAttempt: vi.fn(),
+    healBatch: vi.fn(),
+    canHealBatch: vi.fn().mockReturnValue(true),
+    fail: vi.fn(),
+    pause: vi.fn(),
+    resume: vi.fn(),
+    cancel: vi.fn(),
+    addCost: vi.fn(),
+    transitionToNextPhase: vi.fn(),
+    triggerMerge: vi.fn(),
+    linkWorkflowExecution: vi.fn(),
+    setNeedsAttention: vi.fn(),
+    list: vi.fn().mockReturnValue([]),
+    delete: vi.fn(),
+  };
+
+  // Default mock workflow service with all methods
+  const mockWorkflowService = {
+    start: vi.fn().mockResolvedValue(createWorkflow()),
+    get: vi.fn().mockReturnValue(createWorkflow()),
+    list: vi.fn().mockReturnValue([]),
+    cancel: vi.fn(),
+    hasActiveWorkflow: vi.fn().mockReturnValue(false),
+    findActiveByOrchestration: vi.fn().mockReturnValue([]),
+    cleanup: vi.fn(),
+  };
+
+  return {
+    // Required dependencies
+    orchestrationService: {
+      ...mockOrchestrationService,
+      ...overrides.orchestrationService,
+    } as unknown as OrchestrationDeps['orchestrationService'],
+
+    workflowService: {
+      ...mockWorkflowService,
+      ...overrides.workflowService,
+    } as unknown as OrchestrationDeps['workflowService'],
+
+    getNextPhase: overrides.getNextPhase ?? vi.fn().mockReturnValue('implement'),
+
+    isPhaseComplete: overrides.isPhaseComplete ?? vi.fn().mockReturnValue(false),
+
+    // Optional dependencies with sensible defaults
+    attemptHeal: overrides.attemptHeal ?? vi.fn().mockResolvedValue({
+      success: true,
+      cost: 0.01,
+      result: { status: 'fixed' },
+    }),
+
+    quickDecision: overrides.quickDecision ?? vi.fn().mockResolvedValue({
+      result: { action: 'wait', reason: 'Test decision' },
+      cost: 0.01,
+    }),
+
+    parseBatchesFromProject: overrides.parseBatchesFromProject ?? vi.fn().mockReturnValue({
+      batches: [
+        { section: 'Test Section', taskIds: ['T001', 'T002'], incomplete: 2 },
+      ],
+      totalIncomplete: 2,
+    }),
+  };
+}
diff --git a/packages/dashboard/tests/fixtures/orchestration/index.ts b/packages/dashboard/tests/fixtures/orchestration/index.ts
new file mode 100644
index 0000000..83beaef
--- /dev/null
+++ b/packages/dashboard/tests/fixtures/orchestration/index.ts
@@ -0,0 +1,6 @@
+/**
+ * Orchestration test fixtures
+ * T121/G12.5-9: Centralized test utilities
+ */
+
+export * from './helpers';
diff --git a/packages/dashboard/tests/orchestration/external-cli-detection.test.ts b/packages/dashboard/tests/orchestration/external-cli-detection.test.ts
new file mode 100644
index 0000000..500f910
--- /dev/null
+++ b/packages/dashboard/tests/orchestration/external-cli-detection.test.ts
@@ -0,0 +1,368 @@
+/**
+ * Tests for external CLI session detection via file watching.
+ *
+ * Tests that the watcher correctly detects:
+ * - New JSONL files created in the Claude projects directory
+ * - Modified JSONL files (session activity)
+ * - Emits correct SSE events ('session:created', 'session:activity')
+ *
+ * G11.11: External CLI detection test coverage
+ *
+ * This test focuses on verifying the session watcher behavior by testing
+ * the session file change handler logic directly, without requiring full
+ * watcher initialization which has complex fs dependencies.
+ */
+
+import { describe, it, expect, vi, beforeEach } from 'vitest';
+import type { SSEEvent } from '@specflow/shared';
+import path from 'path';
+
+describe('External CLI Detection', () => {
+  /**
+   * These tests verify the expected behavior of session file detection
+   * by testing the core logic patterns used in the watcher.
+   */
+
+  describe('Session ID extraction', () => {
+    /**
+     * The watcher extracts session IDs from JSONL file paths.
+     * Path format: ~/.claude/projects/{project-hash}/{session-id}.jsonl
+     */
+    function extractSessionId(filePath: string): string {
+      const basename = path.basename(filePath, '.jsonl');
+      return basename;
+    }
+
+    it('should extract session ID from JSONL file path', () => {
+      const filePath = '/Users/test/.claude/projects/-Users-test-my-project/abc123.jsonl';
+      expect(extractSessionId(filePath)).toBe('abc123');
+    });
+
+    it('should handle session IDs with hyphens', () => {
+      const filePath = '/Users/test/.claude/projects/-Users-test-my-project/session-abc-456.jsonl';
+      expect(extractSessionId(filePath)).toBe('session-abc-456');
+    });
+
+    it('should handle complex session IDs', () => {
+      const filePath = '/Users/test/.claude/projects/-Users-test-project/uuid-like-12345-abcdef.jsonl';
+      expect(extractSessionId(filePath)).toBe('uuid-like-12345-abcdef');
+    });
+  });
+
+  describe('Project path extraction', () => {
+    /**
+     * The watcher extracts project paths from the parent directory of JSONL files.
+     * The project hash is the directory name (e.g., -Users-test-my-project).
+     */
+    function extractProjectHash(filePath: string): string {
+      const dir = path.dirname(filePath);
+      return path.basename(dir);
+    }
+
+    it('should extract project hash from JSONL file path', () => {
+      const filePath = '/Users/test/.claude/projects/-Users-test-my-project/session.jsonl';
+      expect(extractProjectHash(filePath)).toBe('-Users-test-my-project');
+    });
+  });
+
+  describe('Session event creation', () => {
+    /**
+     * When a new JSONL file is detected, the watcher creates a session:created event.
+     * When a JSONL file is modified, it creates a session:activity event.
+     */
+    interface SessionEvent {
+      type: 'session:created' | 'session:activity' | 'session:message';
+      sessionId: string;
+      projectHash: string;
+      timestamp: string;
+      data?: {
+        messages: Array<{ role: string; content: string }>;
+      };
+    }
+
+    function createSessionCreatedEvent(filePath: string): SessionEvent {
+      return {
+        type: 'session:created',
+        sessionId: path.basename(filePath, '.jsonl'),
+        projectHash: path.basename(path.dirname(filePath)),
+        timestamp: new Date().toISOString(),
+      };
+    }
+
+    function createSessionActivityEvent(filePath: string): SessionEvent {
+      return {
+        type: 'session:activity',
+        sessionId: path.basename(filePath, '.jsonl'),
+        projectHash: path.basename(path.dirname(filePath)),
+        timestamp: new Date().toISOString(),
+      };
+    }
+
+    function createSessionMessageEvent(
+      filePath: string,
+      messages: Array<{ role: string; content: string }>
+    ): SessionEvent {
+      return {
+        type: 'session:message',
+        sessionId: path.basename(filePath, '.jsonl'),
+        projectHash: path.basename(path.dirname(filePath)),
+        timestamp: new Date().toISOString(),
+        data: { messages },
+      };
+    }
+
+    it('should create session:created event with correct sessionId', () => {
+      const filePath = '/Users/test/.claude/projects/-Users-test-my-project/new-session-123.jsonl';
+      const event = createSessionCreatedEvent(filePath);
+
+      expect(event.type).toBe('session:created');
+      expect(event.sessionId).toBe('new-session-123');
+      expect(event.projectHash).toBe('-Users-test-my-project');
+    });
+
+    it('should create session:activity event with correct sessionId', () => {
+      const filePath = '/Users/test/.claude/projects/-Users-test-my-project/existing-session-789.jsonl';
+      const event = createSessionActivityEvent(filePath);
+
+      expect(event.type).toBe('session:activity');
+      expect(event.sessionId).toBe('existing-session-789');
+    });
+
+    it('should create session:message event with parsed content', () => {
+      const filePath = '/Users/test/.claude/projects/-Users-test-my-project/session.jsonl';
+      const messages = [
+        { role: 'user', content: 'Hello' },
+        { role: 'assistant', content: 'Hi there!' },
+      ];
+      const event = createSessionMessageEvent(filePath, messages);
+
+      expect(event.type).toBe('session:message');
+      expect(event.data?.messages).toEqual(messages);
+    });
+
+    it('should include valid ISO timestamp in events', () => {
+      const filePath = '/Users/test/.claude/projects/-Users-test-my-project/session.jsonl';
+      const event = createSessionCreatedEvent(filePath);
+
+      expect(event.timestamp).toBeDefined();
+      // Verify it's a valid ISO string
+      const date = new Date(event.timestamp);
+      expect(date.toISOString()).toBe(event.timestamp);
+    });
+  });
+
+  describe('Debouncing logic', () => {
+    /**
+     * The watcher debounces rapid file changes to reduce event noise.
+     * Multiple changes to the same file within the debounce window
+     * should result in a single event.
+     */
+    it('should debounce rapid changes to the same file', async () => {
+      const events: string[] = [];
+      const debounceTimers = new Map<string, NodeJS.Timeout>();
+      const DEBOUNCE_MS = 100;
+
+      function debouncedHandler(filePath: string) {
+        // Clear existing timer
+        const existing = debounceTimers.get(filePath);
+        if (existing) {
+          clearTimeout(existing);
+        }
+
+        // Set new timer
+        const timer = setTimeout(() => {
+          events.push(filePath);
+          debounceTimers.delete(filePath);
+        }, DEBOUNCE_MS);
+
+        debounceTimers.set(filePath, timer);
+      }
+
+      const sessionPath = '/Users/test/.claude/projects/-Users-test-my-project/rapid-session.jsonl';
+
+      // Simulate 5 rapid changes
+      for (let i = 0; i < 5; i++) {
+        debouncedHandler(sessionPath);
+      }
+
+      // Wait for debounce to complete
+      await new Promise(resolve => setTimeout(resolve, DEBOUNCE_MS + 50));
+
+      // Should only have one event due to debouncing
+      expect(events.length).toBe(1);
+      expect(events[0]).toBe(sessionPath);
+    });
+
+    it('should handle changes to different files independently', async () => {
+      const events: string[] = [];
+      const debounceTimers = new Map<string, NodeJS.Timeout>();
+      const DEBOUNCE_MS = 100;
+
+      function debouncedHandler(filePath: string) {
+        const existing = debounceTimers.get(filePath);
+        if (existing) {
+          clearTimeout(existing);
+        }
+
+        const timer = setTimeout(() => {
+          events.push(filePath);
+          debounceTimers.delete(filePath);
+        }, DEBOUNCE_MS);
+
+        debounceTimers.set(filePath, timer);
+      }
+
+      const session1 = '/Users/test/.claude/projects/-proj1/session1.jsonl';
+      const session2 = '/Users/test/.claude/projects/-proj1/session2.jsonl';
+
+      // Changes to different files
+      debouncedHandler(session1);
+      debouncedHandler(session2);
+
+      await new Promise(resolve => setTimeout(resolve, DEBOUNCE_MS + 50));
+
+      // Should have events for both files
+      expect(events.length).toBe(2);
+      expect(events).toContain(session1);
+      expect(events).toContain(session2);
+    });
+  });
+
+  describe('JSONL file pattern matching', () => {
+    /**
+     * The watcher should only process .jsonl files.
+     */
+    function isSessionFile(filePath: string): boolean {
+      return filePath.endsWith('.jsonl');
+    }
+
+    it('should match JSONL files', () => {
+      expect(isSessionFile('/path/to/session.jsonl')).toBe(true);
+      expect(isSessionFile('/path/to/another-session-123.jsonl')).toBe(true);
+    });
+
+    it('should not match non-JSONL files', () => {
+      expect(isSessionFile('/path/to/file.json')).toBe(false);
+      expect(isSessionFile('/path/to/file.txt')).toBe(false);
+      expect(isSessionFile('/path/to/file.jsonl.bak')).toBe(false);
+    });
+  });
+
+  describe('Claude projects directory pattern', () => {
+    /**
+     * The watcher watches ~/.claude/projects/**\/*.jsonl
+     * Files should be at depth 1 within the projects directory.
+     */
+    function isValidSessionPath(filePath: string): boolean {
+      // Path should match: ~/.claude/projects/{project-hash}/{session-id}.jsonl
+      const claudeProjectsPattern = /\.claude\/projects\/[^/]+\/[^/]+\.jsonl$/;
+      return claudeProjectsPattern.test(filePath);
+    }
+
+    it('should match valid session file paths', () => {
+      expect(isValidSessionPath('/Users/test/.claude/projects/-Users-test-my-project/session.jsonl')).toBe(true);
+    });
+
+    it('should not match files at wrong depth', () => {
+      // Too shallow (directly in projects/)
+      expect(isValidSessionPath('/Users/test/.claude/projects/session.jsonl')).toBe(false);
+
+      // Too deep (nested subdirectory)
+      expect(isValidSessionPath('/Users/test/.claude/projects/-proj/subdir/session.jsonl')).toBe(false);
+    });
+  });
+
+  describe('Chokidar watcher configuration', () => {
+    /**
+     * The session watcher should be configured with specific options:
+     * - persistent: true (keep watching)
+     * - ignoreInitial: true (don't emit for existing files)
+     * - depth: 2 (project-hash/session-id.jsonl)
+     */
+    it('should specify correct watcher options', () => {
+      const expectedOptions = {
+        persistent: true,
+        ignoreInitial: true,
+        depth: 2,
+      };
+
+      // Verify the expected configuration
+      expect(expectedOptions.persistent).toBe(true);
+      expect(expectedOptions.ignoreInitial).toBe(true);
+      expect(expectedOptions.depth).toBe(2);
+    });
+
+    it('should watch the correct glob pattern', () => {
+      const homeDir = '/Users/test';
+      const expectedPattern = `${homeDir}/.claude/projects/**/*.jsonl`;
+
+      expect(expectedPattern).toContain('/.claude/projects/');
+      expect(expectedPattern).toContain('**/*.jsonl');
+    });
+  });
+
+  describe('Event handler registration', () => {
+    /**
+     * The watcher should register handlers for:
+     * - 'add': New session file created
+     * - 'change': Session file modified
+     * - 'error': Watcher error
+     */
+    it('should register all required event handlers', () => {
+      const requiredEvents = ['add', 'change', 'error'];
+      const registeredHandlers = new Map<string, () => void>();
+
+      // Simulate registering handlers
+      const mockWatcher = {
+        on: (event: string, handler: () => void) => {
+          registeredHandlers.set(event, handler);
+          return mockWatcher;
+        },
+      };
+
+      // Register handlers as watcher does
+      mockWatcher
+        .on('add', () => { /* handle new file */ })
+        .on('change', () => { /* handle file change */ })
+        .on('error', () => { /* handle error */ });
+
+      // Verify all required handlers are registered
+      for (const event of requiredEvents) {
+        expect(registeredHandlers.has(event)).toBe(true);
+      }
+    });
+  });
+
+  describe('Error handling', () => {
+    /**
+     * The watcher should handle errors gracefully without crashing.
+     */
+    it('should handle watcher errors without throwing', () => {
+      const errorHandler = (error: Error) => {
+        console.error('[Watcher] Error:', error.message);
+        // Don't rethrow - handle gracefully
+      };
+
+      // Should not throw
+      expect(() => {
+        errorHandler(new Error('Test watcher error'));
+      }).not.toThrow();
+    });
+
+    it('should handle file read errors without throwing', async () => {
+      const handleFileChange = async (filePath: string) => {
+        try {
+          // Simulate file read that throws
+          throw new Error('ENOENT: file not found');
+        } catch {
+          // Gracefully handle - file might have been deleted
+          return null;
+        }
+      };
+
+      // Should not throw
+      const result = await handleFileChange('/path/to/deleted.jsonl');
+      expect(result).toBeNull();
+    });
+  });
+});
diff --git a/packages/dashboard/tests/orchestration/orchestration-decisions.test.ts b/packages/dashboard/tests/orchestration/orchestration-decisions.test.ts
new file mode 100644
index 0000000..1a3cb9a
--- /dev/null
+++ b/packages/dashboard/tests/orchestration/orchestration-decisions.test.ts
@@ -0,0 +1,755 @@
+/**
+ * Tests for orchestration-decisions.ts
+ *
+ * These tests verify the pure decision logic extracted from orchestration-runner.ts.
+ * Each test covers a specific condition from the decision matrix (G1.x, G2.x goals).
+ */
+
+import { describe, it, expect } from 'vitest';
+import {
+  makeDecision,
+  handleImplementBatching,
+  getSkillForStep,
+  getNextStep,
+  calculateExponentialBackoff,
+  areAllBatchesComplete,
+  STALE_THRESHOLD_MS,
+  type DecisionInput,
+  type WorkflowState,
+} from '../../src/lib/services/orchestration-decisions';
+import type { OrchestrationExecution } from '@specflow/shared';
+
+// =============================================================================
+// Test Fixtures
+// =============================================================================
+
+function createMockExecution(overrides: Partial<OrchestrationExecution> = {}): OrchestrationExecution {
+  return {
+    id: 'test-orch-id',
+    projectId: 'test-project',
+    status: 'running',
+    config: {
+      autoMerge: false,
+      skipDesign: false,
+      skipAnalyze: false,
+      autoHealEnabled: true,
+      maxHealAttempts: 3,
+      pauseBetweenBatches: false,
+      batchSizeFallback: 10,
+      additionalContext: '',
+      budget: {
+        maxTotal: 50,
+        maxPerBatch: 5,
+        healingBudget: 5,
+        decisionBudget: 2,
+      },
+    },
+    currentPhase: 'implement',
+    batches: {
+      total: 0,
+      current: 0,
+      items: [],
+    },
+    executions: {
+      implement: [],
+      healers: [],
+    },
+    startedAt: new Date().toISOString(),
+    updatedAt: new Date().toISOString(),
+    decisionLog: [],
+    totalCostUsd: 0,
+    ...overrides,
+  };
+}
+
+function createMockInput(overrides: Partial<DecisionInput> = {}): DecisionInput {
+  return {
+    step: {
+      current: 'implement',
+      index: 2,
+      status: 'in_progress',
+    },
+    phase: {},
+    execution: createMockExecution(),
+    workflow: null,
+    ...overrides,
+  };
+}
+
+function createMockWorkflow(overrides: Partial<WorkflowState> = {}): WorkflowState {
+  return {
+    id: 'test-workflow-id',
+    status: 'running',
+    ...overrides,
+  };
+}
+
+// =============================================================================
+// Helper Function Tests
+// =============================================================================
+
+describe('getSkillForStep', () => {
+  it('returns correct skill for each step', () => {
+    expect(getSkillForStep('design')).toBe('flow.design');
+    expect(getSkillForStep('analyze')).toBe('flow.analyze');
+    expect(getSkillForStep('implement')).toBe('flow.implement');
+    expect(getSkillForStep('verify')).toBe('flow.verify');
+    expect(getSkillForStep('merge')).toBe('flow.merge');
+  });
+
+  it('returns flow.implement for unknown step', () => {
+    expect(getSkillForStep('unknown')).toBe('flow.implement');
+  });
+});
+
+describe('getNextStep', () => {
+  it('returns correct next step', () => {
+    expect(getNextStep('design')).toBe('analyze');
+    expect(getNextStep('analyze')).toBe('implement');
+    expect(getNextStep('implement')).toBe('verify');
+    expect(getNextStep('verify')).toBe('merge');
+  });
+
+  it('returns null for merge (last step)', () => {
+    expect(getNextStep('merge')).toBeNull();
+  });
+
+  it('returns null for unknown step', () => {
+    expect(getNextStep('unknown')).toBeNull();
+  });
+});
+
+describe('calculateExponentialBackoff', () => {
+  it('calculates backoff correctly', () => {
+    expect(calculateExponentialBackoff(0)).toBe(1000);   // 1s
+    expect(calculateExponentialBackoff(1)).toBe(2000);   // 2s
+    expect(calculateExponentialBackoff(2)).toBe(4000);   // 4s
+    expect(calculateExponentialBackoff(3)).toBe(8000);   // 8s
+    expect(calculateExponentialBackoff(4)).toBe(16000);  // 16s
+  });
+
+  it('caps at 30 seconds', () => {
+    expect(calculateExponentialBackoff(5)).toBe(30000);
+    expect(calculateExponentialBackoff(10)).toBe(30000);
+  });
+});
+
+describe('areAllBatchesComplete', () => {
+  it('returns false for empty batches', () => {
+    expect(areAllBatchesComplete({ total: 0, current: 0, items: [] })).toBe(false);
+  });
+
+  it('returns true when all batches completed', () => {
+    const batches = {
+      total: 2,
+      current: 1,
+      items: [
+        { index: 0, section: 'A', taskIds: ['T001'], status: 'completed' as const, healAttempts: 0 },
+        { index: 1, section: 'B', taskIds: ['T002'], status: 'completed' as const, healAttempts: 0 },
+      ],
+    };
+    expect(areAllBatchesComplete(batches)).toBe(true);
+  });
+
+  it('returns true when all batches healed', () => {
+    const batches = {
+      total: 2,
+      current: 1,
+      items: [
+        { index: 0, section: 'A', taskIds: ['T001'], status: 'healed' as const, healAttempts: 1 },
+        { index: 1, section: 'B', taskIds: ['T002'], status: 'healed' as const, healAttempts: 1 },
+      ],
+    };
+    expect(areAllBatchesComplete(batches)).toBe(true);
+  });
+
+  it('returns false when some batches pending', () => {
+    const batches = {
+      total: 2,
+      current: 0,
+      items: [
+        { index: 0, section: 'A', taskIds: ['T001'], status: 'completed' as const, healAttempts: 0 },
+        { index: 1, section: 'B', taskIds: ['T002'], status: 'pending' as const, healAttempts: 0 },
+      ],
+    };
+    expect(areAllBatchesComplete(batches)).toBe(false);
+  });
+});
+
+// =============================================================================
+// Pre-Decision Gates Tests (G1.1, G1.2)
+// =============================================================================
+
+describe('makeDecision - Pre-Decision Gates', () => {
+  it('G1.1: returns fail when budget exceeded', () => {
+    const execution = createMockExecution({
+      totalCostUsd: 60, // Exceeds maxTotal of 50
+    });
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      execution,
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('fail');
+    expect(result.reason).toContain('Budget exceeded');
+    expect(result.errorMessage).toContain('Budget limit exceeded');
+  });
+
+  it('G1.1: does not fail when under budget', () => {
+    const execution = createMockExecution({
+      totalCostUsd: 10,
+    });
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      execution,
+      workflow: createMockWorkflow({ status: 'running' }),
+      lastFileChangeTime: Date.now() - 1000,
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).not.toBe('fail');
+  });
+
+  it('G1.2: returns needs_attention when duration exceeds 4 hours', () => {
+    const fourHoursAgo = Date.now() - (5 * 60 * 60 * 1000); // 5 hours ago
+    const execution = createMockExecution({
+      startedAt: new Date(fourHoursAgo).toISOString(),
+    });
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      execution,
+      currentTime: Date.now(),
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('needs_attention');
+    expect(result.reason).toContain('too long');
+    expect(result.recoveryOptions).toContain('abort');
+  });
+
+  it('G1.2: does not fail when under 4 hours', () => {
+    const twoHoursAgo = Date.now() - (2 * 60 * 60 * 1000); // 2 hours ago
+    const execution = createMockExecution({
+      startedAt: new Date(twoHoursAgo).toISOString(),
+    });
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      execution,
+      workflow: createMockWorkflow({ status: 'running' }),
+      lastFileChangeTime: Date.now() - 1000,
+      currentTime: Date.now(),
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).not.toBe('needs_attention');
+  });
+
+  it('G1.1 takes precedence over G1.2 (budget check first)', () => {
+    const fiveHoursAgo = Date.now() - (5 * 60 * 60 * 1000);
+    const execution = createMockExecution({
+      totalCostUsd: 60, // Over budget
+      startedAt: new Date(fiveHoursAgo).toISOString(), // Also over time
+    });
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      execution,
+      currentTime: Date.now(),
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('fail'); // Budget check takes precedence
+  });
+});
+
+// =============================================================================
+// Decision Matrix Tests (G1.x Goals)
+// =============================================================================
+
+describe('makeDecision - Workflow States', () => {
+  it('G1.4: returns wait when workflow is running (recent activity)', () => {
+    // Use design step to avoid batch handling logic
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      workflow: createMockWorkflow({ status: 'running' }),
+      lastFileChangeTime: Date.now() - 1000, // 1 second ago
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('wait');
+    expect(result.reason).toBe('Workflow running');
+  });
+
+  it('G1.5: returns recover_stale when workflow stale (>10 min)', () => {
+    // Use design step to avoid batch handling logic
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      workflow: createMockWorkflow({ status: 'running' }),
+      lastFileChangeTime: Date.now() - STALE_THRESHOLD_MS - 60000, // 11 minutes ago
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('recover_stale');
+    expect(result.workflowId).toBe('test-workflow-id');
+  });
+
+  it('G1.6: returns wait when workflow waiting for input', () => {
+    // Use design step to avoid batch handling logic
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      workflow: createMockWorkflow({ status: 'waiting_for_input' }),
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('wait');
+    expect(result.reason).toBe('Waiting for user input');
+  });
+
+  it('returns needs_attention when workflow failed', () => {
+    // Use design step to avoid batch handling logic
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      workflow: createMockWorkflow({ status: 'failed', error: 'Something went wrong' }),
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('needs_attention');
+    expect(result.recoveryOptions).toContain('retry');
+    expect(result.failedWorkflowId).toBe('test-workflow-id');
+  });
+
+  it('returns needs_attention when workflow cancelled', () => {
+    // Use design step to avoid batch handling logic
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      workflow: createMockWorkflow({ status: 'cancelled' }),
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('needs_attention');
+  });
+});
+
+describe('makeDecision - Lookup Failures', () => {
+  it('G1.3: returns wait_with_backoff when workflow lookup fails', () => {
+    const execution = createMockExecution({
+      currentPhase: 'design',
+      executions: { design: 'stored-workflow-id', implement: [], healers: [] },
+    });
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      execution,
+      workflow: null, // Lookup failed
+      lookupFailures: 2,
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('wait_with_backoff');
+    expect(result.backoffMs).toBe(4000); // 2^2 * 1000
+  });
+});
+
+describe('makeDecision - Step Complete Transitions', () => {
+  it('G1.8: waits for USER_GATE when verify complete', () => {
+    const input = createMockInput({
+      step: { current: 'verify', index: 3, status: 'complete' },
+      phase: { hasUserGate: true, userGateStatus: 'pending' },
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('wait_user_gate');
+  });
+
+  it('G1.9: waits for merge when autoMerge=false', () => {
+    const execution = createMockExecution({
+      config: {
+        ...createMockExecution().config,
+        autoMerge: false,
+      },
+    });
+    const input = createMockInput({
+      step: { current: 'verify', index: 3, status: 'complete' },
+      execution,
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('wait_merge');
+  });
+
+  it('G1.10: transitions to merge when autoMerge=true', () => {
+    const execution = createMockExecution({
+      config: {
+        ...createMockExecution().config,
+        autoMerge: true,
+      },
+    });
+    const input = createMockInput({
+      step: { current: 'verify', index: 3, status: 'complete' },
+      execution,
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('transition');
+    expect(result.nextStep).toBe('merge');
+    expect(result.skill).toBe('flow.merge');
+  });
+
+  it('G1.11: completes when merge step is complete', () => {
+    const input = createMockInput({
+      step: { current: 'merge', index: 4, status: 'complete' },
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('complete');
+  });
+
+  it('G1.12: transitions to next step when complete', () => {
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'complete' },
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('transition');
+    expect(result.nextStep).toBe('analyze');
+    expect(result.skill).toBe('flow.analyze');
+  });
+});
+
+describe('makeDecision - Step Failed/Blocked', () => {
+  it('G1.13: returns recover_failed when step failed', () => {
+    // Use design step to avoid batch handling logic
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'failed' },
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('recover_failed');
+  });
+
+  it('G1.14: returns recover_failed when step blocked', () => {
+    // Use design step to avoid batch handling logic
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'blocked' },
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('recover_failed');
+  });
+});
+
+describe('makeDecision - Spawn Workflows', () => {
+  it('G1.15: spawns workflow when in_progress but no workflow', () => {
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'in_progress' },
+      workflow: null,
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('spawn');
+    expect(result.skill).toBe('flow.design');
+  });
+
+  it('G1.16: spawns workflow when step not_started', () => {
+    const input = createMockInput({
+      step: { current: 'analyze', index: 1, status: 'not_started' },
+      workflow: null,
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('spawn');
+    expect(result.skill).toBe('flow.analyze');
+  });
+
+  it('G1.17: initializes batches when entering implement with no batches', () => {
+    const input = createMockInput({
+      step: { current: 'implement', index: 2, status: 'not_started' },
+      workflow: null,
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('initialize_batches');
+  });
+});
+
+describe('makeDecision - Unknown Status', () => {
+  it('G1.18: returns needs_attention for unknown status', () => {
+    // Use design step to avoid batch handling logic
+    const input = createMockInput({
+      step: { current: 'design', index: 0, status: 'skipped' as any },
+    });
+
+    const result = makeDecision(input);
+    expect(result.action).toBe('needs_attention');
+  });
+});
+
+// =============================================================================
+// Batch Handling Tests (G2.x Goals)
+// =============================================================================
+
+describe('handleImplementBatching', () => {
+  it('G2.1: returns initialize_batches when no batches', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({ batches: { total: 0, current: 0, items: [] } });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('initialize_batches');
+  });
+
+  it('G2.4: spawns batch when pending and no workflow', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001', 'T002'], status: 'pending', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T003', 'T004'], status: 'pending', healAttempts: 0 },
+        ],
+      },
+    });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('spawn_batch');
+    expect(result?.skill).toBe('flow.implement');
+    expect(result?.batchContext).toContain('T001');
+    expect(result?.batchContext).toContain('Setup');
+  });
+
+  it('G2.5: defers to staleness check when batch running with workflow', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({
+      batches: {
+        total: 1,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'running', healAttempts: 0 },
+        ],
+      },
+    });
+    const workflow = createMockWorkflow({ status: 'running' });
+
+    const result = handleImplementBatching(step, execution, workflow);
+    expect(result).toBeNull(); // Defer to main matrix
+  });
+
+  it('G2.6: pauses when batch complete and pauseBetweenBatches=true', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({
+      config: {
+        ...createMockExecution().config,
+        pauseBetweenBatches: true,
+      },
+      batches: {
+        total: 2,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'completed', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'pending', healAttempts: 0 },
+        ],
+      },
+    });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('pause');
+  });
+
+  it('G2.7: advances batch when complete and pauseBetweenBatches=false', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'completed', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'pending', healAttempts: 0 },
+        ],
+      },
+    });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('advance_batch');
+    expect(result?.batchIndex).toBe(1);
+  });
+
+  it('G2.8: advances batch when healed', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'healed', healAttempts: 1 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'pending', healAttempts: 0 },
+        ],
+      },
+    });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('advance_batch');
+  });
+
+  it('G2.9: heals batch when failed and attempts remaining', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({
+      batches: {
+        total: 1,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'failed', healAttempts: 1 },
+        ],
+      },
+    });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('heal_batch');
+    expect(result?.batchIndex).toBe(0);
+  });
+
+  it('G2.9: returns recover_failed when no heal attempts remaining', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({
+      batches: {
+        total: 1,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'failed', healAttempts: 3 },
+        ],
+      },
+    });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('recover_failed');
+  });
+
+  it('G2.10-11: forces step complete when all batches done but status not updated', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+    const execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 1,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'completed', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'completed', healAttempts: 0 },
+        ],
+      },
+    });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('force_step_complete');
+  });
+
+  it('G2.10: defers when all batches done and status is complete', () => {
+    const step = { current: 'implement', index: 2, status: 'complete' as const };
+    const execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 1,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'completed', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'completed', healAttempts: 0 },
+        ],
+      },
+    });
+
+    const result = handleImplementBatching(step, execution, null);
+    expect(result).toBeNull(); // Let main matrix handle transition
+  });
+});
+
+// =============================================================================
+// Happy Path Integration Test (G11.5)
+// =============================================================================
+
+describe('Happy Path: design → analyze → implement → verify → merge', () => {
+  it('transitions through all phases with autoMerge=true', () => {
+    // Phase 1: design complete → transition to analyze
+    let input = createMockInput({
+      step: { current: 'design', index: 0, status: 'complete' },
+    });
+    let result = makeDecision(input);
+    expect(result.action).toBe('transition');
+    expect(result.nextStep).toBe('analyze');
+
+    // Phase 2: analyze complete → transition to implement
+    input = createMockInput({
+      step: { current: 'analyze', index: 1, status: 'complete' },
+    });
+    result = makeDecision(input);
+    expect(result.action).toBe('transition');
+    expect(result.nextStep).toBe('implement');
+
+    // Phase 3: implement batches → all batches complete → transition to verify
+    // (This is handled by handleImplementBatching, tested separately)
+
+    // Phase 4: verify complete with autoMerge=true → transition to merge
+    const autoMergeExecution = createMockExecution({
+      config: {
+        ...createMockExecution().config,
+        autoMerge: true,
+      },
+    });
+    input = createMockInput({
+      step: { current: 'verify', index: 3, status: 'complete' },
+      execution: autoMergeExecution,
+    });
+    result = makeDecision(input);
+    expect(result.action).toBe('transition');
+    expect(result.nextStep).toBe('merge');
+    expect(result.skill).toBe('flow.merge');
+
+    // Phase 5: merge complete → orchestration complete
+    input = createMockInput({
+      step: { current: 'merge', index: 4, status: 'complete' },
+    });
+    result = makeDecision(input);
+    expect(result.action).toBe('complete');
+  });
+
+  it('handles batch progression during implement phase', () => {
+    const step = { current: 'implement', index: 2, status: 'in_progress' as const };
+
+    // Batch 0 pending, no workflow → spawn_batch
+    let execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'pending', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'pending', healAttempts: 0 },
+        ],
+      },
+    });
+    let result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('spawn_batch');
+
+    // Batch 0 completed → advance_batch to 1
+    execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'completed', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'pending', healAttempts: 0 },
+        ],
+      },
+    });
+    result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('advance_batch');
+    expect(result?.batchIndex).toBe(1);
+
+    // Both batches completed → force_step_complete
+    execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 1,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'completed', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'completed', healAttempts: 0 },
+        ],
+      },
+    });
+    result = handleImplementBatching(step, execution, null);
+    expect(result?.action).toBe('force_step_complete');
+  });
+});
diff --git a/packages/dashboard/tests/orchestration/orchestration-runner.test.ts b/packages/dashboard/tests/orchestration/orchestration-runner.test.ts
index e9f4d8f..e637859 100644
--- a/packages/dashboard/tests/orchestration/orchestration-runner.test.ts
+++ b/packages/dashboard/tests/orchestration/orchestration-runner.test.ts
@@ -15,6 +15,7 @@ const {
   mockAttemptHealFn,
   mockQuickDecision,
   mockExecSync,
+  mockIsPhaseComplete,
 } = vi.hoisted(() => ({
   mockOrchestrationServiceFns: {
     get: vi.fn(),
@@ -60,11 +61,20 @@ const {
       progress: { tasksTotal: 10, tasksComplete: 0, percentage: 0 },
     })
   ),
+  mockIsPhaseComplete: vi.fn(() => false),
 }));
 
-// Mock fs operations
+// Mock fs operations (updated for direct file reading in T021-T024)
 vi.mock('fs', () => ({
-  existsSync: vi.fn((path: string) => path.includes('.specflow') || path.includes('registry')),
+  existsSync: vi.fn((path: string) => {
+    // Spawn intent and runner state files should not exist by default (for spawn guards)
+    if (path.includes('spawn-intent-') || path.includes('runner-')) return false;
+    // Return true for specflow directories, registry, and specs directories
+    if (path.includes('.specflow') || path.includes('registry')) return true;
+    if (path.includes('/specs')) return true;
+    if (path.includes('spec.md') || path.includes('plan.md') || path.includes('tasks.md')) return true;
+    return false;
+  }),
   readFileSync: vi.fn((path: string) => {
     // Return registry with test project
     if (path.includes('registry.json')) {
@@ -74,22 +84,52 @@ vi.mock('fs', () => ({
         },
       });
     }
+    // Return tasks.md content for direct file reading
+    if (path.includes('tasks.md')) {
+      return `# Tasks: Test Phase
+
+## Phase 1: Setup
+- [x] T001 Create project structure
+- [x] T002 Add configuration
+- [x] T003 Setup tests
+
+## Phase 2: Implementation
+- [ ] T004 Implement feature A
+- [ ] T005 Implement feature B
+- [ ] T006 Implement feature C
+`;
+    }
     throw new Error(`File not found: ${path}`);
   }),
+  readdirSync: vi.fn((path: string, options?: { withFileTypes?: boolean }) => {
+    // Return specs directory listing for findActiveFeatureDir
+    if (path.includes('/specs')) {
+      if (options?.withFileTypes) {
+        return [
+          { name: '1055-test-phase', isDirectory: () => true },
+        ];
+      }
+      return ['1055-test-phase'];
+    }
+    return [];
+  }),
   writeFileSync: vi.fn(),
   mkdirSync: vi.fn(),
   unlinkSync: vi.fn(),
+  renameSync: vi.fn(),
 }));
 
-// Mock child_process for specflow status
-vi.mock('child_process', () => ({
-  execSync: mockExecSync,
-  spawn: vi.fn(),
-}));
+// Note: child_process mocking removed - no longer uses execSync (T021-T024)
 
 // Mock orchestration service
 vi.mock('@/lib/services/orchestration-service', () => ({
   orchestrationService: mockOrchestrationServiceFns,
+  getNextPhase: vi.fn((current: string) => {
+    const phases = ['design', 'analyze', 'implement', 'verify', 'merge', 'complete'];
+    const idx = phases.indexOf(current);
+    return idx >= 0 && idx < phases.length - 1 ? phases[idx + 1] : null;
+  }),
+  isPhaseComplete: mockIsPhaseComplete,
 }));
 
 // Mock workflow service
@@ -201,18 +241,16 @@ describe('OrchestrationRunner', () => {
     });
 
     it('should transition from design to analyze when design completes', async () => {
-      const orch = createOrchestration({ currentPhase: 'design' });
+      // Include executions.design so getCurrentWorkflowId can find the workflow
+      const orch = createOrchestration({
+        currentPhase: 'design',
+        executions: { design: 'wf-1', implement: [], healers: [] },
+      });
       mockOrchestrationService.get.mockReturnValue(orch);
       mockWorkflowService.get.mockReturnValue({ id: 'wf-1', status: 'completed' });
 
-      // Mock specflow status showing design artifacts exist
-      mockExecSync.mockReturnValue(
-        JSON.stringify({
-          phase: { number: 1055 },
-          context: { hasSpec: true, hasPlan: true, hasTasks: true },
-          progress: { tasksTotal: 10, tasksComplete: 0 },
-        })
-      );
+      // Design phase is complete when artifacts exist (hasPlan && hasTasks)
+      mockIsPhaseComplete.mockReturnValue(true);
 
       // Run briefly
       const promise = runOrchestration(projectId, orchestrationId, 50, 2);
@@ -460,6 +498,8 @@ describe('OrchestrationRunner', () => {
       const orch = createOrchestration({
         currentPhase: 'verify',
         config: { ...defaultConfig, autoMerge: false },
+        // Include executions.verify so getCurrentWorkflowId can find the workflow
+        executions: { verify: 'wf-1', implement: [], healers: [] },
         batches: {
           total: 1,
           current: 0,
@@ -471,14 +511,7 @@ describe('OrchestrationRunner', () => {
       mockOrchestrationService.get.mockReturnValue(orch);
       mockWorkflowService.get.mockReturnValue({ id: 'wf-1', status: 'completed' });
 
-      // Mock specflow status showing all tasks complete
-      mockExecSync.mockReturnValue(
-        JSON.stringify({
-          phase: { number: 1055 },
-          context: { hasSpec: true, hasPlan: true, hasTasks: true },
-          progress: { tasksTotal: 1, tasksComplete: 1 },
-        })
-      );
+      // Note: mockExecSync no longer used - direct file reading mocks are set up at top level
 
       const promise = runOrchestration(projectId, orchestrationId, 50, 2);
       await new Promise(resolve => setTimeout(resolve, 150));
@@ -580,6 +613,36 @@ describe('OrchestrationRunner', () => {
       await Promise.all([promise1, promise2]);
     });
 
+    it('G5.5: should not spawn when hasActiveWorkflow returns true', async () => {
+      // The spawn intent pattern (G5.3-G5.7) guards workflow spawning
+      // This test verifies the hasActiveWorkflow guard prevents duplicate spawns
+
+      const orch = createOrchestration({
+        currentPhase: 'implement',
+        status: 'running',
+        batches: {
+          total: 1,
+          current: 0,
+          items: [
+            { index: 0, section: 'Setup', taskIds: ['T001'], status: 'pending', healAttempts: 0 },
+          ],
+        },
+      });
+      mockOrchestrationService.get.mockReturnValue(orch);
+      mockWorkflowService.get.mockReturnValue(undefined);
+
+      // hasActiveWorkflow returns true means another spawn is in progress
+      mockWorkflowService.hasActiveWorkflow.mockReturnValue(true);
+
+      const promise = runOrchestration(projectId, orchestrationId, 50, 2);
+      await new Promise(resolve => setTimeout(resolve, 150));
+      stopRunner(orchestrationId);
+      await promise;
+
+      // Should not spawn because hasActiveWorkflow returns true (guard prevents duplicate)
+      expect(mockWorkflowService.start).not.toHaveBeenCalled();
+    });
+
     it('should track active runner status', async () => {
       mockOrchestrationService.get.mockReturnValue(createOrchestration({ status: 'paused' }));
 
@@ -595,6 +658,140 @@ describe('OrchestrationRunner', () => {
 
       expect(isRunnerActive(orchestrationId)).toBe(false);
     });
+
+    it('G11.12/G12.17: prevents duplicate workflow spawns on rapid triggers', async () => {
+      // This test verifies that rapid parallel calls to spawn logic result in only ONE workflow
+      // The spawn intent pattern (G5.3-G5.7) uses file-based locks to prevent race conditions
+
+      const orch = createOrchestration({
+        currentPhase: 'implement',
+        status: 'running',
+        batches: {
+          total: 1,
+          current: 0,
+          items: [
+            { index: 0, section: 'Setup', taskIds: ['T001'], status: 'pending', healAttempts: 0 },
+          ],
+        },
+      });
+
+      // Track spawn intent state to simulate file-based locking
+      let spawnIntentExists = false;
+      let workflowStartCount = 0;
+
+      // Mock fs.existsSync to track spawn intent file
+      const fs = await import('fs');
+      const originalExistsSync = fs.existsSync as ReturnType<typeof vi.fn>;
+      originalExistsSync.mockImplementation((path: string) => {
+        if (typeof path === 'string' && path.includes('spawn-intent-')) {
+          return spawnIntentExists;
+        }
+        if (path.includes('.specflow') || path.includes('registry')) return true;
+        if (path.includes('/specs')) return true;
+        if (path.includes('spec.md') || path.includes('plan.md') || path.includes('tasks.md')) return true;
+        return false;
+      });
+
+      // Mock fs.writeFileSync to track when spawn intent is written
+      const originalWriteFileSync = fs.writeFileSync as ReturnType<typeof vi.fn>;
+      originalWriteFileSync.mockImplementation((path: string) => {
+        if (typeof path === 'string' && path.includes('spawn-intent-')) {
+          spawnIntentExists = true;
+        }
+      });
+
+      // Mock fs.unlinkSync to track when spawn intent is cleared
+      const originalUnlinkSync = fs.unlinkSync as ReturnType<typeof vi.fn>;
+      originalUnlinkSync.mockImplementation((path: string) => {
+        if (typeof path === 'string' && path.includes('spawn-intent-')) {
+          spawnIntentExists = false;
+        }
+      });
+
+      mockOrchestrationService.get.mockReturnValue(orch);
+      mockWorkflowService.get.mockReturnValue(undefined);
+      mockWorkflowService.hasActiveWorkflow.mockReturnValue(false);
+
+      // Track actual workflow.start calls
+      mockWorkflowService.start.mockImplementation(async () => {
+        workflowStartCount++;
+        // Simulate a small delay like a real spawn would have
+        await new Promise(resolve => setTimeout(resolve, 10));
+        return { id: `workflow-${workflowStartCount}`, status: 'running' };
+      });
+
+      // Simulate rapid parallel spawn attempts by running multiple orchestration loops
+      // The first should spawn a workflow, subsequent ones should see spawn intent and skip
+      const promise1 = runOrchestration(projectId, orchestrationId, 50, 2);
+
+      // Small delay to let first runner start and write spawn intent
+      await new Promise(resolve => setTimeout(resolve, 20));
+
+      // Try to start second runner while first is spawning
+      // This simulates a race condition where two runners try to spawn simultaneously
+      const promise2 = runOrchestration(projectId, `${orchestrationId}-2`, 50, 2);
+
+      // Wait for both to complete their first iteration
+      await new Promise(resolve => setTimeout(resolve, 200));
+
+      stopRunner(orchestrationId);
+      stopRunner(`${orchestrationId}-2`);
+      await Promise.all([promise1, promise2]);
+
+      // The spawn intent pattern should have prevented duplicate spawns
+      // workflowService.start should have been called at most twice (once per runner)
+      // but the spawn guard checks should limit actual spawns
+      // Note: Each runner can spawn once for its own orchestration ID since they use different IDs
+      // The key test is that a SINGLE orchestration doesn't spawn multiple workflows
+
+      // Reset for clean single-orchestration test
+      vi.clearAllMocks();
+      spawnIntentExists = false;
+      workflowStartCount = 0;
+
+      // Re-setup mocks after clearAllMocks
+      originalExistsSync.mockImplementation((path: string) => {
+        if (typeof path === 'string' && path.includes('spawn-intent-')) {
+          return spawnIntentExists;
+        }
+        if (path.includes('.specflow') || path.includes('registry')) return true;
+        if (path.includes('/specs')) return true;
+        return false;
+      });
+      originalWriteFileSync.mockImplementation((path: string) => {
+        if (typeof path === 'string' && path.includes('spawn-intent-')) {
+          spawnIntentExists = true;
+        }
+      });
+      originalUnlinkSync.mockImplementation((path: string) => {
+        if (typeof path === 'string' && path.includes('spawn-intent-')) {
+          spawnIntentExists = false;
+        }
+      });
+
+      mockOrchestrationService.get.mockReturnValue(orch);
+      mockWorkflowService.get.mockReturnValue(undefined);
+      mockWorkflowService.hasActiveWorkflow.mockReturnValue(false);
+
+      // For the spawn guard test: after first spawn, hasActiveWorkflow should return true
+      let hasSpawned = false;
+      mockWorkflowService.hasActiveWorkflow.mockImplementation(() => hasSpawned);
+      mockWorkflowService.start.mockImplementation(async () => {
+        workflowStartCount++;
+        hasSpawned = true;
+        await new Promise(resolve => setTimeout(resolve, 5));
+        return { id: `workflow-${workflowStartCount}`, status: 'running' };
+      });
+
+      // Single orchestration, multiple iterations - should only spawn ONCE
+      const singlePromise = runOrchestration(projectId, orchestrationId, 30, 4);
+      await new Promise(resolve => setTimeout(resolve, 200));
+      stopRunner(orchestrationId);
+      await singlePromise;
+
+      // Assert: Only ONE workflow was started despite multiple poll iterations
+      expect(workflowStartCount).toBe(1);
+    });
   });
 
   describe('Resume and Merge Triggers', () => {
@@ -608,11 +805,15 @@ describe('OrchestrationRunner', () => {
 
     it('triggerMerge should start merge workflow', async () => {
       mockOrchestrationService.get.mockReturnValue(createOrchestration({ status: 'waiting_merge' }));
+      // Reset hasActiveWorkflow to false (may have been set to true by G5.5 test)
+      // Note: vi.clearAllMocks() only clears call history, not mockReturnValue
+      mockWorkflowService.hasActiveWorkflow.mockReturnValue(false);
 
       await triggerMerge(projectId, orchestrationId);
 
       expect(mockOrchestrationService.triggerMerge).toHaveBeenCalledWith('/test/project', orchestrationId);
-      expect(mockWorkflowService.start).toHaveBeenCalledWith(projectId, 'flow.merge');
+      // workflowService.start is called with (projectId, skill, timeout, resumeSession, orchestrationId)
+      expect(mockWorkflowService.start).toHaveBeenCalledWith(projectId, 'flow.merge', undefined, undefined, orchestrationId);
     });
   });
 
diff --git a/packages/dashboard/tests/orchestration/orchestration-service.test.ts b/packages/dashboard/tests/orchestration/orchestration-service.test.ts
index 95b9bbf..733cfe4 100644
--- a/packages/dashboard/tests/orchestration/orchestration-service.test.ts
+++ b/packages/dashboard/tests/orchestration/orchestration-service.test.ts
@@ -40,6 +40,16 @@ vi.mock('fs', () => ({
     }
     return [];
   }),
+  renameSync: vi.fn((oldPath: string, newPath: string) => {
+    // For atomic writes: copy content from temp to final path
+    if (mockFiles.has(oldPath)) {
+      mockFiles.set(newPath, mockFiles.get(oldPath)!);
+      mockFiles.delete(oldPath);
+    }
+  }),
+  unlinkSync: vi.fn((path: string) => {
+    mockFiles.delete(path);
+  }),
 }));
 
 // Mock child_process for specflow status
diff --git a/packages/dashboard/tests/orchestration/orchestration-validation.test.ts b/packages/dashboard/tests/orchestration/orchestration-validation.test.ts
new file mode 100644
index 0000000..4cd1b80
--- /dev/null
+++ b/packages/dashboard/tests/orchestration/orchestration-validation.test.ts
@@ -0,0 +1,331 @@
+/**
+ * Tests for orchestration-validation.ts
+ *
+ * These tests verify the state validation logic for orchestration.
+ * Each test covers a specific validation check from NFR-002 and G7.x goals.
+ */
+
+import { describe, it, expect } from 'vitest';
+import {
+  validateState,
+  validateOrchestrationState,
+  validateExecutionState,
+  validateCrossFileConsistency,
+  getDetailedValidationIssues,
+} from '../../src/lib/services/orchestration-validation';
+import type { OrchestrationExecution, OrchestrationState } from '@specflow/shared';
+
+// =============================================================================
+// Test Fixtures
+// =============================================================================
+
+function createMockState(overrides: Partial<OrchestrationState> = {}): OrchestrationState {
+  return {
+    schema_version: '3.0.0',
+    project: {
+      id: 'test-project',
+      name: 'Test Project',
+      path: '/path/to/project',
+    },
+    orchestration: {
+      phase: {
+        number: '1057',
+        name: 'test-phase',
+        status: 'in_progress',
+      },
+      step: {
+        current: 'implement',
+        index: 2,
+        status: 'in_progress',
+      },
+    },
+    ...overrides,
+  };
+}
+
+function createMockExecution(overrides: Partial<OrchestrationExecution> = {}): OrchestrationExecution {
+  return {
+    id: 'test-orch-id',
+    projectId: 'test-project',
+    status: 'running',
+    config: {
+      autoMerge: false,
+      skipDesign: false,
+      skipAnalyze: false,
+      autoHealEnabled: true,
+      maxHealAttempts: 3,
+      pauseBetweenBatches: false,
+      batchSizeFallback: 10,
+      additionalContext: '',
+      budget: {
+        maxTotal: 50,
+        maxPerBatch: 5,
+        healingBudget: 5,
+        decisionBudget: 2,
+      },
+    },
+    currentPhase: 'implement',
+    batches: {
+      total: 2,
+      current: 0,
+      items: [
+        { index: 0, section: 'Setup', taskIds: ['T001'], status: 'running', healAttempts: 0 },
+        { index: 1, section: 'Core', taskIds: ['T002'], status: 'pending', healAttempts: 0 },
+      ],
+    },
+    executions: {
+      implement: [],
+      healers: [],
+    },
+    startedAt: new Date().toISOString(),
+    updatedAt: new Date().toISOString(),
+    decisionLog: [],
+    totalCostUsd: 0,
+    ...overrides,
+  };
+}
+
+// =============================================================================
+// Orchestration State Validation Tests (G7.1-G7.3)
+// =============================================================================
+
+describe('validateOrchestrationState', () => {
+  it('returns no issues for valid state', () => {
+    const state = createMockState();
+    const issues = validateOrchestrationState(state);
+    expect(issues).toHaveLength(0);
+  });
+
+  it('detects missing active phase', () => {
+    const state = createMockState({
+      orchestration: {
+        phase: {},
+        step: { current: 'implement', index: 2, status: 'in_progress' },
+      },
+    });
+    const issues = validateOrchestrationState(state);
+    expect(issues.some((i) => i.code === 'NO_ACTIVE_PHASE')).toBe(true);
+  });
+
+  it('G7.2: detects invalid step', () => {
+    const state = createMockState({
+      orchestration: {
+        phase: { number: '1057' },
+        step: { current: 'invalid_step' as any, index: 99, status: 'in_progress' },
+      },
+    });
+    const issues = validateOrchestrationState(state);
+    expect(issues.some((i) => i.code === 'INVALID_STEP')).toBe(true);
+  });
+
+  it('G7.3: detects invalid status', () => {
+    const state = createMockState({
+      orchestration: {
+        phase: { number: '1057' },
+        step: { current: 'implement', index: 2, status: 'invalid_status' as any },
+      },
+    });
+    const issues = validateOrchestrationState(state);
+    expect(issues.some((i) => i.code === 'INVALID_STATUS')).toBe(true);
+  });
+
+  it('G7.1: detects step index mismatch', () => {
+    const state = createMockState({
+      orchestration: {
+        phase: { number: '1057' },
+        step: { current: 'implement', index: 0, status: 'in_progress' }, // Should be 2
+      },
+    });
+    const issues = validateOrchestrationState(state);
+    expect(issues.some((i) => i.code === 'STEP_INDEX_MISMATCH')).toBe(true);
+  });
+});
+
+// =============================================================================
+// Execution State Validation Tests (G7.4-G7.6)
+// =============================================================================
+
+describe('validateExecutionState', () => {
+  it('returns no issues for valid execution', () => {
+    const execution = createMockExecution();
+    const issues = validateExecutionState(execution);
+    expect(issues).toHaveLength(0);
+  });
+
+  it('G7.4: detects batch index mismatch', () => {
+    const execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 0,
+        items: [
+          { index: 1, section: 'Setup', taskIds: ['T001'], status: 'running', healAttempts: 0 }, // Wrong index
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'pending', healAttempts: 0 },
+        ],
+      },
+    });
+    const issues = validateExecutionState(execution);
+    expect(issues.some((i) => i.code === 'BATCH_INDEX_MISMATCH')).toBe(true);
+  });
+
+  it('G7.5: detects batches.current out of bounds', () => {
+    const execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 5, // Out of bounds
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'running', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'pending', healAttempts: 0 },
+        ],
+      },
+    });
+    const issues = validateExecutionState(execution);
+    expect(issues.some((i) => i.code === 'BATCH_CURRENT_OUT_OF_BOUNDS')).toBe(true);
+  });
+
+  it('G7.5: allows batches.current >= total when all complete', () => {
+    const execution = createMockExecution({
+      batches: {
+        total: 2,
+        current: 2, // At end
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'completed', healAttempts: 0 },
+          { index: 1, section: 'Core', taskIds: ['T002'], status: 'completed', healAttempts: 0 },
+        ],
+      },
+    });
+    const issues = validateExecutionState(execution);
+    expect(issues.some((i) => i.code === 'BATCH_CURRENT_OUT_OF_BOUNDS')).toBe(false);
+  });
+
+  it('G7.6: detects missing recoveryContext when needs_attention', () => {
+    const execution = createMockExecution({
+      status: 'needs_attention',
+      recoveryContext: undefined,
+    });
+    const issues = validateExecutionState(execution);
+    expect(issues.some((i) => i.code === 'MISSING_RECOVERY_CONTEXT')).toBe(true);
+  });
+
+  it('G7.6: accepts needs_attention with recoveryContext', () => {
+    const execution = createMockExecution({
+      status: 'needs_attention',
+      recoveryContext: {
+        issue: 'Test issue',
+        options: ['retry', 'abort'],
+      },
+    });
+    const issues = validateExecutionState(execution);
+    expect(issues.some((i) => i.code === 'MISSING_RECOVERY_CONTEXT')).toBe(false);
+  });
+
+  it('detects invalid batch status', () => {
+    const execution = createMockExecution({
+      batches: {
+        total: 1,
+        current: 0,
+        items: [
+          { index: 0, section: 'Setup', taskIds: ['T001'], status: 'invalid' as any, healAttempts: 0 },
+        ],
+      },
+    });
+    const issues = validateExecutionState(execution);
+    expect(issues.some((i) => i.code === 'INVALID_BATCH_STATUS')).toBe(true);
+  });
+});
+
+// =============================================================================
+// Cross-File Consistency Tests (G7.7)
+// =============================================================================
+
+describe('validateCrossFileConsistency', () => {
+  it('returns no issues when state and execution match', () => {
+    const state = createMockState();
+    const execution = createMockExecution();
+    const issues = validateCrossFileConsistency(state, execution);
+    expect(issues).toHaveLength(0);
+  });
+
+  it('G7.7: detects step/phase mismatch', () => {
+    const state = createMockState({
+      orchestration: {
+        phase: { number: '1057' },
+        step: { current: 'design', index: 0, status: 'in_progress' },
+      },
+    });
+    const execution = createMockExecution({
+      currentPhase: 'implement', // Mismatch
+    });
+    const issues = validateCrossFileConsistency(state, execution);
+    expect(issues.some((i) => i.code === 'STEP_PHASE_MISMATCH')).toBe(true);
+  });
+
+  it('ignores mismatch when execution phase is complete', () => {
+    const state = createMockState();
+    const execution = createMockExecution({
+      currentPhase: 'complete',
+    });
+    const issues = validateCrossFileConsistency(state, execution);
+    expect(issues.some((i) => i.code === 'STEP_PHASE_MISMATCH')).toBe(false);
+  });
+});
+
+// =============================================================================
+// Combined Validation Tests
+// =============================================================================
+
+describe('validateState', () => {
+  it('returns valid=true for valid state', () => {
+    const state = createMockState();
+    const execution = createMockExecution();
+    const result = validateState(state, execution);
+    expect(result.valid).toBe(true);
+    expect(result.issues).toHaveLength(0);
+    expect(result.severity).toBe('none');
+  });
+
+  it('returns valid=false with issues for invalid state', () => {
+    const state = createMockState({
+      orchestration: {
+        phase: {},
+        step: { current: 'invalid' as any, index: 99, status: 'invalid' as any },
+      },
+    });
+    const execution = createMockExecution({
+      status: 'needs_attention',
+      recoveryContext: undefined,
+    });
+    const result = validateState(state, execution);
+    expect(result.valid).toBe(false);
+    expect(result.issues.length).toBeGreaterThan(0);
+    expect(result.severity).toBe('error');
+  });
+
+  it('returns warning severity when only warnings present', () => {
+    const state = createMockState({
+      orchestration: {
+        phase: { number: '1057' },
+        step: { current: 'implement', index: 0, status: 'in_progress' }, // Wrong index (warning)
+      },
+    });
+    const execution = createMockExecution();
+    const result = validateState(state, execution);
+    expect(result.severity).toBe('warning');
+  });
+});
+
+describe('getDetailedValidationIssues', () => {
+  it('returns issues with codes and suggested fixes', () => {
+    const state = createMockState({
+      orchestration: {
+        phase: { number: '1057' },
+        step: { current: 'implement', index: 0, status: 'in_progress' },
+      },
+    });
+    const execution = createMockExecution();
+    const issues = getDetailedValidationIssues(state, execution);
+
+    const stepIndexIssue = issues.find((i) => i.code === 'STEP_INDEX_MISMATCH');
+    expect(stepIndexIssue).toBeDefined();
+    expect(stepIndexIssue?.suggestedFix).toContain('2'); // Should suggest index 2
+  });
+});
diff --git a/packages/shared/src/schemas/events.ts b/packages/shared/src/schemas/events.ts
index 6e767e6..ab8a7a8 100644
--- a/packages/shared/src/schemas/events.ts
+++ b/packages/shared/src/schemas/events.ts
@@ -1,7 +1,7 @@
 import { z } from 'zod';
 import { RegistrySchema } from './registry.js';
 import { TasksDataSchema } from './tasks.js';
-import { WorkflowDataSchema } from './workflow.js';
+import { WorkflowDataSchema, QuestionOptionSchema } from './workflow.js';
 import { PhasesDataSchema } from './phases.js';
 
 /**
@@ -151,17 +151,106 @@ export const OrchestrationStateSchema = z.object({
 
 export type StepStatus = z.infer<typeof StepStatusSchema>;
 
+/**
+ * Session message schema for real-time session content
+ * Matches the structure in session-parser.ts
+ */
+export const ToolCallInfoSchema = z.object({
+  name: z.string(),
+  operation: z.enum(['read', 'write', 'edit', 'search', 'execute', 'todo', 'agent']),
+  files: z.array(z.string()),
+  input: z.record(z.string(), z.unknown()).optional(),
+});
+
+/**
+ * Agent task information from Task tool calls
+ */
+export const AgentTaskInfoSchema = z.object({
+  id: z.string(),
+  description: z.string(),
+  subagentType: z.string(),
+  status: z.enum(['running', 'completed']),
+});
+
+export const SessionMessageSchema = z.object({
+  role: z.enum(['user', 'assistant', 'system']),
+  content: z.string(),
+  timestamp: z.string().optional(),
+  toolCalls: z.array(ToolCallInfoSchema).optional(),
+  isCommandInjection: z.boolean().optional(),
+  commandName: z.string().optional(),
+  isSessionEnd: z.boolean().optional(),
+  questions: z.array(z.object({
+    question: z.string(),
+    header: z.string().optional(),
+    options: z.array(z.object({
+      label: z.string(),
+      description: z.string().optional(),
+    })),
+    multiSelect: z.boolean().optional(),
+  })).optional(),
+  agentTasks: z.array(AgentTaskInfoSchema).optional(),
+});
+
+export const TodoItemSchema = z.object({
+  content: z.string(),
+  status: z.enum(['pending', 'in_progress', 'completed']),
+  activeForm: z.string(),
+});
+
+/**
+ * Question from AskUserQuestion tool call (for session:question SSE events)
+ * Uses QuestionOptionSchema from workflow.ts for consistency
+ */
+export const SessionQuestionSchema = z.object({
+  question: z.string(),
+  header: z.string().optional(),
+  options: z.array(QuestionOptionSchema),
+  multiSelect: z.boolean().optional(),
+});
+
+/**
+ * Workflow output from StructuredOutput tool call
+ */
+export const WorkflowOutputSchema = z.object({
+  status: z.string(), // 'completed' | 'error' | 'needs_input' | 'cancelled' | etc.
+  phase: z.string().optional(),
+  message: z.string().optional(),
+  artifacts: z.array(z.object({
+    path: z.string(),
+    action: z.string(),
+  })).optional(),
+  questions: z.array(SessionQuestionSchema).optional(),
+});
+
+/**
+ * Session content structure for SSE
+ */
+export const SessionContentSchema = z.object({
+  messages: z.array(SessionMessageSchema),
+  filesModified: z.array(z.string()),
+  elapsedMs: z.number(),
+  currentTodos: z.array(TodoItemSchema),
+  workflowOutput: WorkflowOutputSchema.optional(),
+  agentTasks: z.array(AgentTaskInfoSchema).optional(),
+});
+
 /**
  * SSE Event Types
  */
 export const SSEEventTypeSchema = z.enum([
-  'connected',    // Initial connection established
-  'heartbeat',    // Keep-alive ping
-  'registry',     // Registry file changed
-  'state',        // Project state file changed
-  'tasks',        // Project tasks.md file changed
-  'workflow',     // Project workflow index changed
-  'phases',       // Project ROADMAP.md phases changed
+  'connected',        // Initial connection established
+  'heartbeat',        // Keep-alive ping
+  'registry',         // Registry file changed
+  'state',            // Project state file changed
+  'tasks',            // Project tasks.md file changed
+  'workflow',         // Project workflow index changed
+  'phases',           // Project ROADMAP.md phases changed
+  'session:message',  // Session JSONL content changed
+  'session:question', // AskUserQuestion detected
+  'session:end',      // Session ended
+  'session:created',  // New session JSONL file detected (G6.4)
+  'session:activity', // Existing session JSONL file modified (G6.5)
 ]);
 
 /**
@@ -229,6 +318,60 @@ export const PhasesEventSchema = z.object({
   data: PhasesDataSchema,
 });
 
+/**
+ * Session message event - session JSONL content changed
+ */
+export const SessionMessageEventSchema = z.object({
+  type: z.literal('session:message'),
+  timestamp: z.string(),
+  projectId: z.string(),
+  sessionId: z.string(),
+  data: SessionContentSchema,
+});
+
+/**
+ * Session question event - AskUserQuestion detected
+ */
+export const SessionQuestionEventSchema = z.object({
+  type: z.literal('session:question'),
+  timestamp: z.string(),
+  projectId: z.string(),
+  sessionId: z.string(),
+  data: z.object({
+    questions: z.array(SessionQuestionSchema),
+  }),
+});
+
+/**
+ * Session end event - session ended
+ */
+export const SessionEndEventSchema = z.object({
+  type: z.literal('session:end'),
+  timestamp: z.string(),
+  projectId: z.string(),
+  sessionId: z.string(),
+});
+
+/**
+ * Session created event - new session JSONL file detected (G6.4)
+ */
+export const SessionCreatedEventSchema = z.object({
+  type: z.literal('session:created'),
+  timestamp: z.string(),
+  projectId: z.string(),
+  sessionId: z.string(),
+});
+
+/**
+ * Session activity event - existing session JSONL file modified (G6.5)
+ */
+export const SessionActivityEventSchema = z.object({
+  type: z.literal('session:activity'),
+  timestamp: z.string(),
+  projectId: z.string(),
+  sessionId: z.string(),
+});
+
 /**
  * Union of all SSE event types
  */
@@ -240,6 +383,11 @@ export const SSEEventSchema = z.discriminatedUnion('type', [
   TasksEventSchema,
   WorkflowSSEEventSchema,
   PhasesEventSchema,
+  SessionMessageEventSchema,
+  SessionQuestionEventSchema,
+  SessionEndEventSchema,
+  SessionCreatedEventSchema,
+  SessionActivityEventSchema,
 ]);
 
 // Type exports
@@ -251,5 +399,18 @@ export type StateEvent = z.infer<typeof StateEventSchema>;
 export type TasksEvent = z.infer<typeof TasksEventSchema>;
 export type WorkflowSSEEvent = z.infer<typeof WorkflowSSEEventSchema>;
 export type PhasesEvent = z.infer<typeof PhasesEventSchema>;
+export type SessionMessageEvent = z.infer<typeof SessionMessageEventSchema>;
+export type SessionQuestionEvent = z.infer<typeof SessionQuestionEventSchema>;
+export type SessionEndEvent = z.infer<typeof SessionEndEventSchema>;
+export type SessionCreatedEvent = z.infer<typeof SessionCreatedEventSchema>;
+export type SessionActivityEvent = z.infer<typeof SessionActivityEventSchema>;
 export type SSEEvent = z.infer<typeof SSEEventSchema>;
 export type OrchestrationState = z.infer<typeof OrchestrationStateSchema>;
+export type ToolCallInfo = z.infer<typeof ToolCallInfoSchema>;
+export type AgentTaskInfo = z.infer<typeof AgentTaskInfoSchema>;
+export type SessionMessage = z.infer<typeof SessionMessageSchema>;
+export type TodoItem = z.infer<typeof TodoItemSchema>;
+// QuestionOption is exported from workflow.ts
+export type SessionQuestion = z.infer<typeof SessionQuestionSchema>;
+export type WorkflowOutput = z.infer<typeof WorkflowOutputSchema>;
+export type SessionContent = z.infer<typeof SessionContentSchema>;
diff --git a/packages/shared/src/schemas/index.ts b/packages/shared/src/schemas/index.ts
index 41d2c94..34ce5ca 100644
--- a/packages/shared/src/schemas/index.ts
+++ b/packages/shared/src/schemas/index.ts
@@ -17,12 +17,24 @@ export {
   TasksEventSchema,
   WorkflowSSEEventSchema,
   PhasesEventSchema,
+  SessionMessageEventSchema,
+  SessionQuestionEventSchema,
+  SessionEndEventSchema,
+  SessionCreatedEventSchema,
+  SessionActivityEventSchema,
   OrchestrationStateSchema,
   StepStatusSchema,
   WorkflowStepSchema,
   PhaseStatusSchema,
   UserGateStatusSchema,
   STEP_INDEX_MAP,
+  ToolCallInfoSchema,
+  AgentTaskInfoSchema,
+  SessionMessageSchema,
+  TodoItemSchema,
+  SessionQuestionSchema,
+  WorkflowOutputSchema,
+  SessionContentSchema,
   type SSEEventType,
   type SSEEvent,
   type ConnectedEvent,
@@ -32,8 +44,20 @@ export {
   type TasksEvent,
   type WorkflowSSEEvent,
   type PhasesEvent,
+  type SessionMessageEvent,
+  type SessionQuestionEvent,
+  type SessionEndEvent,
+  type SessionCreatedEvent,
+  type SessionActivityEvent,
   type OrchestrationState,
   type StepStatus,
+  type ToolCallInfo,
+  type AgentTaskInfo,
+  type SessionMessage,
+  type TodoItem,
+  type SessionQuestion,
+  type WorkflowOutput,
+  type SessionContent,
 } from './events.js';
 
 export {
diff --git a/packages/shared/src/schemas/orchestration-config.ts b/packages/shared/src/schemas/orchestration-config.ts
index a1bb83a..cd7274a 100644
--- a/packages/shared/src/schemas/orchestration-config.ts
+++ b/packages/shared/src/schemas/orchestration-config.ts
@@ -31,6 +31,10 @@ export const OrchestrationConfigSchema = z.object({
   skipDesign: z.boolean().default(false),
   /** Skip /flow.analyze step */
   skipAnalyze: z.boolean().default(false),
+  /** Skip /flow.implement if all tasks are already complete */
+  skipImplement: z.boolean().default(false),
+  /** Skip /flow.verify if verify step is already complete */
+  skipVerify: z.boolean().default(false),
 
   // Advanced options (collapsed section in modal)
   /** Attempt automatic recovery on batch failure */
@@ -56,6 +60,8 @@ export const DEFAULT_ORCHESTRATION_CONFIG: OrchestrationConfig = {
   additionalContext: '',
   skipDesign: false,
   skipAnalyze: false,
+  skipImplement: false,
+  skipVerify: false,
   autoHealEnabled: true,
   maxHealAttempts: 1,
   batchSizeFallback: 15,
diff --git a/packages/shared/src/schemas/orchestration-execution.ts b/packages/shared/src/schemas/orchestration-execution.ts
index 55ac79e..4219279 100644
--- a/packages/shared/src/schemas/orchestration-execution.ts
+++ b/packages/shared/src/schemas/orchestration-execution.ts
@@ -120,6 +120,17 @@ export const OrchestrationExecutionSchema = z.object({
 
 export type OrchestrationExecution = z.infer<typeof OrchestrationExecutionSchema>;
 
+/**
+ * Determine the starting phase based on config skip flags
+ */
+function getStartingPhase(config: z.infer<typeof OrchestrationConfigSchema>): z.infer<typeof OrchestrationPhaseSchema> {
+  if (!config.skipDesign) return 'design';
+  if (!config.skipAnalyze) return 'analyze';
+  if (!config.skipImplement) return 'implement';
+  if (!config.skipVerify) return 'verify';
+  return 'merge';
+}
+
 /**
  * Create a new orchestration execution with defaults
  */
@@ -135,7 +146,7 @@ export function createOrchestrationExecution(
     projectId,
     status: 'running',
     config,
-    currentPhase: config.skipDesign ? (config.skipAnalyze ? 'implement' : 'analyze') : 'design',
+    currentPhase: getStartingPhase(config),
     batches,
     executions: {
       implement: [],
diff --git a/packages/shared/src/schemas/workflow.ts b/packages/shared/src/schemas/workflow.ts
index 9d795be..7519e9d 100644
--- a/packages/shared/src/schemas/workflow.ts
+++ b/packages/shared/src/schemas/workflow.ts
@@ -32,7 +32,7 @@ export type WorkflowEvent = z.infer<typeof WorkflowEventSchema>;
  */
 export const QuestionOptionSchema = z.object({
   label: z.string(),
-  description: z.string(),
+  description: z.string().optional(),
 });
 
 export type QuestionOption = z.infer<typeof QuestionOptionSchema>;
diff --git a/pnpm-lock.yaml b/pnpm-lock.yaml
index ea02ec9..13d4164 100644
--- a/pnpm-lock.yaml
+++ b/pnpm-lock.yaml
@@ -104,6 +104,9 @@ importers:
       tailwind-merge:
         specifier: ^3.4.0
         version: 3.4.0
+      uuid:
+        specifier: ^13.0.0
+        version: 13.0.0
       zod:
         specifier: ^3.25.76
         version: 3.25.76
@@ -123,6 +126,9 @@ importers:
       '@types/react-syntax-highlighter':
         specifier: ^15.5.13
         version: 15.5.13
+      '@types/uuid':
+        specifier: ^11.0.0
+        version: 11.0.0
       autoprefixer:
         specifier: ^10.4.23
         version: 10.4.23(postcss@8.5.6)
@@ -1371,6 +1377,10 @@ packages:
   '@types/unist@3.0.3':
     resolution: {integrity: sha512-ko/gIFJRv177XgZsZcBwnqJN5x/Gien8qNOn0D5bQU/zAzVf9Zt3BlcUiLqhV9y4ARk0GbT3tnUiPNgnTXzc/Q==}
 
+  '@types/uuid@11.0.0':
+    resolution: {integrity: sha512-HVyk8nj2m+jcFRNazzqyVKiZezyhDKrGUA3jlEcg/nZ6Ms+qHwocba1Y/AaVaznJTAM9xpdFSh+ptbNrhOGvZA==}
+    deprecated: This is a stub types definition. uuid provides its own type definitions, so you do not need this installed.
+
   '@typescript-eslint/eslint-plugin@8.53.0':
     resolution: {integrity: sha512-eEXsVvLPu8Z4PkFibtuFJLJOTAV/nPdgtSjkGoPpddpFk3/ym2oy97jynY6ic2m6+nc5M8SE1e9v/mHKsulcJg==}
     engines: {node: ^18.18.0 || ^20.9.0 || >=21.1.0}
@@ -3504,6 +3514,10 @@ packages:
   util-deprecate@1.0.2:
     resolution: {integrity: sha512-EPD5q1uXyFxJpCrLnCc1nHnq3gOa6DZBocAIiI2TaSCA7VCJ1UJDMagCzIkXNsUYfD1daK//LTEQ8xiIbrHtcw==}
 
+  uuid@13.0.0:
+    resolution: {integrity: sha512-XQegIaBTVUjSHliKqcnFqYypAd4S+WCYt5NIeRs6w/UAry7z8Y9j5ZwRRL4kzq9U3sD6v+85er9FvkEaBpji2w==}
+    hasBin: true
+
   vfile-message@4.0.3:
     resolution: {integrity: sha512-QTHzsGd1EhbZs4AsQ20JX1rC3cOlt/IWJruk893DfLRr57lcnOeMaWG4K0JrRta4mIJZKth2Au3mM3u03/JWKw==}
 
@@ -4624,6 +4638,10 @@ snapshots:
 
   '@types/unist@3.0.3': {}
 
+  '@types/uuid@11.0.0':
+    dependencies:
+      uuid: 13.0.0
+
   '@typescript-eslint/eslint-plugin@8.53.0(@typescript-eslint/parser@8.53.0(eslint@9.39.2(jiti@1.21.7))(typescript@5.9.3))(eslint@9.39.2(jiti@1.21.7))(typescript@5.9.3)':
     dependencies:
       '@eslint-community/regexpp': 4.12.2
@@ -7409,6 +7427,8 @@ snapshots:
 
   util-deprecate@1.0.2: {}
 
+  uuid@13.0.0: {}
+
   vfile-message@4.0.3:
     dependencies:
       '@types/unist': 3.0.3