diff --git a/.github/workflows/publish.yml b/.github/workflows/publish.yml
index bc639d047..d80c7998d 100644
--- a/.github/workflows/publish.yml
+++ b/.github/workflows/publish.yml
@@ -12,7 +12,6 @@ on:
           - main
           - cli-prerelease
           - sdk
-          - workflow-types
           - sdk-py
           - brand
         default: 'all'
@@ -687,7 +686,6 @@ jobs:
           (cd packages/config && npm pack --ignore-scripts --pack-destination "$TARBALLS")
           (cd packages/github-primitive && npm pack --ignore-scripts --pack-destination "$TARBALLS")
           (cd packages/slack-primitive && npm pack --ignore-scripts --pack-destination "$TARBALLS")
-          (cd packages/workflow-types && npm pack --ignore-scripts --pack-destination "$TARBALLS")
           ls -lh "$TARBALLS"
 
       - name: Install tarballs into scratch project
@@ -705,11 +703,10 @@ jobs:
           CONFIG_TGZ=$(ls "$TARBALLS"/agent-relay-config-*.tgz | head -n1)
           GITHUB_PRIMITIVE_TGZ=$(ls "$TARBALLS"/agent-relay-github-primitive-*.tgz | head -n1)
           SLACK_PRIMITIVE_TGZ=$(ls "$TARBALLS"/agent-relay-slack-primitive-*.tgz | head -n1)
-          WORKFLOW_TYPES_TGZ=$(ls "$TARBALLS"/agent-relay-workflow-types-*.tgz | head -n1)
-          echo "Installing $SDK_TGZ + $BROKER_TGZ + $CLOUD_TGZ + $CONFIG_TGZ + $GITHUB_PRIMITIVE_TGZ + $SLACK_PRIMITIVE_TGZ + $WORKFLOW_TYPES_TGZ"
+          echo "Installing $SDK_TGZ + $BROKER_TGZ + $CLOUD_TGZ + $CONFIG_TGZ + $GITHUB_PRIMITIVE_TGZ + $SLACK_PRIMITIVE_TGZ"
           npm install --ignore-scripts --no-audit --no-fund \
             "$SDK_TGZ" "$BROKER_TGZ" "$CLOUD_TGZ" "$CONFIG_TGZ" \
-            "$GITHUB_PRIMITIVE_TGZ" "$SLACK_PRIMITIVE_TGZ" "$WORKFLOW_TYPES_TGZ"
+            "$GITHUB_PRIMITIVE_TGZ" "$SLACK_PRIMITIVE_TGZ"
           ls node_modules/@agent-relay/
 
       - name: Resolver smoke — getBrokerBinaryPath()
@@ -763,13 +760,12 @@ jobs:
           CONFIG_TGZ=$(ls "$TARBALLS"/agent-relay-config-*.tgz | head -n1)
           GITHUB_PRIMITIVE_TGZ=$(ls "$TARBALLS"/agent-relay-github-primitive-*.tgz | head -n1)
           SLACK_PRIMITIVE_TGZ=$(ls "$TARBALLS"/agent-relay-slack-primitive-*.tgz | head -n1)
-          WORKFLOW_TYPES_TGZ=$(ls "$TARBALLS"/agent-relay-workflow-types-*.tgz | head -n1)
           # Install SDK + every internal required dep whose bumped version
           # isn't on the registry yet, but skip the broker optional deps
           # entirely. The resolver should return null and spawn() should
           # throw the clear error.
           npm install --ignore-scripts --no-audit --no-fund --no-optional \
-            "$SDK_TGZ" "$CLOUD_TGZ" "$CONFIG_TGZ" "$GITHUB_PRIMITIVE_TGZ" "$SLACK_PRIMITIVE_TGZ" "$WORKFLOW_TYPES_TGZ"
+            "$SDK_TGZ" "$CLOUD_TGZ" "$CONFIG_TGZ" "$GITHUB_PRIMITIVE_TGZ" "$SLACK_PRIMITIVE_TGZ"
           node --input-type=module -e "
             import { AgentRelayClient } from '@agent-relay/sdk';
             try {
@@ -808,7 +804,6 @@ jobs:
           - events
           - github-primitive
           - slack-primitive
-          - workflow-types
 
     steps:
       - name: Checkout code
@@ -847,52 +842,6 @@ jobs:
           fi
           npm publish --access public --provenance --tag ${{ github.event.inputs.tag }} --ignore-scripts
 
-  # Publish workflow-types only. This is intentionally narrow: it repairs
-  # already-published SDK versions whose exact-version workflow-types package
-  # was missing, without attempting to republish @agent-relay/sdk.
-  publish-workflow-types-only:
-    name: Publish Workflow Types to NPM
-    needs: build
-    runs-on: ubuntu-latest
-    if: github.event.inputs.package == 'workflow-types'
-
-    steps:
-      - name: Checkout code
-        uses: actions/checkout@v4
-
-      - name: Setup Node.js
-        uses: actions/setup-node@v4
-        with:
-          node-version: '22.14.0'
-          registry-url: 'https://registry.npmjs.org'
-
-      - name: Download build artifacts
-        uses: actions/download-artifact@v4
-        with:
-          name: build-output
-          path: .
-
-      - name: Update npm for OIDC support
-        run: npm install -g npm@latest
-
-      - name: Dry run check
-        if: github.event.inputs.dry_run == 'true'
-        working-directory: packages/workflow-types
-        run: npm publish --dry-run --access public --tag ${{ github.event.inputs.tag }} --ignore-scripts
-
-      - name: Publish Workflow Types to NPM
-        if: github.event.inputs.dry_run != 'true'
-        working-directory: packages/workflow-types
-        run: |
-          set -euo pipefail
-          PKG_NAME=$(node -p "require('./package.json').name")
-          PKG_VERSION=$(node -p "require('./package.json').version")
-          if npm view "${PKG_NAME}@${PKG_VERSION}" version >/dev/null 2>&1; then
-            echo "${PKG_NAME}@${PKG_VERSION} already exists on npm; skipping publish"
-            exit 0
-          fi
-          npm publish --access public --provenance --tag ${{ github.event.inputs.tag }} --ignore-scripts
-
   # Publish the per-platform broker packages first. @agent-relay/sdk declares
   # these as exact-version optionalDependencies, so they must exist on the
   # registry at the matching version before the SDK is published — otherwise
@@ -2305,7 +2254,6 @@ jobs:
         verify-acp-macos,
         smoke-broker-packages,
         publish-sdk-internal-deps,
-        publish-workflow-types-only,
         publish-broker-packages,
         publish-packages,
         publish-brand-only,
@@ -2351,7 +2299,6 @@ jobs:
           echo "| Verify relay-acp (macOS) | ${{ needs.verify-acp-macos.result == 'success' && '✅' || (needs.verify-acp-macos.result == 'skipped' && '⏭️' || '❌') }} ${{ needs.verify-acp-macos.result }} |" >> $GITHUB_STEP_SUMMARY
           echo "| Smoke Broker Packages | ${{ needs.smoke-broker-packages.result == 'success' && '✅' || (needs.smoke-broker-packages.result == 'skipped' && '⏭️' || '❌') }} ${{ needs.smoke-broker-packages.result }} |" >> $GITHUB_STEP_SUMMARY
           echo "| Publish SDK Internal Deps | ${{ needs.publish-sdk-internal-deps.result == 'success' && '✅' || (needs.publish-sdk-internal-deps.result == 'skipped' && '⏭️' || '❌') }} ${{ needs.publish-sdk-internal-deps.result }} |" >> $GITHUB_STEP_SUMMARY
-          echo "| Publish Workflow Types Only | ${{ needs.publish-workflow-types-only.result == 'success' && '✅' || (needs.publish-workflow-types-only.result == 'skipped' && '⏭️' || '❌') }} ${{ needs.publish-workflow-types-only.result }} |" >> $GITHUB_STEP_SUMMARY
           echo "| Publish Broker Packages | ${{ needs.publish-broker-packages.result == 'success' && '✅' || (needs.publish-broker-packages.result == 'skipped' && '⏭️' || '❌') }} ${{ needs.publish-broker-packages.result }} |" >> $GITHUB_STEP_SUMMARY
           echo "| Publish Packages | ${{ needs.publish-packages.result == 'success' && '✅' || (needs.publish-packages.result == 'skipped' && '⏭️' || '❌') }} ${{ needs.publish-packages.result }} |" >> $GITHUB_STEP_SUMMARY
           echo "| Publish Brand | ${{ needs.publish-brand-only.result == 'success' && '✅' || (needs.publish-brand-only.result == 'skipped' && '⏭️' || '❌') }} ${{ needs.publish-brand-only.result }} |" >> $GITHUB_STEP_SUMMARY
diff --git a/.github/workflows/relay-cleanroom-hardening.yml b/.github/workflows/relay-cleanroom-hardening.yml
deleted file mode 100644
index b7ffd3112..000000000
--- a/.github/workflows/relay-cleanroom-hardening.yml
+++ /dev/null
@@ -1,82 +0,0 @@
-name: Relay Clean-Room Hardening
-
-on:
-  pull_request:
-    branches: [main]
-    paths:
-      - 'install.sh'
-      - 'packages/**'
-      - '!packages/sdk-swift/**'
-      - 'workflows/relay-e2e-meta-workflow.ts'
-      - 'workflows/relay-clean-room-e2e-validation.ts'
-      - 'scripts/run-relay-cleanroom-ci.sh'
-      - '.github/workflows/relay-cleanroom-hardening.yml'
-  workflow_dispatch:
-
-concurrency:
-  group: ${{ github.workflow }}-${{ github.ref }}
-  cancel-in-progress: true
-
-env:
-  AGENT_RELAY_TELEMETRY_DISABLED: 1
-
-jobs:
-  cleanroom-hardening:
-    name: Clean-Room Hardening (${{ matrix.os }})
-    runs-on: ${{ matrix.os }}
-    strategy:
-      fail-fast: false
-      matrix:
-        os: [macos-latest]
-    timeout-minutes: 20
-
-    permissions:
-      contents: read
-
-    steps:
-      - name: Checkout repository
-        uses: actions/checkout@v4
-
-      - name: Setup Node.js
-        uses: actions/setup-node@v4
-        with:
-          node-version: '22'
-          cache: 'npm'
-
-      - name: Install dependencies
-        run: npm ci
-
-      - name: Build local CLI/runtime
-        run: npm run build
-
-      - name: Link local CLI
-        run: cd packages/cli && npm link
-
-      - name: Verify CLI
-        run: agent-relay --version
-
-      - name: Run clean-room hardening validator
-        env:
-          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
-        run: bash scripts/run-relay-cleanroom-ci.sh
-
-      - name: Upload clean-room artifacts
-        if: always()
-        uses: actions/upload-artifact@v4
-        with:
-          name: relay-cleanroom-${{ matrix.os }}
-          path: .e2e-artifacts/
-          if-no-files-found: warn
-
-      - name: Append job summary
-        if: always()
-        run: |
-          if [ -f .e2e-artifacts/ci-summary.md ]; then
-            cat .e2e-artifacts/ci-summary.md >> "$GITHUB_STEP_SUMMARY"
-          else
-            echo "No CI summary produced." >> "$GITHUB_STEP_SUMMARY"
-          fi
-          if [ -f .e2e-artifacts/verdict.md ]; then
-            printf '\n## Reviewer Verdict\n\n' >> "$GITHUB_STEP_SUMMARY"
-            cat .e2e-artifacts/verdict.md >> "$GITHUB_STEP_SUMMARY"
-          fi
diff --git a/.github/workflows/workflow-reliability.yml b/.github/workflows/workflow-reliability.yml
deleted file mode 100644
index 5e1f72b76..000000000
--- a/.github/workflows/workflow-reliability.yml
+++ /dev/null
@@ -1,54 +0,0 @@
-name: Workflow Reliability
-
-on:
-  pull_request:
-    branches: [main]
-    paths:
-      - '.github/workflows/workflow-reliability.yml'
-      - 'packages/sdk/src/workflows/**'
-      - 'packages/sdk/package.json'
-      - 'packages/workflow-types/**'
-      - 'package-lock.json'
-      - 'package.json'
-  push:
-    branches: [main]
-    paths:
-      - '.github/workflows/workflow-reliability.yml'
-      - 'packages/sdk/src/workflows/**'
-      - 'packages/sdk/package.json'
-      - 'packages/workflow-types/**'
-      - 'package-lock.json'
-      - 'package.json'
-
-concurrency:
-  group: ${{ github.workflow }}-${{ github.ref }}
-  cancel-in-progress: true
-
-jobs:
-  workflow-reliability:
-    name: SDK Workflow Reliability
-    runs-on: ubuntu-latest
-    env:
-      NPM_CONFIG_FUND: false
-
-    steps:
-      - name: Checkout repository
-        uses: actions/checkout@v4
-
-      - name: Setup Node.js
-        uses: actions/setup-node@v4
-        with:
-          node-version: '22'
-          cache: 'npm'
-
-      - name: Install dependencies
-        run: npm ci
-
-      - name: Typecheck SDK workflows
-        run: npm --prefix packages/sdk run check
-
-      - name: Run workflow reliability contract matrix
-        run: |
-          npx vitest run --root packages/sdk --config vitest.config.ts \
-            src/workflows/__tests__/workflow-reliability-contract.test.ts \
-            src/workflows/__tests__/workflow-reliability-e2e.test.ts
diff --git a/.github/workflows/workflow-validation.yml b/.github/workflows/workflow-validation.yml
deleted file mode 100644
index 5117abaa3..000000000
--- a/.github/workflows/workflow-validation.yml
+++ /dev/null
@@ -1,72 +0,0 @@
-name: Workflow Validation
-
-on:
-  pull_request:
-    branches: [main]
-    paths:
-      - 'workflows/**'
-
-concurrency:
-  group: ${{ github.workflow }}-${{ github.ref }}
-  cancel-in-progress: true
-
-jobs:
-  validate:
-    name: Validate & Dry Run
-    runs-on: ubuntu-latest
-    env:
-      NPM_CONFIG_FUND: false
-
-    steps:
-      - name: Checkout repository
-        uses: actions/checkout@v4
-        with:
-          fetch-depth: 0
-
-      - name: Setup Node.js
-        uses: actions/setup-node@v4
-        with:
-          node-version: '22'
-          cache: 'npm'
-
-      - name: Cache node_modules
-        id: cache-modules
-        uses: actions/cache@v4
-        with:
-          path: |
-            node_modules
-            packages/*/node_modules
-          key: modules-${{ hashFiles('package-lock.json') }}
-
-      - name: Install dependencies
-        if: steps.cache-modules.outputs.cache-hit != 'true'
-        run: npm ci
-
-      - name: Build packages
-        run: npm run build
-
-      - name: Find changed workflow files
-        id: changed
-        env:
-          BASE_REF: ${{ github.base_ref }}
-        run: |
-          files=$(git diff --name-only "origin/$BASE_REF"...HEAD -- 'workflows/**' \
-            | grep -E '\.(ts|yaml|yml)$' || true)
-          echo "files<<EOF" >> "$GITHUB_OUTPUT"
-          echo "$files" >> "$GITHUB_OUTPUT"
-          echo "EOF" >> "$GITHUB_OUTPUT"
-          echo "Found: $files"
-
-      - name: Validate & dry run workflows
-        if: steps.changed.outputs.files != ''
-        env:
-          CHANGED_FILES: ${{ steps.changed.outputs.files }}
-        run: |
-          for f in $CHANGED_FILES; do
-            echo "=== $f ==="
-            if [[ "$f" == *.yaml || "$f" == *.yml ]]; then
-              npx tsx packages/sdk/src/workflows/cli.ts "$f" --validate
-              DRY_RUN=1 npx tsx packages/sdk/src/workflows/cli.ts "$f"
-            fi
-            echo ""
-          done
diff --git a/package.json b/package.json
index 0cf1b1adf..0d3f2726c 100644
--- a/package.json
+++ b/package.json
@@ -9,7 +9,7 @@
     "web"
   ],
   "scripts": {
-    "typecheck": "npm run build:config && npm --prefix packages/workflow-types run build && npm --prefix packages/github-primitive run build && npm --prefix packages/slack-primitive run build && npm --prefix packages/cloud run build && npm run build:utils && npm run build:trajectory && npm run build:policy && npm run build:sdk && npm run build:hooks && npm run build:memory && npm run build:telemetry && cd packages/cli && npx tsc --noEmit",
+    "typecheck": "npm run build:config && npm --prefix packages/github-primitive run build && npm --prefix packages/slack-primitive run build && npm --prefix packages/cloud run build && npm run build:utils && npm run build:trajectory && npm run build:policy && npm run build:sdk && npm run build:hooks && npm run build:memory && npm run build:telemetry && cd packages/cli && npx tsc --noEmit",
     "build": "npm run clean && npm run build:rust && turbo run build --filter='./packages/*'",
     "build:packages": "turbo run build --filter='./packages/*'",
     "build:packages:watch": "turbo run build --filter='./packages/*' --watch",
@@ -34,8 +34,7 @@
     "build:rust": "if command -v ~/.cargo/bin/cargo >/dev/null 2>&1; then ~/.cargo/bin/cargo build --release --bin agent-relay-broker && mkdir -p packages/sdk/bin && cp target/release/agent-relay-broker packages/sdk/bin/agent-relay-broker.new && mv -f packages/sdk/bin/agent-relay-broker.new packages/sdk/bin/agent-relay-broker && echo '✓ broker binary (agent-relay-broker) built and copied to packages/sdk/bin/'; else echo '⚠ Rust not installed, skipping local broker build; installs use platform optional dependencies'; fi",
     "start": "node packages/cli/dist/cli/index.js",
     "pretest": "npm run build",
-    "test": "vitest run && npm run test:sdk:vitest",
-    "test:sdk:vitest": "cd packages/sdk && vitest run --config vitest.config.ts src/workflows/__tests__/run-script.test.ts",
+    "test": "vitest run",
     "pretest:coverage": "npm run build",
     "test:coverage": "vitest run --coverage",
     "test:watch": "vitest",
diff --git a/packages/browser-primitive/examples/browser-workflow.ts b/packages/browser-primitive/examples/browser-workflow.ts
deleted file mode 100644
index 211a08610..000000000
--- a/packages/browser-primitive/examples/browser-workflow.ts
+++ /dev/null
@@ -1,138 +0,0 @@
-import { WorkflowRunner, type RelayYamlConfig } from '@agent-relay/sdk/workflows';
-
-import { BrowserStepExecutor, createBrowserStep } from '../src/workflow-step.js';
-
-const browserExecutor = new BrowserStepExecutor();
-
-const config: RelayYamlConfig = {
-  version: '1.0',
-  name: 'browser-primitive-workflow',
-  description: 'Browser primitive workflow with chained actions and captured output.',
-  swarm: {
-    pattern: 'pipeline',
-  },
-  agents: [],
-  workflows: [
-    {
-      name: 'browser-primitive-workflow',
-      steps: [
-        createBrowserStep({
-          name: 'inspect-example-page',
-          sessionId: 'example-page-session',
-          config: {
-            browser: 'chromium',
-            headless: true,
-            viewport: { width: 1280, height: 720 },
-            captureConsole: true,
-            persistSession: true,
-          },
-          actions: [
-            {
-              action: 'goto',
-              params: {
-                url: 'https://example.com',
-                waitUntil: 'domcontentloaded',
-              },
-            },
-            {
-              action: 'text',
-              id: 'heading',
-              params: {
-                selector: 'h1',
-                innerText: true,
-              },
-            },
-          ],
-          output: {
-            mode: 'last',
-            format: 'text',
-          },
-        }),
-        createBrowserStep({
-          name: 'use-captured-heading',
-          dependsOn: ['inspect-example-page'],
-          sessionId: 'example-page-session',
-          config: {
-            browser: 'chromium',
-            headless: true,
-            persistSession: true,
-          },
-          actions: [
-            {
-              action: 'evaluate',
-              params: {
-                script: '() => `Current title from the persisted session: ${document.title}`',
-              },
-            },
-          ],
-          output: {
-            mode: 'last',
-            format: 'text',
-          },
-        }),
-        createBrowserStep({
-          name: 'capture-page-report',
-          dependsOn: ['use-captured-heading'],
-          sessionId: 'example-page-session',
-          config: {
-            browser: 'chromium',
-            headless: true,
-            persistSession: true,
-          },
-          actions: [
-            {
-              action: 'evaluate',
-              id: 'pageFacts',
-              outputKey: 'pageFacts',
-              capture: true,
-              params: {
-                script: '() => ({ title: document.title, links: document.links.length })',
-              },
-            },
-            {
-              action: 'screenshot',
-              id: 'screenshot',
-              outputKey: 'screenshot',
-              capture: true,
-              params: {
-                path: 'artifacts/example-page.png',
-                fullPage: true,
-              },
-            },
-          ],
-          output: {
-            mode: 'captures',
-            includeMetadata: true,
-            includeSession: true,
-            pretty: true,
-          },
-          closeSession: true,
-        }),
-      ],
-    },
-  ],
-  errorHandling: {
-    strategy: 'fail-fast',
-  },
-};
-
-async function main(): Promise<void> {
-  const runner = new WorkflowRunner({
-    cwd: process.cwd(),
-    executor: browserExecutor,
-  });
-
-  const result = await runner.execute(config);
-  console.log(`Browser workflow completed: ${result.status}`);
-}
-
-if (process.argv[1] === new URL(import.meta.url).pathname) {
-  main()
-    .catch((error) => {
-      console.error(error instanceof Error ? error.stack : error);
-      process.exitCode = 1;
-    })
-    .finally(async () => {
-      await browserExecutor.closeAll();
-    });
-}
diff --git a/packages/browser-primitive/package.json b/packages/browser-primitive/package.json
index 6b5ca38ec..8bb5ff5ab 100644
--- a/packages/browser-primitive/package.json
+++ b/packages/browser-primitive/package.json
@@ -11,11 +11,6 @@
       "import": "./dist/index.js",
       "default": "./dist/index.js"
     },
-    "./workflow-step": {
-      "types": "./dist/workflow-step.d.ts",
-      "import": "./dist/workflow-step.js",
-      "default": "./dist/workflow-step.js"
-    },
     "./mcp-server": {
       "types": "./dist/mcp-server.d.ts",
       "import": "./dist/mcp-server.js",
diff --git a/packages/browser-primitive/src/index.ts b/packages/browser-primitive/src/index.ts
index 076627102..793880e77 100644
--- a/packages/browser-primitive/src/index.ts
+++ b/packages/browser-primitive/src/index.ts
@@ -1,6 +1,5 @@
 export { BrowserClient, type BrowserClientOptions } from './browser-client.js';
 export * from './types.js';
-export * from './workflow-step.js';
 export * from './mcp-server.js';
 
 export * from './actions/navigation.js';
diff --git a/packages/browser-primitive/src/mcp-server.ts b/packages/browser-primitive/src/mcp-server.ts
index 604da45cc..ac186cae4 100644
--- a/packages/browser-primitive/src/mcp-server.ts
+++ b/packages/browser-primitive/src/mcp-server.ts
@@ -10,12 +10,6 @@ import type {
   BrowserConfig,
   BrowserSession,
 } from './types.js';
-import {
-  BrowserStepExecutor,
-  type BrowserStepConfig,
-  type BrowserStepExecutionResult,
-} from './workflow-step.js';
-
 export type JsonRpcId = string | number | null;
 
 export interface JsonRpcRequest {
@@ -68,11 +62,6 @@ export interface BrowserActionsExecuteParams {
   config?: BrowserConfig;
 }
 
-export interface BrowserStepExecuteParams {
-  step: BrowserStepConfig;
-  workspaceId?: string;
-}
-
 export class BrowserMcpSessionManager {
   private readonly clients = new Map<string, BrowserClient>();
   private defaultSessionId?: string;
@@ -161,7 +150,6 @@ export class BrowserMcpServer {
   private readonly serverName: string;
   private readonly serverVersion: string;
   private readonly sessions: BrowserMcpSessionManager;
-  private readonly stepExecutor: BrowserStepExecutor;
   private rl?: ReadlineInterface;
 
   constructor(options: BrowserMcpServerOptions = {}) {
@@ -171,7 +159,6 @@ export class BrowserMcpServer {
     this.serverName = options.serverName ?? 'agent-relay-browser';
     this.serverVersion = options.serverVersion ?? '1.0.0';
     this.sessions = new BrowserMcpSessionManager(options.defaultConfig);
-    this.stepExecutor = new BrowserStepExecutor({ config: options.defaultConfig });
   }
 
   start(): void {
@@ -234,7 +221,6 @@ export class BrowserMcpServer {
 
   async shutdown(exitCode?: number): Promise<void> {
     await this.sessions.closeAll();
-    await this.stepExecutor.closeAll();
     if (exitCode !== undefined) {
       process.exit(exitCode);
     }
@@ -284,9 +270,6 @@ export class BrowserMcpServer {
       case 'browser.actions.execute':
         return this.executeActions(params);
 
-      case 'browser.step.execute':
-        return this.executeStep(params);
-
       default:
         throw jsonRpcMethodNotFound(method);
     }
@@ -316,10 +299,6 @@ export class BrowserMcpServer {
         const result = await this.executeActions(args);
         return toMcpToolResult(result, hasActionErrors(result));
       }
-      case 'browser_step_execute': {
-        const result = await this.executeStep(args);
-        return toMcpToolResult(result, !(result as BrowserStepExecutionResult).success);
-      }
       default:
         throw new Error(`Unknown browser tool: ${name}`);
     }
@@ -375,14 +354,6 @@ export class BrowserMcpServer {
     return client.executeMany(record.actions as BrowserActionRequest[]);
   }
 
-  private async executeStep(params: unknown): Promise<BrowserStepExecutionResult> {
-    const record = requireRecord(params, 'browser.step.execute params');
-    const step = requireRecord(record.step, 'step') as unknown as BrowserStepConfig;
-    const workspaceId = typeof record.workspaceId === 'string' ? record.workspaceId : undefined;
-
-    return this.stepExecutor.execute(step, { workspaceId });
-  }
-
   private writeResponse(response: JsonRpcResponse): void {
     this.stdout.write(`${JSON.stringify(response)}\n`);
   }
@@ -472,18 +443,6 @@ export function getBrowserToolDefinitions(): Array<Record<string, unknown>> {
         required: ['actions'],
       },
     },
-    {
-      name: 'browser_step_execute',
-      description: 'Execute a BrowserStepConfig using the workflow step executor.',
-      inputSchema: {
-        type: 'object',
-        properties: {
-          workspaceId: { type: 'string' },
-          step: { type: 'object' },
-        },
-        required: ['step'],
-      },
-    },
   ];
 }
 
diff --git a/packages/browser-primitive/src/workflow-step.ts b/packages/browser-primitive/src/workflow-step.ts
deleted file mode 100644
index b4fcf1fd1..000000000
--- a/packages/browser-primitive/src/workflow-step.ts
+++ /dev/null
@@ -1,602 +0,0 @@
-import type { RunnerStepExecutor, WorkflowStep } from '@agent-relay/sdk/workflows';
-
-import { BrowserClient, type BrowserClientOptions } from './browser-client.js';
-import type {
-  ActionResult,
-  BrowserActionName,
-  BrowserActionParamsMap,
-  BrowserActionRequest,
-  BrowserConfig,
-  BrowserSession,
-} from './types.js';
-
-export type BrowserStepOutputMode = 'last' | 'all' | 'captures' | 'summary' | 'none';
-export type BrowserStepOutputFormat = 'json' | 'text';
-
-export type BrowserStepAction<TName extends BrowserActionName = BrowserActionName> = {
-  [Name in TName]: {
-    action: Name;
-    params: BrowserActionParamsMap[Name];
-    /** Stable key for captured output. Defaults to the zero-based action index. */
-    id?: string;
-    /** Include this action in output.mode = "captures". Defaults true for extraction actions. */
-    capture?: boolean;
-    /** Output object key when output.mode = "captures". Defaults to id or action_<index>. */
-    outputKey?: string;
-    /** Continue running later actions if this action fails. Defaults false. */
-    continueOnError?: boolean;
-  };
-}[TName];
-
-export interface BrowserStepOutputConfig {
-  /** Which action results become the workflow step output. Defaults to "last". */
-  mode?: BrowserStepOutputMode;
-  /** Emit JSON for structured chaining or text for simple downstream interpolation. Defaults to "json". */
-  format?: BrowserStepOutputFormat;
-  /** Include per-action metadata such as current URL and timing in JSON output. Defaults false. */
-  includeMetadata?: boolean;
-  /** Include final browser session state in JSON output. Defaults false. */
-  includeSession?: boolean;
-  /** Pretty-print JSON output. Defaults false. */
-  pretty?: boolean;
-}
-
-export interface BrowserStepConfig {
-  /** Unique step name within the workflow. */
-  name: string;
-  /** Dependencies in the Relay workflow DAG. */
-  dependsOn?: string[];
-  /** Browser settings for this step/session. */
-  config?: BrowserConfig;
-  /** Ordered browser actions to execute in one browser session. */
-  actions: BrowserStepAction[];
-  /** Controls the string captured as {{steps.<name>.output}}. */
-  output?: BrowserStepOutputConfig;
-  /** Reuse a named browser session across browser steps. Defaults to the workspace/config session. */
-  sessionId?: string;
-  /** Close the session after this step, even when persistSession is true. */
-  closeSession?: boolean;
-  /** Workflow step timeout in milliseconds. */
-  timeoutMs?: number;
-  /** Number of retry attempts when the workflow runner retries this integration step. */
-  retries?: number;
-}
-
-export interface BrowserStepExecutionContext {
-  workspaceId?: string;
-  sessionId?: string;
-  client?: BrowserClient;
-}
-
-export interface BrowserStepActionRecord<TOutput = unknown> {
-  index: number;
-  id?: string;
-  action: BrowserActionName;
-  success: boolean;
-  output?: TOutput;
-  error?: string;
-  metadata?: ActionResult['metadata'];
-}
-
-export interface BrowserStepExecutionResult {
-  success: boolean;
-  output: string;
-  results: BrowserStepActionRecord[];
-  session: BrowserSession;
-  error?: string;
-}
-
-export interface BrowserIntegrationStepResult {
-  output: string;
-  success: boolean;
-}
-
-type ResolvedParams = Record<string, unknown>;
-
-const BROWSER_INTEGRATION = 'browser';
-const BROWSER_RUN_ACTION = 'run';
-const EXTRACTION_ACTIONS = new Set<BrowserActionName>([
-  'text',
-  'getText',
-  'html',
-  'getHTML',
-  'attribute',
-  'getAttribute',
-  'screenshot',
-  'elementScreenshot',
-  'evaluate',
-]);
-
-/**
- * Create a Relay integration step that can be used in relay.yaml or passed to
- * WorkflowRunner directly. Complex action/config objects are serialized into
- * params so the existing workflow template resolver can interpolate them.
- */
-export function createBrowserStep(config: BrowserStepConfig): WorkflowStep {
-  validateBrowserStepConfig(config);
-
-  const params: Record<string, string> = {
-    actions: JSON.stringify(config.actions),
-  };
-
-  if (config.config !== undefined) {
-    params.config = JSON.stringify(config.config);
-  }
-  if (config.output !== undefined) {
-    params.output = JSON.stringify(config.output);
-  }
-  if (config.sessionId !== undefined) {
-    params.sessionId = config.sessionId;
-  }
-  if (config.closeSession !== undefined) {
-    params.closeSession = String(config.closeSession);
-  }
-
-  const step: WorkflowStep = {
-    name: config.name,
-    type: 'integration',
-    integration: BROWSER_INTEGRATION,
-    action: BROWSER_RUN_ACTION,
-    params,
-  };
-
-  if (config.dependsOn !== undefined) step.dependsOn = config.dependsOn;
-  if (config.timeoutMs !== undefined) step.timeoutMs = config.timeoutMs;
-  if (config.retries !== undefined) step.retries = config.retries;
-
-  return step;
-}
-
-export class BrowserStepExecutor implements RunnerStepExecutor {
-  private readonly sessions = new Map<string, BrowserClient>();
-
-  constructor(private readonly options: BrowserClientOptions = {}) {}
-
-  async executeAgentStep(): Promise<string> {
-    throw new Error('BrowserStepExecutor only executes browser integration steps.');
-  }
-
-  async execute(
-    config: BrowserStepConfig,
-    context: BrowserStepExecutionContext = {}
-  ): Promise<BrowserStepExecutionResult> {
-    validateBrowserStepConfig(config);
-
-    const client = context.client ?? this.getOrCreateClient(config, context);
-    const records: BrowserStepActionRecord[] = [];
-    let hardFailure: BrowserStepActionRecord | undefined;
-
-    for (let index = 0; index < config.actions.length; index += 1) {
-      const action = config.actions[index];
-      const started = Date.now();
-      const result = await client.executeWorkflowAction(action as BrowserActionRequest);
-
-      const record: BrowserStepActionRecord = {
-        index,
-        id: action.id,
-        action: action.action,
-        success: result.success,
-        output: result.output,
-        error: result.error,
-        metadata: result.metadata,
-      };
-      records.push(record);
-
-      if (!result.success && !action.continueOnError) {
-        hardFailure = record;
-        break;
-      }
-
-      if (!record.metadata) {
-        record.metadata = {
-          action: action.action,
-          sessionId: client.getSession().id,
-          currentUrl: client.getCurrentUrl(),
-          executionTime: Date.now() - started,
-        };
-      }
-    }
-
-    const session = client.getSession();
-    const output = formatStepOutput(config, records, session);
-    const success = hardFailure === undefined;
-
-    if (config.closeSession || config.config?.persistSession === false) {
-      if (context.client) {
-        await context.client.close();
-      } else {
-        await this.closeSession(this.resolveSessionKey(config, context));
-      }
-    }
-
-    return {
-      success,
-      output,
-      results: records,
-      session,
-      error: hardFailure?.error,
-    };
-  }
-
-  async executeIntegrationStep(
-    step: WorkflowStep,
-    resolvedParams: Record<string, string>,
-    context: { workspaceId?: string } = {}
-  ): Promise<BrowserIntegrationStepResult> {
-    if (step.integration !== BROWSER_INTEGRATION) {
-      return {
-        success: false,
-        output: `BrowserStepExecutor only handles "${BROWSER_INTEGRATION}" integration steps`,
-      };
-    }
-
-    try {
-      const config = browserStepConfigFromWorkflowStep(step, resolvedParams);
-      const result = await this.execute(config, context);
-
-      return {
-        success: result.success,
-        output: result.success ? result.output : result.output || result.error || 'Browser step failed',
-      };
-    } catch (error) {
-      return {
-        success: false,
-        output: error instanceof Error ? error.message : String(error),
-      };
-    }
-  }
-
-  async closeSession(sessionId: string): Promise<boolean> {
-    const client = this.sessions.get(sessionId);
-    if (!client) {
-      return false;
-    }
-
-    await client.close();
-    this.sessions.delete(sessionId);
-    return true;
-  }
-
-  async closeAll(): Promise<void> {
-    await Promise.all([...this.sessions.values()].map((client) => client.close()));
-    this.sessions.clear();
-  }
-
-  listSessions(): BrowserSession[] {
-    return [...this.sessions.values()].map((client) => client.getSession());
-  }
-
-  private getOrCreateClient(config: BrowserStepConfig, context: BrowserStepExecutionContext): BrowserClient {
-    const key = this.resolveSessionKey(config, context);
-    const existing = this.sessions.get(key);
-
-    if (existing) {
-      return existing;
-    }
-
-    const client = new BrowserClient({
-      ...this.options,
-      config: {
-        ...this.options.config,
-        ...config.config,
-      },
-    });
-    this.sessions.set(key, client);
-    return client;
-  }
-
-  private resolveSessionKey(config: BrowserStepConfig, context: BrowserStepExecutionContext): string {
-    if (context.sessionId) return context.sessionId;
-    if (config.sessionId) return config.sessionId;
-
-    const workspace = context.workspaceId ?? 'default';
-    return `${workspace}:${stableStringify(config.config ?? {})}`;
-  }
-}
-
-export function browserStepConfigFromWorkflowStep(
-  step: WorkflowStep,
-  resolvedParams: Record<string, string>
-): BrowserStepConfig {
-  const params = normalizeResolvedParams(resolvedParams);
-  const config = readJsonParam<BrowserConfig>(params.config ?? params.browserConfig, 'config') ?? undefined;
-  const output = readJsonParam<BrowserStepOutputConfig>(params.output, 'output') ?? undefined;
-  const closeSession =
-    params.closeSession === undefined ? undefined : Boolean(coerceScalar(params.closeSession));
-  const sessionId = params.sessionId === undefined ? undefined : String(params.sessionId);
-
-  const actions = readActions(step, params);
-
-  return {
-    name: step.name,
-    dependsOn: step.dependsOn,
-    config,
-    actions,
-    output,
-    sessionId,
-    closeSession,
-    timeoutMs: step.timeoutMs,
-    retries: step.retries,
-  };
-}
-
-function validateBrowserStepConfig(config: BrowserStepConfig): void {
-  if (!config.name) {
-    throw new Error('Browser step requires a non-empty name');
-  }
-  if (!Array.isArray(config.actions) || config.actions.length === 0) {
-    throw new Error(`Browser step "${config.name}" requires at least one action`);
-  }
-
-  for (const [index, action] of config.actions.entries()) {
-    if (!action || typeof action !== 'object') {
-      throw new Error(`Browser step "${config.name}" action ${index} must be an object`);
-    }
-    if (!action.action || typeof action.action !== 'string') {
-      throw new Error(`Browser step "${config.name}" action ${index} requires an action name`);
-    }
-    if (action.params === undefined || typeof action.params !== 'object' || action.params === null) {
-      throw new Error(`Browser step "${config.name}" action ${index} requires params`);
-    }
-  }
-}
-
-function readActions(step: WorkflowStep, params: ResolvedParams): BrowserStepAction[] {
-  const serializedActions = params.actions;
-  if (serializedActions !== undefined) {
-    const parsed = readJsonParam<BrowserStepAction[]>(serializedActions, 'actions');
-    if (!Array.isArray(parsed)) {
-      throw new Error('Browser step params.actions must be a JSON array');
-    }
-    return parsed;
-  }
-
-  if (!step.action || step.action === BROWSER_RUN_ACTION) {
-    throw new Error(`Browser step "${step.name}" requires params.actions or a browser action`);
-  }
-
-  const actionParams: Record<string, unknown> = {};
-  for (const [key, value] of Object.entries(params)) {
-    if (
-      key === 'config' ||
-      key === 'browserConfig' ||
-      key === 'output' ||
-      key === 'sessionId' ||
-      key === 'closeSession'
-    ) {
-      continue;
-    }
-    actionParams[key] = value;
-  }
-
-  return [
-    {
-      action: step.action as BrowserActionName,
-      params: actionParams as BrowserActionParamsMap[BrowserActionName],
-    } as BrowserStepAction,
-  ];
-}
-
-function formatStepOutput(
-  config: BrowserStepConfig,
-  records: BrowserStepActionRecord[],
-  session: BrowserSession
-): string {
-  const outputConfig = config.output ?? {};
-  const mode = outputConfig.mode ?? 'last';
-  const format = outputConfig.format ?? 'json';
-
-  if (mode === 'none') {
-    return '';
-  }
-
-  const projection = buildOutputProjection(mode, config.actions, records, session, outputConfig);
-
-  if (format === 'text') {
-    return projectionToText(projection);
-  }
-
-  return JSON.stringify(projection, undefined, outputConfig.pretty ? 2 : undefined);
-}
-
-function buildOutputProjection(
-  mode: BrowserStepOutputMode,
-  actions: BrowserStepAction[],
-  records: BrowserStepActionRecord[],
-  session: BrowserSession,
-  outputConfig: BrowserStepOutputConfig
-): unknown {
-  if (mode === 'summary') {
-    const failed = records.find((record) => !record.success);
-    return withOptionalSession(
-      {
-        success: failed === undefined,
-        actionCount: records.length,
-        currentUrl: session.currentUrl,
-        failedAction: failed
-          ? {
-              index: failed.index,
-              id: failed.id,
-              action: failed.action,
-              error: failed.error,
-            }
-          : undefined,
-      },
-      session,
-      outputConfig
-    );
-  }
-
-  if (mode === 'all') {
-    return withOptionalSession(
-      {
-        results: records.map((record) => projectRecord(record, outputConfig.includeMetadata ?? false)),
-      },
-      session,
-      outputConfig
-    );
-  }
-
-  if (mode === 'captures') {
-    const captures: Record<string, unknown> = {};
-
-    for (const record of records) {
-      const action = record.action;
-      const actionConfig = actions[record.index];
-      const capture = actionConfig?.capture ?? (EXTRACTION_ACTIONS.has(action) && record.success);
-      if (!capture) continue;
-
-      const key = actionConfig?.outputKey ?? actionConfig?.id ?? record.id ?? `action_${record.index}`;
-      captures[key] = projectRecord(record, outputConfig.includeMetadata ?? false);
-    }
-
-    return withOptionalSession({ captures }, session, outputConfig);
-  }
-
-  const last = records.at(-1);
-  return withOptionalSession(
-    last ? projectRecord(last, outputConfig.includeMetadata ?? false) : null,
-    session,
-    outputConfig
-  );
-}
-
-function projectRecord(record: BrowserStepActionRecord, includeMetadata: boolean): unknown {
-  const projected: BrowserStepActionRecord = {
-    index: record.index,
-    action: record.action,
-    success: record.success,
-  };
-
-  if (record.id !== undefined) projected.id = record.id;
-  if (record.output !== undefined) projected.output = record.output;
-  if (record.error !== undefined) projected.error = record.error;
-  if (includeMetadata && record.metadata !== undefined) projected.metadata = record.metadata;
-
-  return projected;
-}
-
-function withOptionalSession(
-  value: unknown,
-  session: BrowserSession,
-  outputConfig: BrowserStepOutputConfig
-): unknown {
-  if (!outputConfig.includeSession) {
-    return value;
-  }
-
-  return {
-    value,
-    session: {
-      id: session.id,
-      active: session.active,
-      currentUrl: session.currentUrl,
-      startTime: session.startTime,
-      config: session.config,
-    },
-  };
-}
-
-function projectionToText(value: unknown): string {
-  if (typeof value === 'string') return value;
-  if (value === null || value === undefined) return '';
-
-  if (isRecord(value)) {
-    if ('output' in value) {
-      return projectionToText(value.output);
-    }
-    if ('value' in value) {
-      return projectionToText(value.value);
-    }
-    if ('text' in value) {
-      return projectionToText(value.text);
-    }
-    if ('html' in value) {
-      return projectionToText(value.html);
-    }
-    if ('captures' in value) {
-      return JSON.stringify(value.captures);
-    }
-  }
-
-  if (Array.isArray(value)) {
-    return value.map((entry) => projectionToText(entry)).join('\n');
-  }
-
-  return JSON.stringify(value);
-}
-
-function normalizeResolvedParams(params: Record<string, string>): ResolvedParams {
-  const normalized: ResolvedParams = {};
-  for (const [key, value] of Object.entries(params)) {
-    normalized[key] = coerceScalar(value);
-  }
-  return normalized;
-}
-
-function coerceScalar(value: unknown): unknown {
-  if (typeof value !== 'string') {
-    return value;
-  }
-
-  const trimmed = value.trim();
-  if (trimmed === 'true') return true;
-  if (trimmed === 'false') return false;
-  if (trimmed === 'null') return null;
-  if (/^-?(?:0|[1-9]\d*)(?:\.\d+)?$/.test(trimmed)) return Number(trimmed);
-  if (
-    (trimmed.startsWith('{') && trimmed.endsWith('}')) ||
-    (trimmed.startsWith('[') && trimmed.endsWith(']')) ||
-    (trimmed.startsWith('"') && trimmed.endsWith('"'))
-  ) {
-    try {
-      return JSON.parse(trimmed);
-    } catch {
-      return value;
-    }
-  }
-
-  return value;
-}
-
-function readJsonParam<T>(value: unknown, name: string): T | undefined {
-  if (value === undefined) return undefined;
-  if (typeof value !== 'string') return value as T;
-
-  try {
-    return JSON.parse(value) as T;
-  } catch (error) {
-    throw new Error(
-      `Browser step params.${name} must be valid JSON: ${error instanceof Error ? error.message : String(error)}`
-    );
-  }
-}
-
-function stableStringify(value: unknown): string {
-  if (!isRecord(value) && !Array.isArray(value)) {
-    return JSON.stringify(value);
-  }
-
-  return JSON.stringify(sortJson(value));
-}
-
-function sortJson(value: unknown): unknown {
-  if (Array.isArray(value)) {
-    return value.map(sortJson);
-  }
-
-  if (!isRecord(value)) {
-    return value;
-  }
-
-  return Object.keys(value)
-    .sort()
-    .reduce<Record<string, unknown>>((acc, key) => {
-      acc[key] = sortJson(value[key]);
-      return acc;
-    }, {});
-}
-
-function isRecord(value: unknown): value is Record<string, unknown> {
-  return typeof value === 'object' && value !== null && !Array.isArray(value);
-}
diff --git a/packages/cli/src/cli/bootstrap.test.ts b/packages/cli/src/cli/bootstrap.test.ts
index 2e5cfeed0..39bbc2098 100644
--- a/packages/cli/src/cli/bootstrap.test.ts
+++ b/packages/cli/src/cli/bootstrap.test.ts
@@ -39,7 +39,6 @@ const expectedLeafCommands = [
   'telemetry',
   'on',
   'off',
-  'run',
   'connect',
   'view',
   'drive',
@@ -50,7 +49,6 @@ const expectedLeafCommands = [
   'dlq inspect',
   'dlq replay',
   'dlq purge',
-  'workflows list',
   'workspaces create',
   'tokens issue',
   'cloud login',
@@ -136,10 +134,8 @@ describe('bootstrap CLI', () => {
         'telemetry',
         'on',
         'off',
-        'run',
         'dlq',
         'workspaces',
-        'workflows',
         'tokens',
       ])
     );
diff --git a/packages/cli/src/cli/commands/core.ts b/packages/cli/src/cli/commands/core.ts
index 64ea6e58e..414ad6aa1 100644
--- a/packages/cli/src/cli/commands/core.ts
+++ b/packages/cli/src/cli/commands/core.ts
@@ -123,7 +123,6 @@ export interface CoreDependencies {
   sleep: (ms: number) => Promise<void>;
   onSignal: (signal: NodeJS.Signals, handler: () => void | Promise<void>) => void;
   holdOpen: () => Promise<void>;
-  resolveTemplatesDir: () => string;
   isPortInUse: (port: number) => Promise<boolean>;
   findBrokerApiPort: () => Promise<number>;
   log: (...args: unknown[]) => void;
@@ -354,19 +353,6 @@ function withDefaults(overrides: Partial<CoreDependencies> = {}): CoreDependenci
       process.on(signal, () => runSignalHandler(handler));
     },
     holdOpen: () => new Promise(() => undefined),
-    resolveTemplatesDir: () => {
-      // Walk up from __dirname to find the sdk package's builtin-templates dir
-      const dirname = path.dirname(fileURLToPath(import.meta.url));
-      let dir = dirname;
-      for (let i = 0; i < 8; i++) {
-        const candidate = path.join(dir, 'packages', 'sdk', 'src', 'workflows', 'builtin-templates');
-        if (fs.existsSync(candidate)) return candidate;
-        const distCandidate = path.join(dir, 'packages', 'sdk', 'dist', 'workflows', 'builtin-templates');
-        if (fs.existsSync(distCandidate)) return distCandidate;
-        dir = path.dirname(dir);
-      }
-      return path.join(dirname, 'builtin-templates');
-    },
     log: (...args: unknown[]) => console.log(...args),
     error: (...args: unknown[]) => console.error(...args),
     warn: (...args: unknown[]) => console.warn(...args),
@@ -532,26 +518,4 @@ export function registerCoreCommands(program: Command, overrides: Partial<CoreDe
       });
       await runBridgeCommand(projectPaths, options, deps);
     });
-
-  const workflowsCmd = program.command('workflows').description('Manage relay.yaml workflow templates');
-
-  workflowsCmd
-    .command('list')
-    .description('List available built-in workflow templates')
-    .action(() => {
-      const templatesDir = deps.resolveTemplatesDir();
-      if (!deps.fs.existsSync(templatesDir)) {
-        deps.log('No built-in templates found.');
-        return;
-      }
-      const files = deps.fs.readdirSync(templatesDir).filter((f) => f.endsWith('.yaml'));
-      if (files.length === 0) {
-        deps.log('No built-in templates found.');
-        return;
-      }
-      deps.log('Built-in workflow templates:');
-      for (const file of files) {
-        deps.log(`  ${file.replace(/\.yaml$/, '')}`);
-      }
-    });
 }
diff --git a/packages/cli/src/cli/commands/on/provision.ts b/packages/cli/src/cli/commands/on/provision.ts
index 322826950..7017888b9 100644
--- a/packages/cli/src/cli/commands/on/provision.ts
+++ b/packages/cli/src/cli/commands/on/provision.ts
@@ -7,8 +7,8 @@ import {
   discoverAgents as discoverAgentsFromCore,
   hasDotfiles as hasDotfilesFromCore,
 } from './dotfiles.js';
-import { mintAgentToken as mintToken } from '@agent-relay/sdk/provisioner/token';
-import type { LocalJwksSigningKey } from '@agent-relay/sdk/provisioner/local-jwks';
+import { mintAgentToken as mintToken } from '@agent-relay/cloud';
+import type { LocalJwksSigningKey } from '@agent-relay/cloud';
 
 interface ProvisionConfig {
   relayauthRoot: string;
diff --git a/packages/cli/src/cli/commands/on/start.test.ts b/packages/cli/src/cli/commands/on/start.test.ts
index dbf74388e..534864d1c 100644
--- a/packages/cli/src/cli/commands/on/start.test.ts
+++ b/packages/cli/src/cli/commands/on/start.test.ts
@@ -3,10 +3,14 @@ import { tmpdir } from 'node:os';
 import path from 'node:path';
 import { describe, expect, it, vi } from 'vitest';
 
-vi.mock('@agent-relay/cloud', () => ({
-  readStoredAuth: vi.fn().mockResolvedValue(null),
-  ensureAuthenticated: vi.fn().mockResolvedValue({ accessToken: 'test-token' }),
-}));
+vi.mock('@agent-relay/cloud', async (importOriginal) => {
+  const actual = await importOriginal<typeof import('@agent-relay/cloud')>();
+  return {
+    ...actual,
+    readStoredAuth: vi.fn().mockResolvedValue(null),
+    ensureAuthenticated: vi.fn().mockResolvedValue({ accessToken: 'test-token' }),
+  };
+});
 
 vi.mock('./dotfiles.js', () => ({
   hasDotfiles: () => false,
@@ -14,7 +18,7 @@ vi.mock('./dotfiles.js', () => ({
 }));
 
 import { requestWorkspaceSession } from './start.js';
-import { createLocalJwksKeyPair } from '../../../../../sdk/src/provisioner/local-jwks.js';
+import { createLocalJwksKeyPair } from '@agent-relay/cloud';
 
 function jsonResponse(payload: unknown, status = 200): Response {
   return new Response(JSON.stringify(payload), {
diff --git a/packages/cli/src/cli/commands/on/start.ts b/packages/cli/src/cli/commands/on/start.ts
index a942fde22..bea20c035 100644
--- a/packages/cli/src/cli/commands/on/start.ts
+++ b/packages/cli/src/cli/commands/on/start.ts
@@ -20,8 +20,7 @@ import { compileDotfiles, hasDotfiles } from './dotfiles.js';
 import { ensureRelayfileMountBinary } from './relayfile-binary.js';
 import { launchOnMount } from '@relayfile/local-mount';
 import { mintToken } from './token.js';
-import { seedAclRules } from './workspace.js';
-import { seedWorkspace } from '@agent-relay/sdk/provisioner/seeder';
+import { seedAclRules, seedWorkspace } from './workspace.js';
 import {
   createLocalJwks,
   exportPrivateKeyPem,
@@ -29,7 +28,7 @@ import {
   RELAYAUTH_JWT_KID_ENV,
   RELAYAUTH_JWT_PRIVATE_KEY_PEM_ENV,
   type LocalJwksSigningKey,
-} from '@agent-relay/sdk/provisioner/local-jwks';
+} from '@agent-relay/cloud';
 import { ensureAuthenticated, readStoredAuth } from '@agent-relay/cloud';
 
 interface OnOptions {
diff --git a/packages/cli/src/cli/commands/setup.test.ts b/packages/cli/src/cli/commands/setup.test.ts
deleted file mode 100644
index ef27e63d0..000000000
--- a/packages/cli/src/cli/commands/setup.test.ts
+++ /dev/null
@@ -1,359 +0,0 @@
-import { Command } from 'commander';
-import { describe, expect, it, vi } from 'vitest';
-
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import {
-  ensureLocalSdkWorkflowRuntime,
-  findLocalSdkWorkspace,
-  formatWorkflowParseError,
-  parseTsxStderr,
-  registerSetupCommands,
-  type SetupDependencies,
-} from './setup.js';
-
-class ExitSignal extends Error {
-  constructor(public readonly code: number) {
-    super(`exit:${code}`);
-  }
-}
-
-function createHarness(overrides: Partial<SetupDependencies> = {}) {
-  const exit = vi.fn((code: number) => {
-    throw new ExitSignal(code);
-  }) as unknown as SetupDependencies['exit'];
-
-  const deps: SetupDependencies = {
-    runInit: vi.fn(async () => undefined),
-    runTelemetry: vi.fn(async () => undefined),
-    runYamlWorkflow: vi.fn(async () => ({ status: 'completed' })),
-    runScriptWorkflow: vi.fn(() => undefined),
-    log: vi.fn(() => undefined),
-    error: vi.fn(() => undefined),
-    exit,
-    ...overrides,
-  };
-
-  const program = new Command();
-  registerSetupCommands(program, deps);
-
-  return { program, deps };
-}
-
-async function runCommand(program: Command, args: string[]): Promise<number | undefined> {
-  try {
-    await program.parseAsync(args, { from: 'user' });
-    return undefined;
-  } catch (err) {
-    if (err instanceof ExitSignal) {
-      return err.code;
-    }
-    throw err;
-  }
-}
-
-describe('local SDK workflow runtime bootstrapping', () => {
-  it('finds the agent-relay workspace root from a nested directory', () => {
-    const tempRoot = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-workspace-'));
-    const nestedDir = path.join(tempRoot, 'workflows', 'nested');
-    const sdkDir = path.join(tempRoot, 'packages', 'sdk');
-    fs.mkdirSync(nestedDir, { recursive: true });
-    fs.mkdirSync(sdkDir, { recursive: true });
-    fs.writeFileSync(path.join(tempRoot, 'package.json'), JSON.stringify({ name: 'agent-relay' }));
-    fs.writeFileSync(path.join(sdkDir, 'package.json'), JSON.stringify({ name: '@agent-relay/sdk' }));
-
-    expect(findLocalSdkWorkspace(nestedDir)).toEqual({ rootDir: tempRoot, sdkDir });
-
-    fs.rmSync(tempRoot, { recursive: true, force: true });
-  });
-
-  it('builds the local sdk when the workflows dist entry is missing', () => {
-    const tempRoot = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-build-'));
-    const nestedDir = path.join(tempRoot, 'workflows');
-    const sdkDir = path.join(tempRoot, 'packages', 'sdk');
-    const workflowsDistDir = path.join(sdkDir, 'dist', 'workflows');
-    fs.mkdirSync(nestedDir, { recursive: true });
-    fs.mkdirSync(sdkDir, { recursive: true });
-    fs.writeFileSync(path.join(tempRoot, 'package.json'), JSON.stringify({ name: 'agent-relay' }));
-    fs.writeFileSync(path.join(sdkDir, 'package.json'), JSON.stringify({ name: '@agent-relay/sdk' }));
-
-    const execRunner = vi.fn(() => {
-      fs.mkdirSync(workflowsDistDir, { recursive: true });
-      fs.writeFileSync(path.join(workflowsDistDir, 'index.js'), 'export {}\n');
-      return Buffer.from('');
-    });
-
-    ensureLocalSdkWorkflowRuntime(nestedDir, execRunner as never);
-
-    expect(execRunner).toHaveBeenCalledTimes(6);
-    expect(execRunner.mock.calls.map((call) => call[1])).toEqual([
-      ['run', 'build:config'],
-      ['--prefix', 'packages/workflow-types', 'run', 'build'],
-      ['--prefix', 'packages/github-primitive', 'run', 'build'],
-      ['--prefix', 'packages/slack-primitive', 'run', 'build'],
-      ['--prefix', 'packages/cloud', 'run', 'build'],
-      ['run', 'build:sdk'],
-    ]);
-    expect(execRunner).toHaveBeenNthCalledWith(
-      1,
-      'npm',
-      ['run', 'build:config'],
-      expect.objectContaining({ cwd: tempRoot, stdio: 'inherit' })
-    );
-    expect(execRunner).toHaveBeenNthCalledWith(
-      6,
-      'npm',
-      ['run', 'build:sdk'],
-      expect.objectContaining({ cwd: tempRoot, stdio: 'inherit' })
-    );
-    fs.rmSync(tempRoot, { recursive: true, force: true });
-  });
-});
-
-describe('registerSetupCommands', () => {
-  it('registers setup commands on the program', () => {
-    const { program } = createHarness();
-    const commandNames = program.commands.map((cmd) => cmd.name());
-
-    expect(commandNames).toEqual(expect.arrayContaining(['init', 'setup', 'telemetry', 'run']));
-  });
-
-  it('routes both init and setup alias to runInit', async () => {
-    const { program, deps } = createHarness();
-
-    await runCommand(program, ['init', '--yes', '--skip-broker']);
-    await runCommand(program, ['setup', '--yes']);
-
-    expect((deps.runInit as unknown as { mock: { calls: unknown[][] } }).mock.calls[0][0]).toMatchObject({
-      yes: true,
-      skipBroker: true,
-    });
-    expect((deps.runInit as unknown as { mock: { calls: unknown[][] } }).mock.calls[1][0]).toMatchObject({
-      yes: true,
-    });
-  });
-
-  it('routes telemetry action', async () => {
-    const { program, deps } = createHarness();
-
-    const exitCode = await runCommand(program, ['telemetry', 'enable']);
-
-    expect(exitCode).toBeUndefined();
-    expect(deps.runTelemetry).toHaveBeenCalledWith('enable');
-  });
-
-  it('routes run command based on file extension', async () => {
-    const { program, deps } = createHarness();
-
-    await runCommand(program, ['run', 'workflow.yaml', '--workflow', 'main']);
-    await runCommand(program, [
-      'run',
-      'workflow.py',
-      '--resume',
-      'run-123',
-      '--start-from',
-      'step-a',
-      '--previous-run-id',
-      'run-122',
-    ]);
-
-    expect(deps.runYamlWorkflow).toHaveBeenCalledWith('workflow.yaml', {
-      workflow: 'main',
-      onEvent: expect.any(Function),
-    });
-    expect(deps.runScriptWorkflow).toHaveBeenCalledWith('workflow.py', {
-      dryRun: undefined,
-      resume: 'run-123',
-      startFrom: 'step-a',
-      previousRunId: 'run-122',
-    });
-  });
-
-  it('prints resume hints when a script workflow fails', async () => {
-    const { program, deps } = createHarness({
-      runScriptWorkflow: vi.fn(() => {
-        throw new Error('script failed');
-      }),
-    });
-
-    const exitCode = await runCommand(program, ['run', 'workflow.ts']);
-
-    expect(exitCode).toBe(1);
-    expect(deps.error).toHaveBeenCalledWith('Error: script failed');
-    expect(deps.error).toHaveBeenCalledWith(
-      expect.stringContaining('agent-relay run workflow.ts --resume <run-id>')
-    );
-  });
-
-  it('prints a copy-pasteable resume command when the script error includes a run id', async () => {
-    const { program, deps } = createHarness({
-      runScriptWorkflow: vi.fn(() => {
-        throw new Error('script failed\nRun ID: run-456');
-      }),
-    });
-
-    const exitCode = await runCommand(program, ['run', 'workflow.ts']);
-
-    expect(exitCode).toBe(1);
-    expect(deps.error).toHaveBeenCalledWith(
-      'Run ID: run-456 — resume with: agent-relay run workflow.ts --resume run-456'
-    );
-  });
-
-  it('exits with code 1 for unsupported run file extension', async () => {
-    const { program } = createHarness();
-
-    const exitCode = await runCommand(program, ['run', 'workflow.txt']);
-
-    expect(exitCode).toBe(1);
-  });
-});
-
-describe('parseTsxStderr', () => {
-  it('returns null for empty stderr', () => {
-    expect(parseTsxStderr('')).toBeNull();
-  });
-
-  it('returns null for runtime errors with no parse signature', () => {
-    const stderr = [
-      'node:internal/modules/run_main:123',
-      '    triggerUncaughtException(',
-      '    ^',
-      'Error: something blew up at runtime',
-      '    at Object.<anonymous> (/path/to/workflow.ts:5:10)',
-    ].join('\n');
-    expect(parseTsxStderr(stderr)).toBeNull();
-  });
-
-  it('parses the inline "file:line:col: ERROR: message" format', () => {
-    const stderr = [
-      'node:internal/modules/run_main:123',
-      '    triggerUncaughtException(',
-      '    ^',
-      'Error [TransformError]: Transform failed with 1 error:',
-      '/path/to/workflow.ts:1073:4: ERROR: Expected "}" but found "npm"',
-      '    at failureErrorWithLog (... lib/main.js:1748:15)',
-    ].join('\n');
-
-    expect(parseTsxStderr(stderr)).toEqual({
-      file: '/path/to/workflow.ts',
-      line: 1073,
-      column: 4,
-      message: 'Expected "}" but found "npm"',
-    });
-  });
-
-  it('parses the pretty-printed ✘ [ERROR] multi-line format', () => {
-    const stderr = [
-      '✘ [ERROR] Unterminated template literal',
-      '',
-      '    /path/to/workflow.ts:42:10:',
-      '      42 │   command: `echo hello',
-      '         ╵           ^',
-    ].join('\n');
-
-    expect(parseTsxStderr(stderr)).toEqual({
-      file: '/path/to/workflow.ts',
-      line: 42,
-      column: 10,
-      message: 'Unterminated template literal',
-    });
-  });
-
-  it('strips ANSI color codes before matching', () => {
-    const stderr = [
-      '\x1b[31mError [TransformError]: Transform failed with 1 error:\x1b[0m',
-      '\x1b[1m/path/to/workflow.ts:10:5:\x1b[0m \x1b[31mERROR:\x1b[0m Expected "}" but found "foo"',
-    ].join('\n');
-
-    const parsed = parseTsxStderr(stderr);
-    expect(parsed).not.toBeNull();
-    expect(parsed?.line).toBe(10);
-    expect(parsed?.column).toBe(5);
-    expect(parsed?.message).toBe('Expected "}" but found "foo"');
-  });
-
-  it('falls back to a loose match on "Transform failed" without inline ERROR:', () => {
-    const stderr = [
-      'Error [TransformError]: Transform failed with 1 error:',
-      '    /path/to/workflow.ts:99:7',
-      '    at failureErrorWithLog',
-    ].join('\n');
-
-    const parsed = parseTsxStderr(stderr);
-    expect(parsed).not.toBeNull();
-    expect(parsed?.file).toBe('/path/to/workflow.ts');
-    expect(parsed?.line).toBe(99);
-    expect(parsed?.column).toBe(7);
-  });
-});
-
-describe('formatWorkflowParseError', () => {
-  it('formats a basic parse error without hints when the message is generic', () => {
-    const err = formatWorkflowParseError({
-      file: '/tmp/wf.ts',
-      line: 10,
-      column: 5,
-      message: 'Some unrelated TypeScript error',
-    });
-
-    expect(err.message).toContain('Workflow file failed to parse: /tmp/wf.ts:10:5');
-    expect(err.message).toContain('Some unrelated TypeScript error');
-    expect(err.message).not.toContain('Hint:');
-    expect((err as Error & { code?: string }).code).toBe('WORKFLOW_PARSE_ERROR');
-  });
-
-  it('adds a template-literal hint for Expected "}" but found errors', () => {
-    const err = formatWorkflowParseError({
-      file: '/tmp/wf.ts',
-      line: 1073,
-      column: 4,
-      message: 'Expected "}" but found "npm"',
-    });
-
-    expect(err.message).toMatch(/Hint:/);
-    expect(err.message).toMatch(/template literal/i);
-    expect(err.message).toMatch(/single quotes/);
-  });
-
-  it('adds a template-literal hint for Unterminated template literal errors', () => {
-    const err = formatWorkflowParseError({
-      file: '/tmp/wf.ts',
-      line: 42,
-      column: 10,
-      message: 'Unterminated template literal',
-    });
-
-    expect(err.message).toMatch(/Hint:/);
-    expect(err.message).toMatch(/backticks/i);
-  });
-
-  it('adds a dollar-sign hint for Unexpected "$" errors', () => {
-    const err = formatWorkflowParseError({
-      file: '/tmp/wf.ts',
-      line: 1,
-      column: 0,
-      message: 'Unexpected "$"',
-    });
-
-    expect(err.message).toMatch(/Hint:/);
-    expect(err.message).toMatch(/interpolation/);
-  });
-
-  it('includes a line-text pointer when lineText is provided', () => {
-    const err = formatWorkflowParseError({
-      file: '/tmp/wf.ts',
-      line: 10,
-      column: 12,
-      message: 'Expected "}" but found "x"',
-      lineText: '  command: `echo foo`',
-    });
-
-    expect(err.message).toContain('| ');
-    expect(err.message).toContain('echo foo');
-    // The ^ pointer should be 12 spaces offset into the indented line
-    expect(err.message).toMatch(/\|\s+\^/);
-  });
-});
diff --git a/packages/cli/src/cli/commands/setup.ts b/packages/cli/src/cli/commands/setup.ts
index 825e2fd9d..425c6a238 100644
--- a/packages/cli/src/cli/commands/setup.ts
+++ b/packages/cli/src/cli/commands/setup.ts
@@ -1,74 +1,20 @@
-import path from 'node:path';
 import readline from 'node:readline';
 import { spawn as spawnProcess } from 'node:child_process';
 import { Command } from 'commander';
 import { getProjectPaths } from '@agent-relay/config';
 import { readBrokerConnection } from '../lib/broker-lifecycle.js';
-import {
-  enableTelemetry,
-  disableTelemetry,
-  getStatus,
-  isDisabledByEnv,
-  track,
-  type WorkflowFileType as TelemetryWorkflowFileType,
-} from '@agent-relay/telemetry';
-import {
-  runWorkflow,
-  runScriptWorkflow,
-  ensureLocalSdkWorkflowRuntime,
-  findLocalSdkWorkspace,
-  parseTsxStderr,
-  formatWorkflowParseError,
-  type ParsedWorkflowError,
-} from '@agent-relay/sdk/workflows';
-import type { WorkflowEvent } from '@agent-relay/sdk/workflows';
-import { CliExit, defaultExit } from '../lib/exit.js';
-import { errorClassName } from '../lib/telemetry-helpers.js';
-
-export {
-  ensureLocalSdkWorkflowRuntime,
-  findLocalSdkWorkspace,
-  parseTsxStderr,
-  formatWorkflowParseError,
-  type ParsedWorkflowError,
-};
+import { enableTelemetry, disableTelemetry, getStatus, isDisabledByEnv, track } from '@agent-relay/telemetry';
+import { defaultExit } from '../lib/exit.js';
 
 type ExitFn = (code: number) => never;
 type RunInitOptions = {
   yes?: boolean;
   skipBroker?: boolean;
 };
-type RunWorkflowOptions = {
-  workflow?: string;
-  dryRun?: boolean;
-  resume?: string;
-  startFrom?: string;
-  previousRunId?: string;
-};
-type WorkflowRunResult = {
-  id?: string;
-  status: string;
-  error?: string;
-};
 
 export interface SetupDependencies {
   runInit: (options: RunInitOptions) => Promise<void>;
   runTelemetry: (action?: string) => Promise<void> | void;
-  runYamlWorkflow: (
-    filePath: string,
-    options: {
-      workflow?: string;
-      dryRun?: boolean;
-      resume?: string;
-      startFrom?: string;
-      previousRunId?: string;
-      onEvent: (event: WorkflowEvent) => void;
-    }
-  ) => Promise<WorkflowRunResult>;
-  runScriptWorkflow: (
-    filePath: string,
-    options?: { dryRun?: boolean; resume?: string; startFrom?: string; previousRunId?: string }
-  ) => void | Promise<void>;
   log: (...args: unknown[]) => void;
   error: (...args: unknown[]) => void;
   exit: ExitFn;
@@ -86,41 +32,12 @@ function withDefaults(overrides: Partial<SetupDependencies> = {}): SetupDependen
   return {
     runInit: overrides.runInit ?? ((options: RunInitOptions) => runInitDefault(options, io)),
     runTelemetry: overrides.runTelemetry ?? ((action?: string) => runTelemetryDefault(action, io)),
-    runYamlWorkflow: runYamlWorkflowDefault,
-    runScriptWorkflow,
     log,
     error,
     exit,
     ...overrides,
   };
 }
-function logWorkflowEvent(event: WorkflowEvent, log: (...args: unknown[]) => void): void {
-  if (event.type === 'broker:event') return;
-  const prefix = event.type.startsWith('run:') ? '[run]' : '[step]';
-  const name = 'stepName' in event ? `${event.stepName} ` : '';
-  const status = event.type.split(':')[1];
-  const detail = 'error' in event ? `: ${event.error}` : '';
-  log(`${prefix} ${name}${status}${detail}`);
-}
-async function runYamlWorkflowDefault(
-  filePath: string,
-  options: {
-    workflow?: string;
-    dryRun?: boolean;
-    resume?: string;
-    startFrom?: string;
-    previousRunId?: string;
-    onEvent: (event: WorkflowEvent) => void;
-  }
-): Promise<WorkflowRunResult> {
-  const result = await runWorkflow(filePath, options);
-  // DryRunReport has 'valid' instead of 'status'
-  if ('valid' in result) {
-    const report = result as unknown as { valid: boolean; errors: string[] };
-    return { status: report.valid ? 'dry-run' : 'failed', error: report.errors.join('; ') || undefined };
-  }
-  return result;
-}
 async function runInitDefault(options: RunInitOptions, io: SetupIo): Promise<void> {
   const prompt = async (question: string, defaultYes = true): Promise<boolean> => {
     if (options.yes) return true;
@@ -304,136 +221,4 @@ export function registerSetupCommands(program: Command, overrides: Partial<Setup
     .action(async (action?: string) => {
       await deps.runTelemetry(action);
     });
-  program
-    .command('run')
-    .description('Run a workflow file (YAML, TypeScript, or Python)')
-    .argument('<file>', 'Path to workflow file (.yaml, .yml, .ts, or .py)')
-    .option('-w, --workflow <name>', 'Run a specific workflow by name (default: first, YAML only)')
-    .option('--dry-run', 'Validate workflow and show execution plan without running')
-    .option('--resume <runId>', 'Resume a previously failed workflow run from where it left off')
-    .option('--start-from <step>', 'Start from a specific step and skip predecessor steps')
-    .option('--previous-run-id <runId>', 'Use cached outputs from a previous run when starting from a step')
-    .action(async (filePath: string, options: RunWorkflowOptions) => {
-      const ext = path.extname(filePath).toLowerCase();
-      const isScriptWorkflow = ext === '.ts' || ext === '.tsx' || ext === '.py';
-      const fileType: TelemetryWorkflowFileType =
-        ext === '.yaml' || ext === '.yml'
-          ? 'yaml'
-          : ext === '.ts' || ext === '.tsx'
-            ? 'ts'
-            : ext === '.py'
-              ? 'py'
-              : 'unknown';
-      const started = Date.now();
-      let tracked = false;
-      const emit = (result: { success: boolean; errorClass?: string }): void => {
-        if (tracked) return;
-        tracked = true;
-        track('workflow_run', {
-          file_type: fileType,
-          is_dry_run: Boolean(options.dryRun),
-          is_resume: Boolean(options.resume),
-          is_start_from: Boolean(options.startFrom),
-          is_script: isScriptWorkflow,
-          success: result.success,
-          duration_ms: Date.now() - started,
-          ...(result.errorClass ? { error_class: result.errorClass } : {}),
-        });
-      };
-
-      try {
-        if (ext === '.yaml' || ext === '.yml') {
-          if (options.resume) {
-            deps.log(`Resuming workflow run ${options.resume} from ${filePath}...`);
-            const result = await deps.runYamlWorkflow(filePath, {
-              workflow: options.workflow,
-              resume: options.resume,
-              onEvent: (event: WorkflowEvent) => logWorkflowEvent(event, deps.log),
-            });
-            if (result.status === 'completed') {
-              deps.log('\nWorkflow resumed and completed successfully.');
-              emit({ success: true });
-            } else {
-              deps.error(`\nWorkflow ${result.status}${result.error ? `: ${result.error}` : ''}`);
-              deps.error(
-                `Run ID: ${result.id} — resume with: agent-relay run ${filePath} --resume ${result.id}`
-              );
-              emit({ success: false, errorClass: 'WorkflowNotCompleted' });
-              deps.exit(1);
-            }
-            return;
-          }
-          if (options.dryRun) {
-            deps.log(`Dry run: validating workflow from ${filePath}...`);
-          } else {
-            deps.log(`Running workflow from ${filePath}...`);
-          }
-          const result = await deps.runYamlWorkflow(filePath, {
-            workflow: options.workflow,
-            dryRun: options.dryRun,
-            resume: options.resume,
-            startFrom: options.startFrom,
-            previousRunId: options.previousRunId,
-            onEvent: (event: WorkflowEvent) => logWorkflowEvent(event, deps.log),
-          });
-          if (options.dryRun) {
-            // Report was already printed by runWorkflow
-            emit({ success: true });
-            return;
-          }
-          if (result.status === 'completed') {
-            deps.log('\nWorkflow completed successfully.');
-            emit({ success: true });
-          } else {
-            deps.error(`\nWorkflow ${result.status}${result.error ? `: ${result.error}` : ''}`);
-            deps.error(
-              `Run ID: ${result.id} — resume with: agent-relay run ${filePath} --resume ${result.id}`
-            );
-            emit({ success: false, errorClass: 'WorkflowNotCompleted' });
-            deps.exit(1);
-          }
-          return;
-        }
-        if (ext === '.ts' || ext === '.tsx' || ext === '.py') {
-          deps.log(`Running workflow script ${filePath}...`);
-          await deps.runScriptWorkflow(filePath, {
-            dryRun: options.dryRun,
-            resume: options.resume,
-            startFrom: options.startFrom,
-            previousRunId: options.previousRunId,
-          });
-          emit({ success: true });
-          return;
-        }
-        deps.error(`Unsupported file type: ${ext}. Use .yaml, .yml, .ts, or .py`);
-        emit({ success: false, errorClass: 'UnsupportedFileType' });
-        deps.exit(1);
-      } catch (err: any) {
-        // `deps.exit(1)` above throws `CliExit` in production so runCli can
-        // flush telemetry — let that bubble straight through instead of
-        // treating it as an unexpected error (which would print the internal
-        // "cli-exit:1" message and clobber `error_class` with 'CliExit').
-        if (err instanceof CliExit) throw err;
-        emit({ success: false, errorClass: errorClassName(err) });
-        deps.error(`Error: ${err.message}`);
-        if (isScriptWorkflow) {
-          const runIdMatch = typeof err?.message === 'string' ? err.message.match(/Run ID:\s*(\S+)/) : null;
-          if (runIdMatch?.[1]) {
-            deps.error(
-              `Run ID: ${runIdMatch[1]} — resume with: agent-relay run ${filePath} --resume ${runIdMatch[1]}`
-            );
-          }
-          deps.error(
-            `Script workflows can be retried with:
-` +
-              `  agent-relay run ${filePath} --resume <run-id>
-` +
-              `or start from a specific step with:
-` +
-              `  agent-relay run ${filePath} --start-from <step> [--previous-run-id <run-id>]`
-          );
-        }
-        deps.exit(1);
-      }
-    });
 }
diff --git a/packages/cloud/package.json b/packages/cloud/package.json
index 60fb8a130..41adc986c 100644
--- a/packages/cloud/package.json
+++ b/packages/cloud/package.json
@@ -10,6 +10,26 @@
       "types": "./dist/index.d.ts",
       "import": "./dist/index.js"
     },
+    "./permissions": {
+      "types": "./dist/permissions.d.ts",
+      "import": "./dist/permissions.js"
+    },
+    "./token": {
+      "types": "./dist/token.d.ts",
+      "import": "./dist/token.js"
+    },
+    "./local-jwks": {
+      "types": "./dist/local-jwks.d.ts",
+      "import": "./dist/local-jwks.js"
+    },
+    "./compiler": {
+      "types": "./dist/compiler.d.ts",
+      "import": "./dist/compiler.js"
+    },
+    "./audit": {
+      "types": "./dist/audit.d.ts",
+      "import": "./dist/audit.js"
+    },
     "./package.json": "./package.json"
   },
   "files": [
diff --git a/packages/sdk/src/provisioner/__tests__/compiler.test.ts b/packages/cloud/src/__tests__/compiler.test.ts
similarity index 99%
rename from packages/sdk/src/provisioner/__tests__/compiler.test.ts
rename to packages/cloud/src/__tests__/compiler.test.ts
index fadac2628..b2a2ca8a7 100644
--- a/packages/sdk/src/provisioner/__tests__/compiler.test.ts
+++ b/packages/cloud/src/__tests__/compiler.test.ts
@@ -2,7 +2,7 @@ import assert from 'node:assert/strict';
 import { mkdtemp, mkdir, rm, writeFile } from 'node:fs/promises';
 import { tmpdir } from 'node:os';
 import path from 'node:path';
-import test from 'node:test';
+import { test } from 'vitest';
 
 import { compileAgentScopes, globToScopes } from '../compiler.js';
 
diff --git a/packages/sdk/src/provisioner/__tests__/presets.test.ts b/packages/cloud/src/__tests__/presets.test.ts
similarity index 100%
rename from packages/sdk/src/provisioner/__tests__/presets.test.ts
rename to packages/cloud/src/__tests__/presets.test.ts
diff --git a/packages/sdk/src/provisioner/__tests__/token-factory.test.ts b/packages/cloud/src/__tests__/token-factory.test.ts
similarity index 99%
rename from packages/sdk/src/provisioner/__tests__/token-factory.test.ts
rename to packages/cloud/src/__tests__/token-factory.test.ts
index 082f9d47c..62a7fac91 100644
--- a/packages/sdk/src/provisioner/__tests__/token-factory.test.ts
+++ b/packages/cloud/src/__tests__/token-factory.test.ts
@@ -1,6 +1,6 @@
 import assert from 'node:assert/strict';
 import { createPublicKey, createVerify } from 'node:crypto';
-import test from 'node:test';
+import { test } from 'vitest';
 
 import { createLocalJwksKeyPair } from '../local-jwks.js';
 import {
diff --git a/packages/sdk/src/provisioner/__tests__/token.test.ts b/packages/cloud/src/__tests__/token.test.ts
similarity index 98%
rename from packages/sdk/src/provisioner/__tests__/token.test.ts
rename to packages/cloud/src/__tests__/token.test.ts
index f79028303..141134846 100644
--- a/packages/sdk/src/provisioner/__tests__/token.test.ts
+++ b/packages/cloud/src/__tests__/token.test.ts
@@ -1,5 +1,5 @@
 import assert from 'node:assert/strict';
-import test from 'node:test';
+import { test } from 'vitest';
 
 import { createLocalJwksKeyPair } from '../local-jwks.js';
 import { DEFAULT_WORKFLOW_TOKEN_TTL_SECONDS, mintAgentToken, type TokenClaims } from '../token.js';
diff --git a/packages/sdk/src/provisioner/audit.ts b/packages/cloud/src/audit.ts
similarity index 100%
rename from packages/sdk/src/provisioner/audit.ts
rename to packages/cloud/src/audit.ts
diff --git a/packages/sdk/src/provisioner/compiler.ts b/packages/cloud/src/compiler.ts
similarity index 98%
rename from packages/sdk/src/provisioner/compiler.ts
rename to packages/cloud/src/compiler.ts
index 33e7d613f..7411d242f 100644
--- a/packages/sdk/src/provisioner/compiler.ts
+++ b/packages/cloud/src/compiler.ts
@@ -1,9 +1,14 @@
 import ignore, { type Ignore } from 'ignore';
 import { existsSync, readdirSync, readFileSync } from 'node:fs';
 import path from 'node:path';
-import type { AgentPreset } from '../workflows/types.js';
-
-import type { AgentPermissions, CompiledAgentPermissions, CompileInput, PermissionSource } from './types.js';
+import type { AgentPreset } from './permissions.js';
+
+import type {
+  AgentPermissions,
+  CompiledAgentPermissions,
+  CompileInput,
+  PermissionSource,
+} from './provisioning-types.js';
 
 type FileAction = 'read' | 'write';
 
diff --git a/packages/cloud/src/index.ts b/packages/cloud/src/index.ts
index 3a6da0b6d..ed125b9b9 100644
--- a/packages/cloud/src/index.ts
+++ b/packages/cloud/src/index.ts
@@ -65,6 +65,42 @@ export {
   type AuthSshRuntime,
 } from './lib/ssh-runtime.js';
 
+// Cross-product identity, permissions, tokens, and audit primitives.
+export * from './permissions.js';
+export * from './provisioning-types.js';
+export {
+  defaultPermissionsForPreset,
+  expandPreset,
+  globsToScopes,
+  compileAgentPermissions,
+  mergeAcl,
+  resolveAgentPermissions,
+  compileAgentScopes,
+  mergePermissionSources,
+  expandAccessPreset,
+  globToScopes,
+} from './compiler.js';
+export {
+  DEFAULT_WORKFLOW_TOKEN_TTL_SECONDS,
+  DEFAULT_ADMIN_AGENT_NAME,
+  DEFAULT_ADMIN_SCOPES,
+  mintAgentToken,
+  type TokenClaims,
+} from './token.js';
+export {
+  createLocalJwks,
+  createLocalJwksKeyPair,
+  exportPrivateKeyPem,
+  importPrivateKeyPem,
+  RELAYAUTH_JWKS_URL_ENV,
+  RELAYAUTH_JWT_KID_ENV,
+  RELAYAUTH_JWT_PRIVATE_KEY_PEM_ENV,
+  type LocalJwks,
+  type LocalJwksKeyPair,
+  type LocalJwksSigningKey,
+} from './local-jwks.js';
+export { PermissionAuditLog, getDefaultPermissionAuditPath } from './audit.js';
+
 export {
   type StoredAuth,
   type WhoAmIResponse,
diff --git a/packages/sdk/src/provisioner/local-jwks.ts b/packages/cloud/src/local-jwks.ts
similarity index 100%
rename from packages/sdk/src/provisioner/local-jwks.ts
rename to packages/cloud/src/local-jwks.ts
diff --git a/packages/cloud/src/permissions.ts b/packages/cloud/src/permissions.ts
new file mode 100644
index 000000000..dd412bbd6
--- /dev/null
+++ b/packages/cloud/src/permissions.ts
@@ -0,0 +1,154 @@
+/**
+ * General agent identity, CLI, and permission types.
+ *
+ * These are cross-product primitives — the CLI registry, provisioner, and any
+ * other broker-adjacent code consume them directly. Workflow-shaped types
+ * (RelayYamlConfig, WorkflowStep, SwarmPattern, etc.) live in @relayflows/core.
+ */
+
+// ── CLI identity ────────────────────────────────────────────────────────────
+
+export type AgentCli =
+  | 'claude'
+  | 'codex'
+  | 'gemini'
+  | 'aider'
+  | 'goose'
+  | 'opencode'
+  | 'droid'
+  | 'cursor'
+  | 'cursor-agent'
+  | 'agent'
+  | 'api';
+
+// ── Agent shape primitives ──────────────────────────────────────────────────
+
+export type AgentPreset = 'lead' | 'worker' | 'reviewer' | 'analyst';
+
+/** Resource and behavioral constraints for an agent. */
+export interface AgentConstraints {
+  maxTokens?: number;
+  timeoutMs?: number;
+  retries?: number;
+  model?: string;
+  /** Silence duration in seconds before the agent is considered idle (0 = disabled, default: 30). */
+  idleThresholdSecs?: number;
+}
+
+/** Optional credential settings for an agent. */
+export interface AgentCredentialConfig {
+  /** Opt the agent into credential proxy mode. */
+  proxy?: boolean;
+  /** Override the provider used for proxy credential resolution. */
+  provider?: string;
+}
+
+// ── Permission types ────────────────────────────────────────────────────────
+
+/**
+ * Access preset for role-based permission shortcuts.
+ *
+ *   readonly    → read all non-ignored files, write nothing
+ *   readwrite   → read and write all non-ignored files (default behavior)
+ *   restricted  → read/write only explicitly listed paths
+ *   full        → read and write everything, including normally-ignored files
+ */
+export type AccessPreset = 'readonly' | 'readwrite' | 'restricted' | 'full';
+
+/** Fine-grained network permission with allowlist/denylist. */
+export interface NetworkPermissions {
+  /** Host:port pairs the agent may connect to (e.g. ['registry.npmjs.org:443']). */
+  allow?: string[];
+  /** Host:port patterns to block (e.g. ['*'] to deny all except allowed). */
+  deny?: string[];
+}
+
+/** Network permission: boolean to allow/deny all, or object for fine-grained control. */
+export type NetworkPermission = boolean | NetworkPermissions;
+
+/** Glob-based file permission scopes for an agent. */
+export interface FilePermissions {
+  /** Glob patterns the agent may read (e.g. ['src/**', 'docs/**']). */
+  read?: string[];
+  /** Glob patterns the agent may write (e.g. ['src/tests/**']). */
+  write?: string[];
+  /** Glob patterns the agent must never access (e.g. ['.env', 'secrets/**']).
+   *  Deny rules take precedence over read/write grants. */
+  deny?: string[];
+}
+
+/** Reusable named permission profile shared by one or more agents. */
+export interface PermissionProfileDefinition {
+  description?: string;
+  why?: string;
+  access?: AccessPreset;
+  inherit?: boolean;
+  files?: FilePermissions;
+  scopes?: string[];
+  network?: NetworkPermission;
+  exec?: string[];
+}
+
+/**
+ * Permission configuration for an agent.
+ *
+ * All fields are optional — omitting `permissions` entirely preserves the
+ * default behavior (inherit dotfiles, readwrite access).
+ *
+ * Resolution order (later overrides earlier):
+ *   1. Dotfile patterns (.agentignore / .agentreadonly) when `inherit` is true
+ *   2. `access` preset expands into base file rules
+ *   3. Explicit `files` globs merge on top
+ *   4. `deny` patterns always win (applied last)
+ *   5. `scopes` are appended verbatim to the token
+ */
+export interface AgentPermissions {
+  description?: string;
+  profile?: string;
+  why?: string;
+  access?: AccessPreset;
+  inherit?: boolean;
+  files?: FilePermissions;
+  scopes?: string[];
+  network?: NetworkPermission;
+  exec?: string[];
+}
+
+// ── Compiled permission output ──────────────────────────────────────────────
+
+/** Identifies where a permission rule originated. */
+export interface PermissionSource {
+  type: 'dotfile' | 'preset' | 'yaml' | 'scope';
+  label: string;
+  ruleCount: number;
+}
+
+/**
+ * The result of compiling an agent's permissions. Used to:
+ *   1. Mint the agent's relayauth token (scopes)
+ *   2. Configure the relayfile mount (readonlyPaths, readwritePaths, deniedPaths)
+ *   3. Enforce runtime restrictions (network, exec allowlist)
+ */
+export interface CompiledAgentPermissions {
+  agentName: string;
+  workspace: string;
+  effectiveAccess: AccessPreset;
+  inherited: boolean;
+  sources: PermissionSource[];
+  readonlyPatterns: string[];
+  readwritePatterns: string[];
+  deniedPatterns: string[];
+  readonlyPaths: string[];
+  readwritePaths: string[];
+  deniedPaths: string[];
+  scopes: string[];
+  network?: NetworkPermission;
+  exec?: string[];
+  acl: Record<string, string[]>;
+  summary: {
+    readonly: number;
+    readwrite: number;
+    denied: number;
+    customScopes: number;
+  };
+}
diff --git a/packages/cloud/src/provisioning-types.ts b/packages/cloud/src/provisioning-types.ts
new file mode 100644
index 000000000..03f221de3
--- /dev/null
+++ b/packages/cloud/src/provisioning-types.ts
@@ -0,0 +1,39 @@
+import type {
+  AccessPreset,
+  AgentPermissions,
+  CompiledAgentPermissions,
+  FilePermissions,
+  PermissionSource,
+} from './permissions.js';
+
+// ── Shared helper types ─────────────────────────────────────────────────────
+
+/** Aggregate counts for compiled permissions across provisioned agents. */
+export interface ProvisionSummary {
+  readonly: number;
+  readwrite: number;
+  denied: number;
+  customScopes: number;
+}
+
+/** Convenience shape for a single agent's compiled scopes. */
+export interface CompiledAgentScopes {
+  agentName: string;
+  workspace: string;
+  scopes: string[];
+  acl: Record<string, string[]>;
+  summary: ProvisionSummary;
+}
+
+// ── Compiler ────────────────────────────────────────────────────────────────
+
+/** Input to the permission compiler for a single agent. */
+export interface CompileInput {
+  agentName: string;
+  workspace: string;
+  projectDir: string;
+  permissions: AgentPermissions;
+}
+
+// Re-export the permission types from ./permissions.js for convenience.
+export type { AccessPreset, AgentPermissions, CompiledAgentPermissions, FilePermissions, PermissionSource };
diff --git a/packages/sdk/src/provisioner/token.ts b/packages/cloud/src/token.ts
similarity index 100%
rename from packages/sdk/src/provisioner/token.ts
rename to packages/cloud/src/token.ts
diff --git a/packages/credential-proxy/README.md b/packages/credential-proxy/README.md
index f54596e7f..18a90bb67 100644
--- a/packages/credential-proxy/README.md
+++ b/packages/credential-proxy/README.md
@@ -58,7 +58,7 @@ serve({ fetch: app.fetch, port: Number(process.env.PORT ?? 3001) });
 ```
 
 For the SDK-side wiring that lets workflow agents use the proxy transparently,
-see [`@agent-relay/sdk/workflows`'s proxy-env
+see [`@relayflows/core`'s proxy-env
 module](../sdk/src/workflows/proxy-env.ts) and the `credentialProxy` field on
 `SwarmConfig`.
 
diff --git a/packages/github-primitive/DESIGN.md b/packages/github-primitive/DESIGN.md
index 80fb4a7f5..16eadd775 100644
--- a/packages/github-primitive/DESIGN.md
+++ b/packages/github-primitive/DESIGN.md
@@ -18,7 +18,6 @@ packages/github-primitive/
 │   ├── adapter.ts          # Runtime detection, factory, base adapter
 │   ├── local-runtime.ts    # Local gh CLI implementation
 │   ├── cloud-runtime.ts    # Cloud Nango and relay-cloud implementation
-│   ├── workflow-step.ts    # Workflow step executor
 │   ├── actions/            # GitHub action implementations
 │   │   ├── branches.ts     # listBranches, createBranch operations
 │   │   ├── commits.ts      # listCommits, createCommit operations
diff --git a/packages/github-primitive/README.md b/packages/github-primitive/README.md
index 383a0fcba..0efc7a9ce 100644
--- a/packages/github-primitive/README.md
+++ b/packages/github-primitive/README.md
@@ -35,28 +35,6 @@ The client and workflow step support:
 - Branches and commits: `listBranches`, `createBranch`, `listCommits`, `createCommit`
 - Identity: `getUser`, `listOrganizations`
 
-## Workflow Step
-
-```ts
-import { createGitHubStep } from '@agent-relay/github-primitive/workflow-step';
-
-createGitHubStep({
-  name: 'read-readme',
-  action: 'readFile',
-  repo: 'AgentWorkforce/relay',
-  params: {
-    path: 'README.md',
-  },
-  output: {
-    mode: 'data',
-    format: 'text',
-  },
-});
-```
-
-See `examples/github-step.ts` for a workflow runner example and
-`examples/github-client.ts` for a standalone client example.
-
 ## End-to-end PR workflow
 
 `examples/end-to-end-pr-workflow.ts` walks the full PR lifecycle against
diff --git a/packages/github-primitive/examples/end-to-end-pr-workflow.ts b/packages/github-primitive/examples/end-to-end-pr-workflow.ts
deleted file mode 100644
index 59b998c3d..000000000
--- a/packages/github-primitive/examples/end-to-end-pr-workflow.ts
+++ /dev/null
@@ -1,286 +0,0 @@
-/**
- * End-to-end pull-request workflow using the GitHub primitive.
- *
- * Demonstrates the full PR lifecycle from a single workflow definition:
- *   1. Detect + log which runtime will be used (local gh vs Nango vs
- *      relay-cloud proxy).
- *   2. createBranch — branch off the default branch for the change.
- *   3. createFile — write a timestamped marker file on the new branch.
- *   4. createPR — open the pull request. This is the core interface the
- *      cloud workflows need to swap to.
- *   5. getPR — round-trip verify.
- *   6. updatePR — add a description edit (shows mutation).
- *   7. listPRs — confirm it appears in the default filter.
- *   8. (commented out) mergePR — the last mile. Left off by default so
- *      running this example does NOT merge anything against real repos.
- *
- * The same file runs identically in three environments because the
- * primitive's runtime selection handles the transport:
- *
- *   - LOCAL              gh CLI (needs `gh auth status` to succeed)
- *   - CLOUD (tenant)     Nango — NANGO_GITHUB_CONNECTION_ID +
- *                        NANGO_GITHUB_PROVIDER_CONFIG_KEY +
- *                        NANGO_SECRET_KEY
- *   - CLOUD (fallback)   relay-cloud proxy — RELAY_CLOUD_API_URL +
- *                        RELAY_CLOUD_API_TOKEN + WORKSPACE_ID
- *
- * Run:
- *   GITHUB_REPO=AgentWorkforce/scratch npx tsx examples/end-to-end-pr-workflow.ts
- *
- * Defaults to AgentWorkforce/scratch (a sandbox repo) so no one
- * accidentally opens a PR against a real repo. Override via env vars.
- */
-
-import { WorkflowRunner, type RelayYamlConfig } from '@agent-relay/sdk/workflows';
-
-import { GitHubClient } from '../src/client.js';
-import { GitHubStepExecutor, createGitHubStep } from '../src/workflow-step.js';
-import type { GitHubRuntimeConfig } from '../src/types.js';
-
-const repo = process.env.GITHUB_REPO ?? 'AgentWorkforce/scratch';
-const baseBranch = process.env.GITHUB_BASE_BRANCH ?? 'main';
-const branchName = process.env.GITHUB_BRANCH_OVERRIDE ?? `examples/github-primitive-${Date.now()}`;
-const markerPath = `examples/github-primitive-runs/${Date.now()}.md`;
-
-const githubConfig: GitHubRuntimeConfig = {
-  // `auto` prefers cloud credentials when present, otherwise falls back
-  // to the local `gh` CLI. Override with GITHUB_RUNTIME=local|cloud when
-  // you want to pin a specific path.
-  runtime: (process.env.GITHUB_RUNTIME as GitHubRuntimeConfig['runtime']) ?? 'auto',
-
-  // Cloud path A — Nango. Per-tenant GitHub App installation. Cloud
-  // callers typically resolve this via a connection-resolver helper
-  // that maps { workspaceId, repo } -> { connectionId, providerConfigKey }.
-  nango: {
-    connectionId: process.env.NANGO_GITHUB_CONNECTION_ID,
-    providerConfigKey: process.env.NANGO_GITHUB_PROVIDER_CONFIG_KEY,
-    secretKey: process.env.NANGO_SECRET_KEY,
-  },
-
-  // Cloud path B — relay-cloud GitHub proxy. Used when Nango isn't
-  // wired but a relay-cloud bearer token is available.
-  relayCloud: {
-    apiUrl: process.env.RELAY_CLOUD_API_URL,
-    accessToken: process.env.RELAY_CLOUD_API_TOKEN,
-    workspaceId: process.env.WORKSPACE_ID,
-  },
-};
-
-const githubExecutor = new GitHubStepExecutor(githubConfig);
-
-const config: RelayYamlConfig = {
-  version: '1.0',
-  name: 'end-to-end-pr-workflow',
-  description:
-    'Walk through the full PR lifecycle — branch, commit, open, update, list — using the GitHub primitive.',
-  swarm: { pattern: 'pipeline' },
-  agents: [],
-  workflows: [
-    {
-      name: 'end-to-end-pr-workflow',
-      steps: [
-        // 1. Resolve the default branch — sanity check the connection
-        //    works before we start making mutations.
-        createGitHubStep({
-          name: 'inspect-repo',
-          action: 'getRepo',
-          repo,
-          output: {
-            mode: 'summary',
-            includeRuntime: true,
-            pretty: true,
-          },
-        }),
-
-        // 2. Create the feature branch off the base branch's HEAD.
-        //    Chains {{steps.inspect-repo.output.data.defaultBranch}}
-        //    when no base override is provided — here we keep it
-        //    explicit for readability.
-        createGitHubStep({
-          name: 'create-branch',
-          dependsOn: ['inspect-repo'],
-          action: 'createBranch',
-          repo,
-          params: {
-            branch: branchName,
-            source: baseBranch,
-          },
-          output: { mode: 'data', format: 'json', path: 'ref' },
-        }),
-
-        // 3. Write a marker file on the new branch. createFile handles
-        //    the blob + tree + commit dance for you.
-        createGitHubStep({
-          name: 'write-marker-file',
-          dependsOn: ['create-branch'],
-          action: 'createFile',
-          repo,
-          params: {
-            path: markerPath,
-            branch: branchName,
-            content: [
-              '# GitHub primitive example run',
-              '',
-              `- Runtime chosen: see workflow log for inspect-repo detection`,
-              `- Generated: ${new Date().toISOString()}`,
-              '',
-              'This file is created by',
-              '`packages/github-primitive/examples/end-to-end-pr-workflow.ts`',
-              'to prove the full PR lifecycle works against the configured runtime.',
-            ].join('\n'),
-            message: `examples: github-primitive demo run ${new Date().toISOString()}`,
-          },
-          output: { mode: 'data', format: 'json', path: 'commit.sha' },
-        }),
-
-        // 4. Open the pull request. This is the core step cloud
-        //    workflows need. title/body/head/base mirror the REST API
-        //    shape — no translation work at the call site.
-        createGitHubStep({
-          name: 'open-pr',
-          dependsOn: ['write-marker-file'],
-          action: 'createPR',
-          repo,
-          params: {
-            title: `examples: github-primitive end-to-end demo (${branchName})`,
-            head: branchName,
-            base: baseBranch,
-            body: [
-              '## Summary',
-              '',
-              'Automated PR opened by',
-              '`packages/github-primitive/examples/end-to-end-pr-workflow.ts`',
-              'to exercise the GitHub primitive interface end-to-end.',
-              '',
-              '## Runtime selection',
-              '',
-              'See the workflow log for the `inspect-repo` step — it logs the',
-              'selected runtime (`local`, `nango`, or `relay-cloud`).',
-              '',
-              '## Safe to close',
-              '',
-              'This PR is a demonstration. No one should merge it — close it',
-              'once you have inspected the end-to-end round-trip.',
-            ].join('\n'),
-            draft: true,
-          },
-          output: {
-            mode: 'data',
-            format: 'json',
-            includeRuntime: true,
-            includeMetadata: true,
-            pretty: true,
-          },
-        }),
-
-        // 5. Read the PR back to prove the resolver + runtime actually
-        //    persisted the change, and to surface the PR number for
-        //    downstream steps.
-        createGitHubStep({
-          name: 'verify-pr',
-          dependsOn: ['open-pr'],
-          action: 'getPR',
-          repo,
-          params: {
-            // The output of `open-pr` is the Pulls REST response; we pull
-            // the number off it for subsequent mutation.
-            number: '{{steps.open-pr.output.data.number}}',
-          },
-          output: {
-            mode: 'summary',
-            includeRuntime: true,
-            pretty: true,
-          },
-        }),
-
-        // 6. Update the PR — shows how to use updatePR for edits that
-        //    don't need code changes (body, title, draft state, etc.).
-        createGitHubStep({
-          name: 'edit-pr-body',
-          dependsOn: ['verify-pr'],
-          action: 'updatePR',
-          repo,
-          params: {
-            number: '{{steps.open-pr.output.data.number}}',
-            body: [
-              '## Summary',
-              '',
-              'Automated PR opened by the GitHub primitive end-to-end',
-              'example. This body was updated by the `edit-pr-body` step',
-              'to demonstrate `updatePR` works through the same adapter.',
-              '',
-              '## Safe to close',
-              '',
-              'Demo — close, do not merge.',
-            ].join('\n'),
-          },
-          output: { mode: 'result', format: 'json' },
-        }),
-
-        // 7. List open PRs to prove the new one is indexable.
-        createGitHubStep({
-          name: 'list-open-prs',
-          dependsOn: ['edit-pr-body'],
-          action: 'listPRs',
-          repo,
-          params: {
-            state: 'open',
-            perPage: 10,
-          },
-          output: { mode: 'summary', pretty: true },
-        }),
-
-        // 8. (Commented) The last mile — merge. Intentionally left off:
-        //    running this example against a real repo should not merge
-        //    anything. Uncomment when exercising a disposable scratch
-        //    repo or CI harness.
-        //
-        // createGitHubStep({
-        //   name: 'merge-pr',
-        //   dependsOn: ['list-open-prs'],
-        //   action: 'mergePR',
-        //   repo,
-        //   params: {
-        //     number: '{{steps.open-pr.output.data.number}}',
-        //     mergeMethod: 'squash',
-        //     commitTitle: 'examples: github-primitive demo (squash)',
-        //   },
-        //   output: { mode: 'data', format: 'json' },
-        // }),
-      ],
-    },
-  ],
-  errorHandling: { strategy: 'fail-fast' },
-};
-
-async function main(): Promise<void> {
-  const detection = await GitHubClient.detect(githubConfig);
-
-  console.log('────────────────────────────────────────');
-  console.log(`repo:                 ${repo}`);
-  console.log(`base branch:          ${baseBranch}`);
-  console.log(`feature branch:       ${branchName}`);
-  console.log(`runtime selected:     ${detection.runtime}`);
-  console.log(`detection source:     ${detection.source}`);
-  console.log(`local gh available:   ${detection.local.available}`);
-  console.log(`cloud available:      ${detection.cloud.available}`);
-  if (detection.reason) {
-    console.log(`reason:               ${detection.reason}`);
-  }
-  console.log('────────────────────────────────────────');
-
-  const runner = new WorkflowRunner({
-    cwd: process.cwd(),
-    executor: githubExecutor,
-  });
-
-  const result = await runner.execute(config);
-  console.log(`\nWorkflow completed: ${result.status}`);
-}
-
-if (process.argv[1] === new URL(import.meta.url).pathname) {
-  main().catch((error) => {
-    console.error(error instanceof Error ? error.stack : error);
-    process.exitCode = 1;
-  });
-}
diff --git a/packages/github-primitive/examples/github-step.ts b/packages/github-primitive/examples/github-step.ts
deleted file mode 100644
index b060b7c32..000000000
--- a/packages/github-primitive/examples/github-step.ts
+++ /dev/null
@@ -1,105 +0,0 @@
-import { WorkflowRunner, type RelayYamlConfig } from '@agent-relay/sdk/workflows';
-
-import { GitHubClient } from '../src/client.js';
-import { GitHubStepExecutor, createGitHubStep } from '../src/workflow-step.js';
-import type { GitHubRuntimeConfig } from '../src/types.js';
-
-const repo = process.env.GITHUB_REPO ?? 'AgentWorkforce/relay';
-
-const githubConfig: GitHubRuntimeConfig = {
-  runtime: (process.env.GITHUB_RUNTIME as GitHubRuntimeConfig['runtime']) ?? 'auto',
-  nango: {
-    connectionId: process.env.NANGO_GITHUB_CONNECTION_ID,
-    providerConfigKey: process.env.NANGO_GITHUB_PROVIDER_CONFIG_KEY,
-  },
-  relayCloud: {
-    apiUrl: process.env.RELAY_CLOUD_API_URL,
-    accessToken: process.env.RELAY_CLOUD_API_TOKEN,
-    workspaceId: process.env.WORKSPACE_ID,
-  },
-};
-
-const githubExecutor = new GitHubStepExecutor(githubConfig);
-
-const config: RelayYamlConfig = {
-  version: '1.0',
-  name: 'github-primitive-workflow',
-  description: 'GitHub primitive workflow with runtime auto-detection and chained output.',
-  swarm: {
-    pattern: 'pipeline',
-  },
-  agents: [],
-  workflows: [
-    {
-      name: 'github-primitive-workflow',
-      steps: [
-        createGitHubStep({
-          name: 'inspect-repository',
-          action: 'getRepo',
-          repo,
-          output: {
-            mode: 'summary',
-            includeRuntime: true,
-            pretty: true,
-          },
-        }),
-        createGitHubStep({
-          name: 'list-open-issues',
-          dependsOn: ['inspect-repository'],
-          action: 'listIssues',
-          repo,
-          params: {
-            state: 'open',
-            perPage: 5,
-          },
-          output: {
-            mode: 'summary',
-            includeRuntime: true,
-            pretty: true,
-          },
-        }),
-        createGitHubStep({
-          name: 'read-readme',
-          dependsOn: ['list-open-issues'],
-          action: 'readFile',
-          repo,
-          params: {
-            path: 'README.md',
-          },
-          output: {
-            mode: 'data',
-            format: 'text',
-          },
-        }),
-      ],
-    },
-  ],
-  errorHandling: {
-    strategy: 'fail-fast',
-  },
-};
-
-async function main(): Promise<void> {
-  const detection = await GitHubClient.detect(githubConfig);
-
-  console.log(`GitHub runtime selected: ${detection.runtime}`);
-  console.log(`Detection source: ${detection.source}`);
-  console.log(`Local gh CLI: ${detection.local.available ? 'available' : 'unavailable'}`);
-  console.log(`Cloud GitHub: ${detection.cloud.available ? 'available' : 'unavailable'}`);
-  console.log(detection.reason);
-
-  const runner = new WorkflowRunner({
-    cwd: process.cwd(),
-    executor: githubExecutor,
-  });
-
-  const result = await runner.execute(config);
-  console.log(`GitHub workflow completed: ${result.status}`);
-}
-
-if (process.argv[1] === new URL(import.meta.url).pathname) {
-  main().catch((error) => {
-    console.error(error instanceof Error ? error.stack : error);
-    process.exitCode = 1;
-  });
-}
diff --git a/packages/github-primitive/examples/multi-tenant-pr-workflow.ts b/packages/github-primitive/examples/multi-tenant-pr-workflow.ts
deleted file mode 100644
index f06b5b91d..000000000
--- a/packages/github-primitive/examples/multi-tenant-pr-workflow.ts
+++ /dev/null
@@ -1,201 +0,0 @@
-/**
- * Multi-tenant pull-request workflow.
- *
- * Cloud's reality: every workspace (AgentWorkforce, MSD, NightCTO, ...)
- * has its own GitHub App installation. The primitive's per-step `config`
- * field lets one workflow route different actions through different
- * Nango connections — no need for one workflow per tenant.
- *
- * The usual cloud pattern:
- *
- *   1. A resolver helper — lives in cloud, NOT in this primitive — maps
- *      { workspaceId, repo } -> { connectionId, providerConfigKey }.
- *      Recommended signature:
- *
- *         githubConfigForRepo({ repo, workspaceId }): Promise<GitHubRuntimeConfig>
- *
- *      It reads the workspace_integrations table, picks the row whose
- *      provider matches the target repo's app, and returns a ready-to-
- *      use config object.
- *
- *   2. Workflow authors call that resolver at step-build time and pass
- *      the result as `config` to each `createGitHubStep` call.
- *
- * This example simulates the resolver with a static table so the
- * illustration is self-contained — in production, swap it for the DB
- * lookup.
- *
- * Run:
- *   NANGO_SECRET_KEY=... \
- *   AGENTWORKFORCE_CONNECTION_ID=... \
- *   MSD_CONNECTION_ID=... \
- *   npx tsx examples/multi-tenant-pr-workflow.ts
- */
-
-import { WorkflowRunner, type RelayYamlConfig } from '@agent-relay/sdk/workflows';
-
-import { GitHubStepExecutor, createGitHubStep } from '../src/workflow-step.js';
-import type { GitHubRuntimeConfig, RepositoryRef } from '../src/types.js';
-
-// ─── Resolver (stand-in for cloud's real implementation) ───────────────
-
-interface TenantConnection {
-  workspaceId: string;
-  providerConfigKey: string; // 'github-agentworkforce' | 'github-msd' | 'github-nightcto'
-  connectionIdEnvVar: string; // env var that carries the Nango connection id
-}
-
-// In cloud, this table is the workspace_integrations DB rows joined to
-// the Nango provider registry. Here we keep it inline for illustration.
-const TENANTS: Record<string, TenantConnection> = {
-  'AgentWorkforce/cloud': {
-    workspaceId: 'rw_agentworkforce',
-    providerConfigKey: 'github-agentworkforce',
-    connectionIdEnvVar: 'AGENTWORKFORCE_CONNECTION_ID',
-  },
-  'AgentWorkforce/sage': {
-    workspaceId: 'rw_agentworkforce',
-    providerConfigKey: 'github-agentworkforce',
-    connectionIdEnvVar: 'AGENTWORKFORCE_CONNECTION_ID',
-  },
-  'msd-ventures/platform': {
-    workspaceId: 'rw_msd',
-    providerConfigKey: 'github-msd',
-    connectionIdEnvVar: 'MSD_CONNECTION_ID',
-  },
-};
-
-function githubConfigForRepo(opts: {
-  repo: string | RepositoryRef;
-  /** Workspace scope. Optional — cloud-owned repos default to the shared app. */
-  workspaceId?: string;
-}): GitHubRuntimeConfig {
-  const repoKey = typeof opts.repo === 'string' ? opts.repo : `${opts.repo.owner}/${opts.repo.repo}`;
-  const tenant = TENANTS[repoKey];
-
-  if (!tenant) {
-    throw new Error(
-      `No GitHub connection mapped for ${repoKey} — register it in the tenants table or workspace_integrations.`
-    );
-  }
-
-  const connectionId = process.env[tenant.connectionIdEnvVar];
-  if (!connectionId) {
-    throw new Error(`Missing ${tenant.connectionIdEnvVar} — set the Nango connection id for ${repoKey}.`);
-  }
-
-  return {
-    runtime: 'auto',
-    nango: {
-      connectionId,
-      providerConfigKey: tenant.providerConfigKey,
-      secretKey: process.env.NANGO_SECRET_KEY,
-    },
-    relayCloud: {
-      apiUrl: process.env.RELAY_CLOUD_API_URL,
-      accessToken: process.env.RELAY_CLOUD_API_TOKEN,
-      workspaceId: opts.workspaceId ?? tenant.workspaceId,
-    },
-  };
-}
-
-// ─── Workflow ────────────────────────────────────────────────────────────
-
-const agentworkforceRepo = 'AgentWorkforce/cloud';
-const msdRepo = 'msd-ventures/platform';
-
-const executor = new GitHubStepExecutor({ runtime: 'auto' });
-
-const config: RelayYamlConfig = {
-  version: '1.0',
-  name: 'multi-tenant-pr-workflow',
-  description:
-    'Open PRs in two tenants — AgentWorkforce/cloud (shared app) and msd-ventures/platform (MSD app) — from one workflow by varying per-step config.',
-  swarm: { pattern: 'pipeline' },
-  agents: [],
-  workflows: [
-    {
-      name: 'multi-tenant-pr-workflow',
-      steps: [
-        // ─── Tenant A: AgentWorkforce ───────────────────────────────
-        createGitHubStep({
-          name: 'inspect-agentworkforce-cloud',
-          action: 'getRepo',
-          repo: agentworkforceRepo,
-          config: githubConfigForRepo({ repo: agentworkforceRepo }),
-          output: { mode: 'summary', includeRuntime: true, pretty: true },
-        }),
-
-        createGitHubStep({
-          name: 'open-pr-agentworkforce',
-          dependsOn: ['inspect-agentworkforce-cloud'],
-          action: 'createPR',
-          repo: agentworkforceRepo,
-          params: {
-            // Pretend we prepared this branch in an earlier workflow step
-            // (push-branch in the caller workflow).
-            head: 'feat/typed-webhook-consumers',
-            base: 'main',
-            title: 'feat(web): typed webhook-consumer config',
-            body: "Routes through AgentWorkforce's github-agentworkforce Nango connection.",
-            draft: true,
-          },
-          config: githubConfigForRepo({ repo: agentworkforceRepo }),
-          output: { mode: 'data', format: 'json', path: 'data.html_url' },
-        }),
-
-        // ─── Tenant B: MSD ──────────────────────────────────────────
-        // Same workflow, same action verbs, different connection
-        // resolved by the per-step `config` field. Runs sequentially
-        // here but could run in parallel — tenants are independent.
-        createGitHubStep({
-          name: 'inspect-msd-platform',
-          dependsOn: ['open-pr-agentworkforce'],
-          action: 'getRepo',
-          repo: msdRepo,
-          config: githubConfigForRepo({ repo: msdRepo }),
-          output: { mode: 'summary', includeRuntime: true, pretty: true },
-        }),
-
-        createGitHubStep({
-          name: 'open-pr-msd',
-          dependsOn: ['inspect-msd-platform'],
-          action: 'createPR',
-          repo: msdRepo,
-          params: {
-            head: 'integrations/agent-relay-webhook',
-            base: 'main',
-            title: 'feat: wire up Agent Relay webhook receiver',
-            body: "Routes through MSD's github-msd Nango connection — separate GitHub App install.",
-            draft: true,
-          },
-          config: githubConfigForRepo({ repo: msdRepo }),
-          output: { mode: 'data', format: 'json', path: 'data.html_url' },
-        }),
-      ],
-    },
-  ],
-  errorHandling: { strategy: 'fail-fast' },
-};
-
-async function main(): Promise<void> {
-  console.log('Opening PRs in two tenants via per-step GitHub config overrides:');
-  console.log(`  ${agentworkforceRepo}  → connection ${TENANTS[agentworkforceRepo].providerConfigKey}`);
-  console.log(`  ${msdRepo}             → connection ${TENANTS[msdRepo].providerConfigKey}`);
-  console.log();
-
-  const runner = new WorkflowRunner({
-    cwd: process.cwd(),
-    executor,
-  });
-
-  const result = await runner.execute(config);
-  console.log(`\nWorkflow completed: ${result.status}`);
-}
-
-if (process.argv[1] === new URL(import.meta.url).pathname) {
-  main().catch((error) => {
-    console.error(error instanceof Error ? error.stack : error);
-    process.exitCode = 1;
-  });
-}
diff --git a/packages/github-primitive/package.json b/packages/github-primitive/package.json
index 6a881e551..597bce925 100644
--- a/packages/github-primitive/package.json
+++ b/packages/github-primitive/package.json
@@ -10,11 +10,6 @@
       "types": "./dist/index.d.ts",
       "import": "./dist/index.js",
       "default": "./dist/index.js"
-    },
-    "./workflow-step": {
-      "types": "./dist/workflow-step.d.ts",
-      "import": "./dist/workflow-step.js",
-      "default": "./dist/workflow-step.js"
     }
   },
   "files": [
@@ -31,9 +26,7 @@
     "test": "vitest run",
     "test:watch": "vitest"
   },
-  "dependencies": {
-    "@agent-relay/workflow-types": "7.1.1"
-  },
+  "dependencies": {},
   "devDependencies": {
     "@types/node": "^22.19.3",
     "typescript": "^5.9.3",
diff --git a/packages/github-primitive/src/index.ts b/packages/github-primitive/src/index.ts
index 482276392..3fffc970c 100644
--- a/packages/github-primitive/src/index.ts
+++ b/packages/github-primitive/src/index.ts
@@ -4,7 +4,6 @@ export * from './adapter.js';
 export * from './local-runtime.js';
 export * from './cloud-runtime.js';
 export * from './client.js';
-export * from './workflow-step.js';
 export * from './actions/branches.js';
 export * from './actions/commits.js';
 export * from './actions/repos.js';
diff --git a/packages/github-primitive/src/workflow-step.ts b/packages/github-primitive/src/workflow-step.ts
deleted file mode 100644
index 11c2ca141..000000000
--- a/packages/github-primitive/src/workflow-step.ts
+++ /dev/null
@@ -1,615 +0,0 @@
-import type { RunnerStepExecutor, WorkflowStep } from '@agent-relay/workflow-types';
-
-import { GitHubClient } from './client.js';
-import type {
-  GitHubActionName,
-  GitHubActionParamsMap,
-  GitHubActionResult,
-  GitHubRuntime,
-  GitHubRuntimeConfig,
-  RepositoryRef,
-} from './types.js';
-import { GITHUB_ACTIONS } from './types.js';
-
-export type GitHubStepOutputMode = 'data' | 'result' | 'summary' | 'raw' | 'none';
-export type GitHubStepOutputFormat = 'json' | 'text';
-
-type RepoParamKeys = 'owner' | 'repo';
-type ParamsFor<TName extends GitHubActionName> = TName extends keyof GitHubActionParamsMap
-  ? GitHubActionParamsMap[TName]
-  : Record<string, unknown>;
-type StripRepoParams<TParams> = Omit<TParams, Extract<keyof TParams, RepoParamKeys>> &
-  Partial<Pick<TParams, Extract<keyof TParams, RepoParamKeys>>>;
-
-export type GitHubStepParams<TName extends GitHubActionName = GitHubActionName> = [
-  NonNullable<ParamsFor<TName>>,
-] extends [never]
-  ? Record<string, unknown>
-  : StripRepoParams<NonNullable<ParamsFor<TName>>>;
-
-export interface GitHubStepOutputConfig {
-  /** Which action result becomes the workflow step output. Defaults to "data". */
-  mode?: GitHubStepOutputMode;
-  /** Emit JSON for structured chaining or text for simple downstream interpolation. Defaults to "json". */
-  format?: GitHubStepOutputFormat;
-  /** Select a nested field from the projected output, e.g. "number" or "data.htmlUrl". */
-  path?: string;
-  /** Include adapter metadata such as runtime and timing in JSON output. Defaults false. */
-  includeMetadata?: boolean;
-  /** Include the selected runtime in JSON output. Defaults false. */
-  includeRuntime?: boolean;
-  /** Pretty-print JSON output. Defaults false. */
-  pretty?: boolean;
-}
-
-export interface GitHubStepConfig<TName extends GitHubActionName = GitHubActionName> {
-  /** Unique step name within the workflow. */
-  name: string;
-  /** Dependencies in the Relay workflow DAG. */
-  dependsOn?: string[];
-  /** GitHub action to execute. */
-  action: TName;
-  /** Repository in owner/repo format. Used as owner and repo params for repository-scoped actions. */
-  repo?: string | RepositoryRef;
-  /** Action-specific parameters. Values may include workflow templates such as {{steps.plan.output}}. */
-  params?: GitHubStepParams<TName>;
-  /** Runtime settings for local gh CLI, cloud/Nango, or auto detection. */
-  config?: GitHubRuntimeConfig;
-  /** Controls the string captured as {{steps.<name>.output}}. */
-  output?: GitHubStepOutputConfig;
-  /** Workflow step timeout in milliseconds. */
-  timeoutMs?: number;
-  /** Number of retry attempts when the workflow runner retries this integration step. */
-  retries?: number;
-}
-
-export interface GitHubStepExecutionContext {
-  workspaceId?: string;
-  client?: GitHubClient;
-  config?: GitHubRuntimeConfig;
-}
-
-export interface GitHubStepExecutionResult<TOutput = unknown> {
-  success: boolean;
-  output: string;
-  result: GitHubActionResult<TOutput>;
-  runtime?: GitHubRuntime;
-  error?: string;
-}
-
-export interface GitHubIntegrationStepResult {
-  output: string;
-  success: boolean;
-}
-
-type ResolvedParams = Record<string, unknown>;
-
-const GITHUB_INTEGRATION = 'github';
-const RESERVED_PARAM_KEYS = new Set([
-  'action',
-  'config',
-  'githubConfig',
-  'output',
-  'params',
-  'actionParams',
-  'repository',
-  'runtime',
-  'ghPath',
-  'timeout',
-  'retryOnRateLimit',
-  'maxRetries',
-]);
-
-/**
- * Create a Relay integration step that can be used in TypeScript workflows or
- * emitted into .relay YAML. Complex params/config objects are serialized so the
- * workflow template resolver can interpolate values before execution.
- */
-export function createGitHubStep<TName extends GitHubActionName>(
-  config: GitHubStepConfig<TName>
-): WorkflowStep {
-  validateGitHubStepConfig(config);
-
-  const params: Record<string, string> = {};
-
-  if (config.repo !== undefined) {
-    params.repo = repoToString(config.repo);
-  }
-  if (config.params !== undefined) {
-    params.params = JSON.stringify(config.params);
-  }
-  if (config.config !== undefined) {
-    params.config = JSON.stringify(config.config);
-  }
-  if (config.output !== undefined) {
-    params.output = JSON.stringify(config.output);
-  }
-
-  const step: WorkflowStep = {
-    name: config.name,
-    type: 'integration',
-    integration: GITHUB_INTEGRATION,
-    action: config.action,
-    params,
-  };
-
-  if (config.dependsOn !== undefined) step.dependsOn = config.dependsOn;
-  if (config.timeoutMs !== undefined) step.timeoutMs = config.timeoutMs;
-  if (config.retries !== undefined) step.retries = config.retries;
-
-  return step;
-}
-
-export class GitHubStepExecutor implements RunnerStepExecutor {
-  constructor(private readonly options: GitHubRuntimeConfig = {}) {}
-
-  async executeAgentStep(): Promise<string> {
-    throw new Error('GitHubStepExecutor only executes GitHub integration steps.');
-  }
-
-  async execute<TOutput = unknown>(
-    config: GitHubStepConfig,
-    context: GitHubStepExecutionContext = {}
-  ): Promise<GitHubStepExecutionResult<TOutput>> {
-    validateGitHubStepConfig(config);
-
-    const runtimeConfig = mergeRuntimeConfig(this.options, context.config, config.config);
-    if (context.workspaceId && !runtimeConfig.relayCloud?.workspaceId) {
-      runtimeConfig.relayCloud = {
-        ...runtimeConfig.relayCloud,
-        workspaceId: context.workspaceId,
-      };
-    }
-
-    const client = context.client ?? new GitHubClient(runtimeConfig);
-    const actionParams = buildActionParams(config);
-    const result = await client.executeAction<TOutput>(config.action, actionParams);
-    const runtime = result.metadata?.runtime ?? (await safeGetRuntime(client));
-    const output = formatStepOutput(config, result, runtime);
-
-    return {
-      success: result.success,
-      output,
-      result,
-      runtime,
-      error: result.error,
-    };
-  }
-
-  async executeIntegrationStep(
-    step: WorkflowStep,
-    resolvedParams: Record<string, string>,
-    context: { workspaceId?: string } = {}
-  ): Promise<GitHubIntegrationStepResult> {
-    if (step.integration !== GITHUB_INTEGRATION) {
-      return {
-        success: false,
-        output: `GitHubStepExecutor only handles "${GITHUB_INTEGRATION}" integration steps`,
-      };
-    }
-
-    try {
-      const config = githubStepConfigFromWorkflowStep(step, resolvedParams);
-      const result = await this.execute(config, context);
-
-      return {
-        success: result.success,
-        output: result.success ? result.output : result.output || result.error || 'GitHub step failed',
-      };
-    } catch (error) {
-      return {
-        success: false,
-        output: error instanceof Error ? error.message : String(error),
-      };
-    }
-  }
-}
-
-export function githubStepConfigFromWorkflowStep(
-  step: WorkflowStep,
-  resolvedParams: Record<string, string>
-): GitHubStepConfig {
-  const params = normalizeResolvedParams(resolvedParams);
-  const action = step.action as GitHubActionName | undefined;
-
-  if (!action) {
-    throw new Error(`GitHub step "${step.name}" requires an action`);
-  }
-
-  const config =
-    readJsonParam<GitHubRuntimeConfig>(params.config ?? params.githubConfig, 'config') ??
-    runtimeConfigFromParams(params);
-  const output = readJsonParam<GitHubStepOutputConfig>(params.output, 'output') ?? undefined;
-  const repo = readRepositoryParam(params);
-  const actionParams = readActionParams(params);
-
-  return {
-    name: step.name,
-    dependsOn: step.dependsOn,
-    action,
-    repo,
-    params: actionParams,
-    config,
-    output,
-    timeoutMs: step.timeoutMs,
-    retries: step.retries,
-  };
-}
-
-function validateGitHubStepConfig(config: GitHubStepConfig): void {
-  if (!config.name) {
-    throw new Error('GitHub step requires a non-empty name');
-  }
-  if (!config.action || typeof config.action !== 'string') {
-    throw new Error(`GitHub step "${config.name}" requires an action name`);
-  }
-  if (!GITHUB_ACTIONS.includes(config.action as never)) {
-    throw new Error(`GitHub step "${config.name}" uses unsupported action "${config.action}"`);
-  }
-  if (config.repo !== undefined) {
-    parseRepositoryRef(config.repo);
-  }
-  if (config.params !== undefined && !isRecord(config.params)) {
-    throw new Error(`GitHub step "${config.name}" params must be an object`);
-  }
-}
-
-function buildActionParams(config: GitHubStepConfig): unknown {
-  const repo = config.repo === undefined ? undefined : parseRepositoryRef(config.repo);
-  const params = config.params ? ({ ...config.params } as Record<string, unknown>) : {};
-  const merged = repo ? { ...repo, ...params } : params;
-
-  return Object.keys(merged).length === 0 ? undefined : merged;
-}
-
-function readActionParams(params: ResolvedParams): Record<string, unknown> {
-  const serializedParams = params.params ?? params.actionParams;
-  if (serializedParams !== undefined) {
-    const parsed = readJsonParam<Record<string, unknown>>(serializedParams, 'params');
-    if (parsed === undefined) return {};
-    if (!isRecord(parsed)) {
-      throw new Error('GitHub step params.params must be a JSON object');
-    }
-    return parsed;
-  }
-
-  const actionParams: Record<string, unknown> = {};
-  const repoValue = params.repo;
-  const repoIsRepositoryRef =
-    params.owner === undefined && typeof repoValue === 'string' && repoValue.includes('/');
-
-  for (const [key, value] of Object.entries(params)) {
-    if (RESERVED_PARAM_KEYS.has(key)) continue;
-    if (key === 'repo' && repoIsRepositoryRef) continue;
-    actionParams[key] = value;
-  }
-
-  return actionParams;
-}
-
-function readRepositoryParam(params: ResolvedParams): string | RepositoryRef | undefined {
-  const value = params.repository ?? (params.owner === undefined ? params.repo : undefined);
-  if (value === undefined) return undefined;
-  if (typeof value === 'string' || isRecord(value)) {
-    return parseRepositoryRef(value);
-  }
-  throw new Error('GitHub step repo must be in owner/repo format');
-}
-
-function runtimeConfigFromParams(params: ResolvedParams): GitHubRuntimeConfig | undefined {
-  const config: GitHubRuntimeConfig = {};
-
-  if (typeof params.runtime === 'string') {
-    config.runtime = params.runtime as GitHubRuntimeConfig['runtime'];
-  }
-  if (typeof params.ghPath === 'string') {
-    config.ghPath = params.ghPath;
-  }
-  if (typeof params.timeout === 'number') {
-    config.timeout = params.timeout;
-  }
-  if (typeof params.retryOnRateLimit === 'boolean') {
-    config.retryOnRateLimit = params.retryOnRateLimit;
-  }
-  if (typeof params.maxRetries === 'number') {
-    config.maxRetries = params.maxRetries;
-  }
-
-  return Object.keys(config).length === 0 ? undefined : config;
-}
-
-function mergeRuntimeConfig(...configs: Array<GitHubRuntimeConfig | undefined>): GitHubRuntimeConfig {
-  const merged: GitHubRuntimeConfig = {};
-
-  for (const config of configs) {
-    if (!config) continue;
-
-    const { nango, relayCloud, env, ...flatConfig } = config;
-    Object.assign(merged, flatConfig);
-    if (nango) {
-      merged.nango = {
-        ...merged.nango,
-        ...nango,
-      };
-    }
-    if (relayCloud) {
-      merged.relayCloud = {
-        ...merged.relayCloud,
-        ...relayCloud,
-      };
-    }
-    if (env) {
-      merged.env = {
-        ...merged.env,
-        ...env,
-      };
-    }
-  }
-
-  return merged;
-}
-
-function formatStepOutput<TOutput>(
-  config: GitHubStepConfig,
-  result: GitHubActionResult<TOutput>,
-  runtime?: GitHubRuntime
-): string {
-  const outputConfig = config.output ?? {};
-  const mode = outputConfig.mode ?? 'data';
-  const format = outputConfig.format ?? 'json';
-
-  if (mode === 'none') {
-    return '';
-  }
-
-  let projection = buildOutputProjection(mode, result, runtime, outputConfig);
-
-  if (outputConfig.path) {
-    projection = resolvePath(projection, outputConfig.path);
-  }
-
-  if (format === 'text') {
-    return projectionToText(projection);
-  }
-
-  return JSON.stringify(projection, undefined, outputConfig.pretty ? 2 : undefined);
-}
-
-function buildOutputProjection<TOutput>(
-  mode: GitHubStepOutputMode,
-  result: GitHubActionResult<TOutput>,
-  runtime: GitHubRuntime | undefined,
-  outputConfig: GitHubStepOutputConfig
-): unknown {
-  if (mode === 'raw') {
-    return result.output;
-  }
-
-  if (mode === 'summary') {
-    return withOptionalMetadata(summarizeResult(result, runtime), result, runtime, outputConfig);
-  }
-
-  if (mode === 'result') {
-    const projected: Record<string, unknown> = {
-      success: result.success,
-      output: result.output,
-    };
-    if (result.data !== undefined) projected.data = result.data;
-    if (result.error !== undefined) projected.error = result.error;
-
-    return withOptionalMetadata(projected, result, runtime, outputConfig);
-  }
-
-  const data = result.data ?? (result.output ? result.output : null);
-  return withOptionalMetadata(data, result, runtime, outputConfig);
-}
-
-function summarizeResult<TOutput>(
-  result: GitHubActionResult<TOutput>,
-  runtime?: GitHubRuntime
-): Record<string, unknown> {
-  if (!result.success) {
-    return {
-      success: false,
-      error: result.error ?? 'GitHub action failed',
-      runtime,
-    };
-  }
-
-  const data = result.data;
-  if (Array.isArray(data)) {
-    return {
-      success: true,
-      count: data.length,
-      items: data.slice(0, 10).map(summarizeValue),
-      runtime,
-    };
-  }
-
-  return {
-    success: true,
-    value: summarizeValue(data ?? result.output),
-    runtime,
-  };
-}
-
-function summarizeValue(value: unknown): unknown {
-  if (!isRecord(value)) {
-    return value;
-  }
-
-  const summary: Record<string, unknown> = {};
-  for (const key of [
-    'fullName',
-    'name',
-    'number',
-    'title',
-    'state',
-    'path',
-    'sha',
-    'type',
-    'defaultBranch',
-    'visibility',
-    'private',
-    'createdAt',
-    'updatedAt',
-    'htmlUrl',
-    'url',
-  ]) {
-    if (value[key] !== undefined) {
-      summary[key] = value[key];
-    }
-  }
-
-  return Object.keys(summary).length > 0 ? summary : value;
-}
-
-function withOptionalMetadata<TOutput>(
-  value: unknown,
-  result: GitHubActionResult<TOutput>,
-  runtime: GitHubRuntime | undefined,
-  outputConfig: GitHubStepOutputConfig
-): unknown {
-  if (!outputConfig.includeMetadata && !outputConfig.includeRuntime) {
-    return value;
-  }
-
-  const metadata: Record<string, unknown> = {};
-  if (outputConfig.includeRuntime && runtime !== undefined) metadata.runtime = runtime;
-  if (outputConfig.includeMetadata && result.metadata !== undefined) {
-    Object.assign(metadata, result.metadata);
-  }
-
-  return { value, metadata };
-}
-
-function projectionToText(value: unknown): string {
-  if (typeof value === 'string') return value;
-  if (value === null || value === undefined) return '';
-
-  if (Array.isArray(value)) {
-    return value.map((entry) => projectionToText(entry)).join('\n');
-  }
-
-  if (isRecord(value)) {
-    if ('output' in value) return projectionToText(value.output);
-    if ('value' in value) return projectionToText(value.value);
-    if ('data' in value) return projectionToText(value.data);
-    if ('content' in value) return projectionToText(value.content);
-    if ('body' in value) return projectionToText(value.body);
-    if ('title' in value) return projectionToText(value.title);
-    if ('fullName' in value) return projectionToText(value.fullName);
-    if ('path' in value) return projectionToText(value.path);
-    if ('url' in value) return projectionToText(value.url);
-  }
-
-  return JSON.stringify(value);
-}
-
-function resolvePath(value: unknown, path: string): unknown {
-  if (!path) return value;
-
-  let current = value;
-  for (const segment of path.split('.')) {
-    if (Array.isArray(current) && /^\d+$/.test(segment)) {
-      current = current[Number(segment)];
-      continue;
-    }
-    if (isRecord(current)) {
-      current = current[segment];
-      continue;
-    }
-    return undefined;
-  }
-
-  return current;
-}
-
-function parseRepositoryRef(repo: string | RepositoryRef | Record<string, unknown>): RepositoryRef {
-  if (typeof repo === 'string') {
-    const [owner, name, ...rest] = repo.split('/');
-    if (!owner || !name || rest.length > 0) {
-      throw new Error(`GitHub repo must be in owner/repo format: ${repo}`);
-    }
-
-    return {
-      owner,
-      repo: name,
-      fullName: `${owner}/${name}`,
-    };
-  }
-
-  const owner = typeof repo.owner === 'string' ? repo.owner : undefined;
-  const name = typeof repo.repo === 'string' ? repo.repo : undefined;
-  if (!owner || !name) {
-    throw new Error('GitHub repo object requires owner and repo');
-  }
-
-  return {
-    owner,
-    repo: name,
-    fullName: typeof repo.fullName === 'string' ? repo.fullName : `${owner}/${name}`,
-  };
-}
-
-function repoToString(repo: string | RepositoryRef): string {
-  return typeof repo === 'string' ? repo : `${repo.owner}/${repo.repo}`;
-}
-
-async function safeGetRuntime(client: GitHubClient): Promise<GitHubRuntime | undefined> {
-  try {
-    return await client.getRuntime();
-  } catch {
-    return undefined;
-  }
-}
-
-function normalizeResolvedParams(params: Record<string, string>): ResolvedParams {
-  const normalized: ResolvedParams = {};
-  for (const [key, value] of Object.entries(params)) {
-    normalized[key] = coerceScalar(value);
-  }
-  return normalized;
-}
-
-function coerceScalar(value: unknown): unknown {
-  if (typeof value !== 'string') {
-    return value;
-  }
-
-  const trimmed = value.trim();
-  if (trimmed === 'true') return true;
-  if (trimmed === 'false') return false;
-  if (trimmed === 'null') return null;
-  if (/^-?(?:0|[1-9]\d*)(?:\.\d+)?$/.test(trimmed)) return Number(trimmed);
-  if (
-    (trimmed.startsWith('{') && trimmed.endsWith('}')) ||
-    (trimmed.startsWith('[') && trimmed.endsWith(']')) ||
-    (trimmed.startsWith('"') && trimmed.endsWith('"'))
-  ) {
-    try {
-      return JSON.parse(trimmed);
-    } catch {
-      return value;
-    }
-  }
-
-  return value;
-}
-
-function readJsonParam<T>(value: unknown, name: string): T | undefined {
-  if (value === undefined) return undefined;
-  if (typeof value !== 'string') return value as T;
-
-  try {
-    return JSON.parse(value) as T;
-  } catch (error) {
-    throw new Error(
-      `GitHub step params.${name} must be valid JSON: ${error instanceof Error ? error.message : String(error)}`
-    );
-  }
-}
-
-function isRecord(value: unknown): value is Record<string, unknown> {
-  return typeof value === 'object' && value !== null && !Array.isArray(value);
-}
diff --git a/packages/personas/personas/agent-relay-workflow.json b/packages/personas/personas/agent-relay-workflow.json
deleted file mode 100644
index a65398d33..000000000
--- a/packages/personas/personas/agent-relay-workflow.json
+++ /dev/null
@@ -1,35 +0,0 @@
-{
-  "id": "agent-relay-workflow",
-  "intent": "agent-relay-workflow",
-  "tags": ["implementation", "documentation"],
-  "description": "Authors complete, runnable agent-relay workflow artifacts. Applies workflow skills as source material, preserves Ricky's artifact contract, and includes GitHub primitive PR shipping steps for implementation workflows.",
-  "skills": [
-    {
-      "id": "skill.sh/writing-agent-relay-workflows",
-      "source": "https://github.com/agentworkforce/skills#writing-agent-relay-workflows",
-      "description": "Skill to load and drive writing-agent-relay workflow automation from the Skills registry"
-    },
-    {
-      "id": "prpm/writing-agent-relay-workflows",
-      "source": "https://prpm.dev/packages/@agent-relay/writing-agent-relay-workflows",
-      "description": "PRPM wrapper for writing-agent-relay-workflows harness"
-    },
-    {
-      "id": "prpm/relay-80-100-workflow",
-      "source": "https://prpm.dev/packages/@agent-relay/relay-80-100-workflow",
-      "description": "PRPM-based provisioning for agent-relay/relay-80-100-workflow"
-    },
-    {
-      "id": "prpm/choosing-swarm-patterns",
-      "source": "https://prpm.dev/packages/@agent-relay/choosing-swarm-patterns",
-      "description": "PRPM-based provisioning for agent-relay/choosing-swarm-patterns"
-    }
-  ],
-  "harness": "opencode",
-  "model": "opencode/gpt-5-nano",
-  "systemPrompt": "You are an agent-relay workflow artifact author. Produce complete, runnable TypeScript workflow source plus metadata for the caller's requested artifact path; do not stop at a plan or example. Read the normalized spec, matched skill context, target mode, and response schema. Write a workflow with the Agent Relay workflow builder, a dedicated channel, explicit agents, deterministic preflight/context, bounded implementation steps, review, fix loop, final review, hard validation, regression evidence, and final signoff. Preserve declared targets, non-goals, acceptance gates, environment preflights, and tool fallbacks. When the workflow can change repository files or must ship a bug fix/feature, include GitHub primitive shipping steps in the generated workflow: import GitHubStepExecutor and createGitHubStep from @agent-relay/github-primitive, create or update a branch, commit changed files, open a pull request, and capture the PR URL. Omit PR steps only when the normalized spec explicitly says planning-only, no PR, or PR creation is out of scope. Never perform branch, commit, or pull-request side effects during persona generation itself; generate workflow source that does them later when executed. Keep runtime-agent prompts model-agnostic. Output contract: return only structured JSON or a fenced TypeScript artifact plus metadata, with artifact.content containing the complete workflow source.",
-  "harnessSettings": {
-    "reasoning": "medium",
-    "timeoutSeconds": 3600
-  }
-}
diff --git a/packages/personas/personas/opencode-workflow-specialist.json b/packages/personas/personas/opencode-workflow-specialist.json
deleted file mode 100644
index 39f6fb5c5..000000000
--- a/packages/personas/personas/opencode-workflow-specialist.json
+++ /dev/null
@@ -1,13 +0,0 @@
-{
-  "id": "opencode-workflow-specialist",
-  "intent": "opencode-workflow-correctness",
-  "tags": ["debugging"],
-  "description": "Diagnoses and repairs opencode-based agent-relay workflow failures across SDK, broker, cloud bootstrap, and CLI layers",
-  "harness": "opencode",
-  "model": "opencode/gpt-5-nano",
-  "systemPrompt": "You are the opencode workflow specialist in efficient mode. Keep the same quality bar as top tier; reduce only depth and verbosity. Own the full opencode workflow surface area: SDK spawn dispatch and transport selection, opencode session collection, the Rust headless worker, cloud bootstrap extraction/fallback, Daytona snapshot and launcher provisioning, and opencode CLI auth/model/mode quirks. Reproduce first, isolate the broken layer, fix the root cause in the correct layer, and verify with repeat runs across the failing opencode case plus nearby shared paths when relevant. Priorities remain end-to-end correctness, local test fidelity, observability, cleanup, then speed. Avoid interactive: false workarounds, env-var hacks, SDK-bypassing spawn paths, and untested fixes that may regress other providers. Output contract: brief repro status, broken layer, reproduction recipe, root cause, minimal fix, and multi-scenario evidence.",
-  "harnessSettings": {
-    "reasoning": "medium",
-    "timeoutSeconds": 1100
-  }
-}
diff --git a/packages/sdk-py/tests/test_workflow_templates.py b/packages/sdk-py/tests/test_workflow_templates.py
deleted file mode 100644
index 375c4c563..000000000
--- a/packages/sdk-py/tests/test_workflow_templates.py
+++ /dev/null
@@ -1,450 +0,0 @@
-"""Tests for workflow templates including review-loop pattern.
-
-These tests verify that workflow configurations are properly structured
-and can be serialized to valid YAML for the relay runtime.
-"""
-
-import yaml
-import pytest
-from agent_relay import (
-    workflow,
-    dag,
-    fan_out,
-    pipeline,
-    PipelineStage,
-    TemplateAgent,
-    TemplateStep,
-    VerificationCheck,
-)
-
-
-class TestReviewLoopPattern:
-    """Tests for the review-loop workflow pattern."""
-
-    def test_basic_review_loop_structure(self):
-        """Test basic review-loop workflow with implementer and reviewers."""
-        config = (
-            workflow("review-loop-test")
-            .description("Test review loop workflow")
-            .pattern("review-loop")
-            .agent("implementer", cli="claude", role="Senior developer implementing the task")
-            .agent("reviewer-diff", cli="codex", role="Code quality reviewer", interactive=False)
-            .agent("reviewer-arch", cli="claude", role="Architecture reviewer", interactive=False)
-            .agent("reviewer-security", cli="codex", role="Security reviewer", interactive=False)
-            .step("implement", agent="implementer", task="Implement the feature")
-            .step("review-diff", agent="reviewer-diff", task="Review code quality", depends_on=["implement"])
-            .step("review-arch", agent="reviewer-arch", task="Review architecture", depends_on=["implement"])
-            .step("review-security", agent="reviewer-security", task="Security review", depends_on=["implement"])
-            .step(
-                "consolidate",
-                agent="implementer",
-                task="Consolidate review feedback",
-                depends_on=["review-diff", "review-arch", "review-security"],
-            )
-            .step("address-feedback", agent="implementer", task="Address issues", depends_on=["consolidate"])
-            .to_config()
-        )
-
-        assert config["swarm"]["pattern"] == "review-loop"
-        assert len(config["agents"]) == 4
-        assert len(config["workflows"][0]["steps"]) == 6
-
-        # Check implementer is interactive, reviewers are not
-        agents = {a["name"]: a for a in config["agents"]}
-        assert agents["implementer"].get("interactive", True) is True
-        assert agents["reviewer-diff"]["interactive"] is False
-        assert agents["reviewer-arch"]["interactive"] is False
-        assert agents["reviewer-security"]["interactive"] is False
-
-    def test_review_loop_with_verification(self):
-        """Test review-loop with verification checks."""
-        config = (
-            workflow("review-loop-verified")
-            .pattern("review-loop")
-            .agent("implementer", cli="claude")
-            .agent("reviewer", cli="codex", interactive=False)
-            .step(
-                "implement",
-                agent="implementer",
-                task="Implement feature",
-                verification=VerificationCheck(type="output_contains", value="IMPLEMENTATION COMPLETE"),
-            )
-            .step(
-                "review",
-                agent="reviewer",
-                task="Review implementation",
-                depends_on=["implement"],
-                verification=VerificationCheck(type="output_contains", value="REVIEW:"),
-            )
-            .step(
-                "address",
-                agent="implementer",
-                task="Address feedback",
-                depends_on=["review"],
-                verification=VerificationCheck(type="output_contains", value="ADDRESSED"),
-            )
-            .to_config()
-        )
-
-        steps = config["workflows"][0]["steps"]
-        assert steps[0]["verification"]["value"] == "IMPLEMENTATION COMPLETE"
-        assert steps[1]["verification"]["value"] == "REVIEW:"
-        assert steps[2]["verification"]["value"] == "ADDRESSED"
-
-    def test_review_loop_with_coordination(self):
-        """Test review-loop with barriers for synchronization."""
-        config = (
-            workflow("review-loop-coordinated")
-            .pattern("review-loop")
-            .coordination(
-                barriers=[{"name": "reviews-complete", "waitFor": ["review-1", "review-2"]}],
-                consensus_strategy="majority",
-            )
-            .agent("implementer", cli="claude")
-            .agent("reviewer-1", cli="codex", interactive=False)
-            .agent("reviewer-2", cli="claude", interactive=False)
-            .step("implement", agent="implementer", task="Do work")
-            .step("review-1", agent="reviewer-1", task="Review 1", depends_on=["implement"])
-            .step("review-2", agent="reviewer-2", task="Review 2", depends_on=["implement"])
-            .step("consolidate", agent="implementer", task="Merge", depends_on=["review-1", "review-2"])
-            .to_config()
-        )
-
-        assert config["coordination"]["consensusStrategy"] == "majority"
-        assert len(config["coordination"]["barriers"]) == 1
-        assert config["coordination"]["barriers"][0]["waitFor"] == ["review-1", "review-2"]
-
-    def test_review_loop_yaml_roundtrip(self):
-        """Test that review-loop config survives YAML roundtrip."""
-        builder = (
-            workflow("review-loop-yaml")
-            .pattern("review-loop")
-            .agent("impl", cli="claude")
-            .agent("rev", cli="codex", interactive=False)
-            .step("do", agent="impl", task="Do it")
-            .step("check", agent="rev", task="Check it", depends_on=["do"])
-        )
-
-        yaml_str = builder.to_yaml()
-        parsed = yaml.safe_load(yaml_str)
-
-        assert parsed["swarm"]["pattern"] == "review-loop"
-        assert len(parsed["agents"]) == 2
-        assert parsed["agents"][1]["interactive"] is False
-
-
-class TestHubSpokePattern:
-    """Tests for hub-spoke workflow pattern."""
-
-    def test_basic_hub_spoke(self):
-        """Test basic hub-spoke with lead and workers."""
-        config = (
-            workflow("hub-spoke-test")
-            .pattern("hub-spoke")
-            .agent("lead", cli="claude", role="lead")
-            .agent("worker-1", cli="codex")
-            .agent("worker-2", cli="codex")
-            .agent("worker-3", cli="codex")
-            .step("plan", agent="lead", task="Create plan")
-            .step("work-1", agent="worker-1", task="Task 1", depends_on=["plan"])
-            .step("work-2", agent="worker-2", task="Task 2", depends_on=["plan"])
-            .step("work-3", agent="worker-3", task="Task 3", depends_on=["plan"])
-            .step("consolidate", agent="lead", task="Merge work", depends_on=["work-1", "work-2", "work-3"])
-            .to_config()
-        )
-
-        assert config["swarm"]["pattern"] == "hub-spoke"
-        assert len(config["agents"]) == 4
-        assert config["agents"][0]["role"] == "lead"
-
-
-class TestPipelinePattern:
-    """Tests for pipeline workflow pattern."""
-
-    def test_pipeline_with_stages(self):
-        """Test pipeline with multiple stages."""
-        config = pipeline(
-            "pipeline-test",
-            stages=[
-                PipelineStage(name="stage-1", task="First stage"),
-                PipelineStage(name="stage-2", task="Second stage"),
-                PipelineStage(name="stage-3", task="Third stage"),
-            ],
-        ).to_config()
-
-        assert config["swarm"]["pattern"] == "pipeline"
-        steps = config["workflows"][0]["steps"]
-        assert len(steps) == 3
-        assert steps[1]["dependsOn"] == ["stage-1"]
-        assert steps[2]["dependsOn"] == ["stage-2"]
-
-
-class TestDAGPattern:
-    """Tests for DAG workflow pattern."""
-
-    def test_dag_with_dependencies(self):
-        """Test DAG with complex dependencies."""
-        config = dag(
-            "dag-test",
-            agents=[
-                TemplateAgent(name="frontend", cli="claude"),
-                TemplateAgent(name="backend", cli="codex"),
-                TemplateAgent(name="tester", cli="claude"),
-            ],
-            steps=[
-                TemplateStep(name="design", agent="frontend", task="Design UI"),
-                TemplateStep(name="api", agent="backend", task="Build API"),
-                TemplateStep(name="integrate", agent="frontend", task="Integrate", depends_on=["design", "api"]),
-                TemplateStep(name="test", agent="tester", task="Test all", depends_on=["integrate"]),
-            ],
-        ).to_config()
-
-        assert config["swarm"]["pattern"] == "dag"
-        steps = config["workflows"][0]["steps"]
-        assert steps[2]["dependsOn"] == ["design", "api"]
-        assert steps[3]["dependsOn"] == ["integrate"]
-
-
-class TestFanOutPattern:
-    """Tests for fan-out workflow pattern."""
-
-    def test_fan_out_with_synthesis(self):
-        """Test fan-out with parallel tasks and synthesis."""
-        config = fan_out(
-            "fan-out-test",
-            tasks=["Analyze module A", "Analyze module B", "Analyze module C"],
-            synthesis_task="Combine all analyses into report",
-        ).to_config()
-
-        assert config["swarm"]["pattern"] == "fan-out"
-        steps = config["workflows"][0]["steps"]
-        assert len(steps) == 4  # 3 tasks + 1 synthesis
-        # Synthesis depends on all tasks
-        assert steps[3]["dependsOn"] == ["task-1", "task-2", "task-3"]
-
-
-class TestMultiCLIWorkflows:
-    """Tests for workflows with multiple CLI types."""
-
-    def test_mixed_cli_workflow(self):
-        """Test workflow with Claude, Codex, and other CLIs."""
-        config = (
-            workflow("multi-cli")
-            .pattern("dag")
-            .agent("planner", cli="claude", role="Planning and coordination")
-            .agent("coder", cli="codex", role="Implementation")
-            .agent("reviewer", cli="gemini", role="Code review")
-            .agent("tester", cli="aider", role="Test writing")
-            .step("plan", agent="planner", task="Create implementation plan")
-            .step("code", agent="coder", task="Implement feature", depends_on=["plan"])
-            .step("review", agent="reviewer", task="Review code", depends_on=["code"])
-            .step("test", agent="tester", task="Write tests", depends_on=["code"])
-            .step("finalize", agent="planner", task="Final review", depends_on=["review", "test"])
-            .to_config()
-        )
-
-        clis = [a["cli"] for a in config["agents"]]
-        assert "claude" in clis
-        assert "codex" in clis
-        assert "gemini" in clis
-        assert "aider" in clis
-
-
-class TestWorkflowValidation:
-    """Tests for workflow validation."""
-
-    def test_dependency_cycle_detection(self):
-        """Test that circular dependencies are detected (runtime validation)."""
-        # Note: Current builder doesn't validate cycles at build time,
-        # but this documents expected behavior
-        config = (
-            workflow("cycle-test")
-            .pattern("dag")
-            .agent("a", cli="claude")
-            .step("s1", agent="a", task="First", depends_on=["s2"])
-            .step("s2", agent="a", task="Second", depends_on=["s1"])
-            .to_config()
-        )
-
-        # Config builds but would fail at runtime
-        # This test documents the current behavior
-        steps = config["workflows"][0]["steps"]
-        assert steps[0]["dependsOn"] == ["s2"]
-        assert steps[1]["dependsOn"] == ["s1"]
-
-    def test_unique_agent_names(self):
-        """Test that duplicate agent names are handled."""
-        # Builder allows duplicates (latest wins or both appear)
-        # This documents expected behavior
-        config = (
-            workflow("dup-test")
-            .pattern("dag")
-            .agent("worker", cli="claude")
-            .agent("worker", cli="codex")  # Same name, different CLI
-            .step("s1", agent="worker", task="Do work")
-            .to_config()
-        )
-
-        # Current behavior: both agents appear
-        assert len(config["agents"]) == 2
-
-    def test_step_references_existing_agent(self):
-        """Test step references an agent that exists."""
-        config = (
-            workflow("ref-test")
-            .pattern("dag")
-            .agent("worker", cli="claude")
-            .step("s1", agent="worker", task="Valid reference")
-            .to_config()
-        )
-
-        # Step agent matches defined agent
-        assert config["workflows"][0]["steps"][0]["agent"] == "worker"
-        assert config["agents"][0]["name"] == "worker"
-
-
-class TestWorkflowConfiguration:
-    """Tests for advanced workflow configuration."""
-
-    def test_error_handling_config(self):
-        """Test error handling configuration."""
-        config = (
-            workflow("error-test")
-            .pattern("dag")
-            .on_error("retry", max_retries=3, retry_delay_ms=5000, notify_channel="errors")
-            .agent("a", cli="claude")
-            .step("s1", agent="a", task="May fail")
-            .to_config()
-        )
-
-        assert config["errorHandling"]["strategy"] == "retry"
-        assert config["errorHandling"]["maxRetries"] == 3
-        assert config["errorHandling"]["retryDelayMs"] == 5000
-        assert config["errorHandling"]["notifyChannel"] == "errors"
-
-    def test_idle_nudge_config(self):
-        """Test idle agent detection configuration."""
-        config = (
-            workflow("idle-test")
-            .pattern("dag")
-            .idle_nudge(nudge_after_ms=60000, escalate_after_ms=120000, max_nudges=2)
-            .agent("a", cli="claude")
-            .step("s1", agent="a", task="Long running task")
-            .to_config()
-        )
-
-        nudge = config["swarm"]["idleNudge"]
-        assert nudge["nudgeAfterMs"] == 60000
-        assert nudge["escalateAfterMs"] == 120000
-        assert nudge["maxNudges"] == 2
-
-    def test_state_config(self):
-        """Test state management configuration."""
-        config = (
-            workflow("state-test")
-            .pattern("dag")
-            .state("redis", ttl_ms=3600000, namespace="myapp")
-            .agent("a", cli="claude")
-            .step("s1", agent="a", task="Stateful task")
-            .to_config()
-        )
-
-        assert config["state"]["backend"] == "redis"
-        assert config["state"]["ttlMs"] == 3600000
-        assert config["state"]["namespace"] == "myapp"
-
-    def test_trajectory_config(self):
-        """Test trajectory recording configuration."""
-        config = (
-            workflow("trajectory-test")
-            .pattern("dag")
-            .trajectories(enabled=True, reflect_on_barriers=True, auto_decisions=True)
-            .agent("a", cli="claude")
-            .step("s1", agent="a", task="Tracked task")
-            .to_config()
-        )
-
-        traj = config["trajectories"]
-        assert traj["enabled"] is True
-        assert traj["reflectOnBarriers"] is True
-        assert traj["autoDecisions"] is True
-
-    def test_agent_constraints(self):
-        """Test agent resource constraints."""
-        config = (
-            workflow("constraints-test")
-            .pattern("dag")
-            .agent(
-                "constrained",
-                cli="claude",
-                model="claude-opus",
-                max_tokens=8000,
-                timeout_ms=300000,
-                retries=2,
-                idle_threshold_secs=30,
-            )
-            .step("s1", agent="constrained", task="Constrained task")
-            .to_config()
-        )
-
-        constraints = config["agents"][0]["constraints"]
-        assert constraints["model"] == "claude-opus"
-        assert constraints["maxTokens"] == 8000
-        assert constraints["timeoutMs"] == 300000
-        assert constraints["retries"] == 2
-        assert constraints["idleThresholdSecs"] == 30
-
-
-class TestYAMLGeneration:
-    """Tests for YAML output generation."""
-
-    def test_yaml_output_is_valid(self):
-        """Test that generated YAML is parseable."""
-        builder = (
-            workflow("yaml-valid")
-            .pattern("dag")
-            .agent("a", cli="claude")
-            .step("s1", agent="a", task="Test task")
-        )
-
-        yaml_str = builder.to_yaml()
-
-        # Should parse without error
-        parsed = yaml.safe_load(yaml_str)
-        assert parsed is not None
-        assert isinstance(parsed, dict)
-
-    def test_yaml_preserves_multiline_tasks(self):
-        """Test that multiline tasks are preserved in YAML."""
-        multiline_task = """Do the following:
-1. First step
-2. Second step
-3. Third step"""
-
-        builder = (
-            workflow("multiline")
-            .pattern("dag")
-            .agent("a", cli="claude")
-            .step("s1", agent="a", task=multiline_task)
-        )
-
-        yaml_str = builder.to_yaml()
-        parsed = yaml.safe_load(yaml_str)
-
-        assert "1. First step" in parsed["workflows"][0]["steps"][0]["task"]
-        assert "3. Third step" in parsed["workflows"][0]["steps"][0]["task"]
-
-    def test_yaml_special_characters(self):
-        """Test that special characters are properly escaped."""
-        config = (
-            workflow("special-chars")
-            .description("Test: 'quotes' and \"double quotes\"")
-            .pattern("dag")
-            .agent("a", cli="claude")
-            .step("s1", agent="a", task="Use {{variable}} syntax")
-            .to_config()
-        )
-
-        # Should handle special characters
-        assert "quotes" in config["description"]
-        assert "{{variable}}" in config["workflows"][0]["steps"][0]["task"]
diff --git a/packages/sdk/README.md b/packages/sdk/README.md
index 754093fc6..92ee91b6c 100644
--- a/packages/sdk/README.md
+++ b/packages/sdk/README.md
@@ -15,7 +15,7 @@ npm install @agent-relay/sdk
 The workflow builder is the primary way to define and run multi-agent workflows:
 
 ```ts
-import { workflow } from '@agent-relay/sdk/workflows';
+import { workflow } from '@relayflows/core';
 
 const result = await workflow('my-feature')
   .pattern('dag')
@@ -179,7 +179,7 @@ Notes:
 
 ```ts
 import { AgentRelayClient } from '@agent-relay/sdk/client';
-import { workflow, WorkflowBuilder } from '@agent-relay/sdk/workflows';
+import { workflow, WorkflowBuilder } from '@relayflows/core';
 import { ConsensusCoordinator } from '@agent-relay/sdk/consensus';
 import { ShadowCoordinator } from '@agent-relay/sdk/shadow';
 ```
@@ -189,7 +189,7 @@ import { ShadowCoordinator } from '@agent-relay/sdk/shadow';
 Built-in templates for common patterns:
 
 ```ts
-import { fanOut, pipeline, dag } from '@agent-relay/sdk/workflows';
+import { fanOut, pipeline, dag } from '@relayflows/core';
 
 // Fan-out: parallel execution with synthesis
 const builder = fanOut('analysis', {
diff --git a/packages/sdk/package.json b/packages/sdk/package.json
index 380fc60c1..04393a101 100644
--- a/packages/sdk/package.json
+++ b/packages/sdk/package.json
@@ -52,11 +52,6 @@
       "import": "./dist/browser.js",
       "default": "./dist/browser.js"
     },
-    "./workflows": {
-      "types": "./dist/workflows/index.d.ts",
-      "import": "./dist/workflows/index.js",
-      "default": "./dist/workflows/index.js"
-    },
     "./communicate": {
       "types": "./dist/communicate/index.d.ts",
       "import": "./dist/communicate/index.js",
@@ -121,21 +116,6 @@
       "types": "./dist/slack.d.ts",
       "import": "./dist/slack.js",
       "default": "./dist/slack.js"
-    },
-    "./provisioner/seeder": {
-      "types": "./dist/provisioner/seeder.d.ts",
-      "import": "./dist/provisioner/seeder.js",
-      "default": "./dist/provisioner/seeder.js"
-    },
-    "./provisioner/local-jwks": {
-      "types": "./dist/provisioner/local-jwks.d.ts",
-      "import": "./dist/provisioner/local-jwks.js",
-      "default": "./dist/provisioner/local-jwks.js"
-    },
-    "./provisioner/token": {
-      "types": "./dist/provisioner/token.d.ts",
-      "import": "./dist/provisioner/token.js",
-      "default": "./dist/provisioner/token.js"
     }
   },
   "files": [
@@ -150,13 +130,12 @@
     "directory": "packages/sdk"
   },
   "scripts": {
-    "prebuild": "npm --prefix ../workflow-types run build && npm --prefix ../github-primitive run build && npm --prefix ../slack-primitive run build && npm --prefix ../config run build && npm --prefix ../cloud run build",
+    "prebuild": "npm --prefix ../github-primitive run build && npm --prefix ../slack-primitive run build && npm --prefix ../config run build && npm --prefix ../cloud run build",
     "build": "npx tsc -p tsconfig.build.json",
     "build:full": "tsc -p tsconfig.json && npm run bundle:binary",
     "bundle:binary": "node ./scripts/bundle-agent-relay.mjs",
     "check": "tsc -p tsconfig.json --noEmit",
-    "test": "npm run build && node --test dist/__tests__/integration.test.js && npm run test:vitest",
-    "test:vitest": "vitest run --config vitest.config.ts src/workflows/__tests__/run-script.test.ts",
+    "test": "npm run build && node --test dist/__tests__/integration.test.js",
     "test:quickstart": "node --test dist/__tests__/quickstart.test.js",
     "quickstart": "node dist/examples/quickstart.js",
     "demo": "node dist/examples/demo.js",
@@ -174,7 +153,6 @@
     "@agent-relay/config": "7.1.1",
     "@agent-relay/github-primitive": "7.1.1",
     "@agent-relay/slack-primitive": "7.1.1",
-    "@agent-relay/workflow-types": "7.1.1",
     "@agentworkforce/persona-kit": "^3.0.20",
     "@relaycast/sdk": "^1.1.0",
     "@relayfile/sdk": ">=0.1.2 <1",
diff --git a/packages/sdk/src/__tests__/builder-deterministic.test.ts b/packages/sdk/src/__tests__/builder-deterministic.test.ts
deleted file mode 100644
index 5651534ed..000000000
--- a/packages/sdk/src/__tests__/builder-deterministic.test.ts
+++ /dev/null
@@ -1,192 +0,0 @@
-/**
- * Tests for deterministic and worktree step support in WorkflowBuilder.
- */
-import { afterEach, describe, it, expect, vi } from 'vitest';
-import { workflow } from '../workflows/builder.js';
-
-describe('deterministic/worktree steps in builder', () => {
-  afterEach(() => {
-    vi.restoreAllMocks();
-  });
-
-  it('deterministic step emits correct config', () => {
-    const config = workflow('test')
-      .agent('worker', { cli: 'claude' })
-      .step('read-files', {
-        type: 'deterministic',
-        command: 'cat src/index.ts',
-        verification: { type: 'exit_code', value: '0' },
-      })
-      .step('build', { agent: 'worker', task: 'Build the project' })
-      .toConfig();
-
-    const steps = config.workflows![0].steps;
-    expect(steps).toHaveLength(2);
-
-    // Deterministic step
-    expect(steps[0].name).toBe('read-files');
-    expect(steps[0].type).toBe('deterministic');
-    expect(steps[0].command).toBe('cat src/index.ts');
-    expect(steps[0].agent).toBeUndefined();
-    expect(steps[0].task).toBeUndefined();
-    expect(steps[0].verification).toEqual({ type: 'exit_code', value: '0' });
-
-    // Agent step
-    expect(steps[1].name).toBe('build');
-    expect(steps[1].agent).toBe('worker');
-    expect(steps[1].task).toBe('Build the project');
-    expect(steps[1].type).toBeUndefined();
-  });
-
-  it('deterministic step with all options', () => {
-    const config = workflow('test')
-      .agent('worker', { cli: 'claude' })
-      .step('run-cmd', {
-        type: 'deterministic',
-        command: 'npm test',
-        captureOutput: true,
-        failOnError: false,
-        dependsOn: ['build'],
-        timeoutMs: 30000,
-      })
-      .step('final', { agent: 'worker', task: 'Finalize' })
-      .toConfig();
-
-    const step = config.workflows![0].steps[0];
-    expect(step.captureOutput).toBe(true);
-    expect(step.failOnError).toBe(false);
-    expect(step.dependsOn).toEqual(['build']);
-    expect(step.timeoutMs).toBe(30000);
-  });
-
-  it('worktree step emits correct config', () => {
-    const config = workflow('test')
-      .agent('worker', { cli: 'claude' })
-      .step('setup-worktree', {
-        type: 'worktree',
-        branch: 'feature/new',
-        baseBranch: 'main',
-        path: '.worktrees/feature-new',
-        createBranch: true,
-      })
-      .step('work', { agent: 'worker', task: 'Do work', dependsOn: ['setup-worktree'] })
-      .toConfig();
-
-    const step = config.workflows![0].steps[0];
-    expect(step.type).toBe('worktree');
-    expect(step.branch).toBe('feature/new');
-    expect(step.baseBranch).toBe('main');
-    expect(step.path).toBe('.worktrees/feature-new');
-    expect(step.createBranch).toBe(true);
-    expect(step.agent).toBeUndefined();
-    expect(step.command).toBeUndefined();
-  });
-
-  it('deterministic-only workflow does not require agents', () => {
-    const config = workflow('infra')
-      .step('lint', { type: 'deterministic', command: 'npm run lint' })
-      .step('test', {
-        type: 'deterministic',
-        command: 'npm test',
-        dependsOn: ['lint'],
-      })
-      .toConfig();
-
-    expect(config.agents).toHaveLength(0);
-    expect(config.workflows![0].steps).toHaveLength(2);
-  });
-
-  it('deterministic step without command throws', () => {
-    expect(() => {
-      workflow('test').step('bad', { type: 'deterministic' } as any);
-    }).toThrow('deterministic steps must have a command');
-  });
-
-  it('deterministic step with agent throws', () => {
-    expect(() => {
-      workflow('test').step('bad', { type: 'deterministic', command: 'ls', agent: 'x', task: 'y' } as any);
-    }).toThrow('deterministic steps must not have agent or task');
-  });
-
-  it('agent step without agent/task throws', () => {
-    expect(() => {
-      workflow('test').step('bad', {} as any);
-    }).toThrow('Agent steps must have both agent and task');
-  });
-
-  it('agent steps without any agent definition throws', () => {
-    expect(() => {
-      workflow('test').step('work', { agent: 'worker', task: 'Do work' }).toConfig();
-    }).toThrow('Workflow must have at least one agent when using agent steps');
-  });
-
-  it('toYaml includes deterministic steps', () => {
-    const yamlStr = workflow('test').step('check', { type: 'deterministic', command: 'echo hello' }).toYaml();
-
-    expect(yamlStr).toContain('type: deterministic');
-    expect(yamlStr).toContain('command: echo hello');
-  });
-
-  it('preserves diagnosticAgent in agent step verification', () => {
-    const config = workflow('traceback')
-      .agent('generator', { cli: 'claude' })
-      .agent('reviewer', { cli: 'claude' })
-      .step('generate', {
-        agent: 'generator',
-        task: 'Implement the change',
-        verification: {
-          type: 'custom',
-          value: 'npx nango compile',
-          diagnosticAgent: 'reviewer',
-        },
-        retries: 2,
-      })
-      .toConfig();
-
-    expect(config.workflows?.[0].steps[0].verification).toEqual({
-      type: 'custom',
-      value: 'npx nango compile',
-      diagnosticAgent: 'reviewer',
-    });
-  });
-
-  it('throws when diagnosticAgent is not in the agents list', () => {
-    expect(() => {
-      workflow('traceback')
-        .agent('generator', { cli: 'claude' })
-        .step('generate', {
-          agent: 'generator',
-          task: 'Implement the change',
-          verification: {
-            type: 'custom',
-            value: 'npx nango compile',
-            diagnosticAgent: 'reviewer',
-          },
-          retries: 2,
-        })
-        .toConfig();
-    }).toThrow('Step "generate" references unknown diagnosticAgent "reviewer"');
-  });
-
-  it('warns when diagnosticAgent is configured without step retries', () => {
-    const warnSpy = vi.spyOn(console, 'warn').mockImplementation(() => {});
-
-    workflow('traceback')
-      .agent('generator', { cli: 'claude' })
-      .agent('reviewer', { cli: 'claude' })
-      .step('generate', {
-        agent: 'generator',
-        task: 'Implement the change',
-        verification: {
-          type: 'custom',
-          value: 'npx nango compile',
-          diagnosticAgent: 'reviewer',
-        },
-      })
-      .toConfig();
-
-    expect(warnSpy).toHaveBeenCalledWith(
-      'Step "generate": diagnosticAgent configured but no retries — diagnostic will never run'
-    );
-  });
-});
diff --git a/packages/sdk/src/__tests__/completion-pipeline.test.ts b/packages/sdk/src/__tests__/completion-pipeline.test.ts
deleted file mode 100644
index c6bbcd1d8..000000000
--- a/packages/sdk/src/__tests__/completion-pipeline.test.ts
+++ /dev/null
@@ -1,1895 +0,0 @@
-/**
- * Completion Pipeline tests for Point-Person-Led Completion spec.
- *
- * Validates:
- * 1. Evidence-based completion (verification passes without marker)
- * 2. Owner decision parsing (OWNER_DECISION: COMPLETE/INCOMPLETE_RETRY/INCOMPLETE_FAIL)
- * 3. Tolerant review parsing (accepts semantic equivalents)
- * 4. Channel evidence contributions (WORKER_DONE signals)
- * 5. Backward compatibility with marker-based workflows
- * 6. Codex/Gemini/Supervisor pattern compatibility
- * 7. Map-reduce workflows remain unaffected
- */
-
-import { describe, it, expect, vi, beforeEach } from 'vitest';
-import type { WorkflowDb } from '../workflows/runner.js';
-import type {
-  RelayYamlConfig,
-  WorkflowRunRow,
-  WorkflowStepRow,
-  WorkflowStepCompletionReason,
-  StepCompletionEvidence,
-  StepCompletionDecision,
-} from '../workflows/types.js';
-
-// ── Mock fetch to prevent real HTTP calls (Relaycast provisioning) ───────────
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_live_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-// ── Mock RelayCast SDK ───────────────────────────────────────────────────────
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: {
-    register: vi.fn().mockResolvedValue({ token: 'token-1' }),
-  },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-class MockRelayError extends Error {
-  code: string;
-  constructor(code: string, message: string, status = 400) {
-    super(message);
-    this.code = code;
-    this.name = 'RelayError';
-    (this as any).status = status;
-  }
-}
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: MockRelayError,
-}));
-
-// ── Mock AgentRelay ──────────────────────────────────────────────────────────
-
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-let waitForIdleFn: (ms?: number) => Promise<'idle' | 'timeout' | 'exited'>;
-let mockSpawnOutputs: string[] = [];
-
-vi.mock('node:child_process', async () => {
-  const actual = await vi.importActual<typeof import('node:child_process')>('node:child_process');
-  const { EventEmitter } = await import('node:events');
-
-  return {
-    ...actual,
-    spawn: vi.fn().mockImplementation(() => {
-      const child = new EventEmitter() as any;
-      child.pid = 4242;
-      child.kill = vi.fn();
-      child.stdout = new EventEmitter();
-      child.stderr = new EventEmitter();
-
-      const output = mockSpawnOutputs.shift() ?? '';
-      queueMicrotask(() => {
-        if (output) child.stdout.emit('data', Buffer.from(output));
-        child.emit('close', 0, null);
-      });
-
-      return child;
-    }),
-  };
-});
-
-const mockAgent = {
-  name: 'test-agent-abc',
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return waitForIdleFn;
-  },
-  release: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-function never<T>(): Promise<T> {
-  return new Promise(() => {});
-}
-
-const defaultSpawnPtyImplementation = async ({ name, task }: { name: string; task?: string }) => {
-  const queued = mockSpawnOutputs.shift();
-  const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-  const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-  const output =
-    queued ??
-    (isReview
-      ? 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n'
-      : stepComplete
-        ? `STEP_COMPLETE:${stepComplete}\n`
-        : 'STEP_COMPLETE:unknown\n');
-
-  queueMicrotask(() => {
-    emitRelayEvent('workerOutput', { name, chunk: output });
-  });
-
-  return { ...mockAgent, name };
-};
-
-const relayListeners = new Map<string, Set<(...args: any[]) => void>>();
-
-function emitRelayEvent(event: string, payload: any) {
-  const set = relayListeners.get(event);
-  if (!set) return;
-  for (const fn of set) fn(payload);
-}
-
-const mockRelayInstance = {
-  spawnPty: vi.fn().mockImplementation(defaultSpawnPtyImplementation),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  addListener: vi.fn((event: string, fn: (...args: any[]) => void) => {
-    let set = relayListeners.get(event);
-    if (!set) {
-      set = new Set();
-      relayListeners.set(event, set);
-    }
-    set.add(fn);
-    return () => {
-      set!.delete(fn);
-    };
-  }),
-  listAgents: vi.fn().mockResolvedValue([]),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-};
-
-let relayEventCounter = 0;
-
-function emitRelayChannelMessage(message: { from: string; to: string; text: string }) {
-  setTimeout(() => {
-    emitRelayEvent('messageReceived', {
-      eventId: `evt-${++relayEventCounter}`,
-      from: message.from,
-      to: message.to,
-      text: message.text,
-      threadId: undefined,
-    });
-  }, 0);
-}
-
-vi.mock('../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-// Import after mocking
-const { WorkflowRunner } = await import('../workflows/runner.js');
-
-// ── Test fixtures ────────────────────────────────────────────────────────────
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((s) => s.runId === runId);
-    }),
-  };
-}
-
-function makeConfig(overrides: Partial<RelayYamlConfig> = {}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'completion-pipeline-test',
-    swarm: { pattern: 'dag' },
-    agents: [
-      { name: 'agent-a', cli: 'claude' },
-      { name: 'agent-b', cli: 'claude' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-1', agent: 'agent-a', task: 'Do step 1' },
-          { name: 'step-2', agent: 'agent-b', task: 'Do step 2', dependsOn: ['step-1'] },
-        ],
-      },
-    ],
-    trajectories: false,
-    ...overrides,
-  };
-}
-
-type WorkflowStepOverride = Partial<NonNullable<RelayYamlConfig['workflows']>[number]['steps'][number]>;
-
-function makeSupervisedConfig(stepOverrides: WorkflowStepOverride = {}): RelayYamlConfig {
-  return makeConfig({
-    swarm: { pattern: 'hub-spoke' },
-    agents: [
-      { name: 'specialist', cli: 'claude', role: 'engineer' },
-      { name: 'team-lead', cli: 'claude', role: 'lead coordinator' },
-      { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'step-1',
-            agent: 'specialist',
-            task: 'Implement the requested change',
-            ...stepOverrides,
-          },
-        ],
-      },
-    ],
-  });
-}
-
-function makeTwoStepSupervisedConfig(): RelayYamlConfig {
-  return makeConfig({
-    swarm: { pattern: 'hub-spoke' },
-    agents: [
-      { name: 'specialist-a', cli: 'claude', role: 'engineer' },
-      { name: 'specialist-b', cli: 'claude', role: 'engineer' },
-      { name: 'team-lead', cli: 'claude', role: 'lead coordinator' },
-      { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-1', agent: 'specialist-a', task: 'Do step 1' },
-          { name: 'step-2', agent: 'specialist-b', task: 'Do step 2', dependsOn: ['step-1'] },
-        ],
-      },
-    ],
-  });
-}
-
-function makeChannelSupervisedConfig(
-  channel: string,
-  stepOverrides: WorkflowStepOverride = {}
-): RelayYamlConfig {
-  const config = makeSupervisedConfig(stepOverrides);
-  config.swarm = { ...config.swarm, channel };
-  return config;
-}
-
-async function getStepRow(
-  db: WorkflowDb,
-  runId: string,
-  stepName: string
-): Promise<WorkflowStepRow | undefined> {
-  const steps = await db.getStepsByRunId(runId);
-  return steps.find((step) => step.stepName === stepName);
-}
-
-// ── Tests ────────────────────────────────────────────────────────────────────
-
-describe('Completion Pipeline', () => {
-  let db: WorkflowDb;
-  let runner: InstanceType<typeof WorkflowRunner>;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    relayEventCounter = 0;
-    waitForExitFn = vi.fn().mockResolvedValue('exited');
-    waitForIdleFn = vi.fn().mockImplementation(() => never());
-    mockSpawnOutputs = [];
-    mockAgent.release.mockResolvedValue(undefined);
-    mockRelayInstance.spawnPty.mockImplementation(defaultSpawnPtyImplementation);
-    relayListeners.clear();
-    db = makeDb();
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test' });
-  });
-
-  // ── Unit Test 1: Verification passes without marker ───────────────────
-
-  describe('evidence-based completion without marker', () => {
-    it('should complete step when verification passes but STEP_COMPLETE marker is missing', async () => {
-      // Worker output contains the verification target but no STEP_COMPLETE marker
-      mockSpawnOutputs = [
-        'worker output with expected content\n',
-        'Owner observed the work is done\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: verified\n',
-      ];
-
-      const config = makeSupervisedConfig({
-        verification: { type: 'output_contains', value: 'expected content' },
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-
-    it('should complete self-owned step when verification passes without marker', async () => {
-      // Agent output has verified content but no STEP_COMPLETE marker
-      // With the completion pipeline, verification passing should be sufficient
-      mockSpawnOutputs = [
-        'All tests passed\nBuild successful\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: tests pass\n',
-      ];
-
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-1',
-                agent: 'agent-a',
-                task: 'Run tests',
-                verification: { type: 'output_contains', value: 'All tests passed' },
-              },
-            ],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-  });
-
-  // ── Unit Test 2: Owner approves despite malformed worker marker ────────
-
-  describe('owner decision overrides malformed markers', () => {
-    it('should complete step when owner approves despite malformed worker marker', async () => {
-      // Worker outputs a malformed marker, but owner's STEP_COMPLETE is correct
-      mockSpawnOutputs = [
-        'STEP_COMPLET:step-1\n', // typo in worker marker
-        'Checked worker output, work is done\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: owner confirmed\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-
-    it('should complete when owner provides OWNER_DECISION: COMPLETE', async () => {
-      // Owner uses the structured decision format
-      mockSpawnOutputs = [
-        'worker finished work\n',
-        'OWNER_DECISION: COMPLETE\nREASON: verified artifacts\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: owner confirmed\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-  });
-
-  // ── Unit Test 3: Owner requests retry via OWNER_DECISION ──────────────
-
-  describe('owner decision retry', () => {
-    it('should fail with a clear error when owner requests INCOMPLETE_RETRY and retries are disabled', async () => {
-      mockSpawnOutputs = [
-        'worker first attempt\n',
-        'OWNER_DECISION: INCOMPLETE_RETRY\nREASON: missing error handling\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig({ retries: 0 }), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('no retries are configured (maxRetries=0)');
-      expect(run.error).toContain('OWNER_DECISION: INCOMPLETE_RETRY');
-
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps).toHaveLength(1);
-      expect(steps[0]?.status).toBe('failed');
-      expect(steps[0]?.completionReason).toBe('retry_requested_by_owner');
-      expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(2);
-    }, 15000);
-
-    it('should retry and complete when owner requests INCOMPLETE_RETRY and retries remain', async () => {
-      const retryEvents: Array<{ type: string; stepName: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:retrying') {
-          retryEvents.push({ type: event.type, stepName: event.stepName });
-        }
-      });
-
-      // First attempt: owner requests retry
-      // Second attempt: owner approves
-      mockSpawnOutputs = [
-        'worker first attempt\n',
-        'OWNER_DECISION: INCOMPLETE_RETRY\nREASON: missing error handling\n',
-        'worker second attempt with error handling\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: retry succeeded\n',
-      ];
-
-      const config = makeSupervisedConfig({ retries: 1 });
-      const run = await runner.execute(config, 'default');
-
-      expect(run.status).toBe('completed');
-      expect(retryEvents).toEqual([{ type: 'step:retrying', stepName: 'step-1' }]);
-
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps).toHaveLength(1);
-      expect(steps[0]?.status).toBe('completed');
-      expect(steps[0]?.retryCount).toBe(1);
-      expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(5);
-    }, 15000);
-
-    it('should fail after retries are exhausted when owner keeps requesting INCOMPLETE_RETRY', async () => {
-      mockSpawnOutputs = [
-        'worker first attempt\n',
-        'OWNER_DECISION: INCOMPLETE_RETRY\nREASON: missing tests\n',
-        'worker second attempt\n',
-        'OWNER_DECISION: INCOMPLETE_RETRY\nREASON: still missing tests\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig({ retries: 1 }), 'default');
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('retry budget is exhausted (maxRetries=1)');
-      expect(run.error).toContain('after 2 total attempts');
-
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps).toHaveLength(1);
-      expect(steps[0]?.status).toBe('failed');
-      expect(steps[0]?.completionReason).toBe('retry_requested_by_owner');
-      expect(steps[0]?.retryCount).toBe(1);
-      expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(4);
-    }, 15000);
-
-    it('should honor INCOMPLETE_RETRY from a non-interactive reviewer step', async () => {
-      const localDb = makeDb();
-      runner = new WorkflowRunner({ db: localDb, workspaceId: 'ws-test' });
-      mockSpawnOutputs = ['OWNER_DECISION: INCOMPLETE_RETRY\nREASON: explicit retry requested\n'];
-
-      const run = await runner.execute(
-        makeConfig({
-          agents: [{ name: 'reviewer', cli: 'claude', preset: 'reviewer' }],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'review-step',
-                  agent: 'reviewer',
-                  task: 'Review the artifact and decide whether to retry.',
-                  verification: { type: 'output_contains', value: 'OWNER_DECISION: INCOMPLETE_RETRY' },
-                },
-              ],
-            },
-          ],
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('owner requested another attempt');
-
-      const steps = await localDb.getStepsByRunId(run.id);
-      expect(steps).toHaveLength(1);
-      expect(steps[0]?.status).toBe('failed');
-      expect(steps[0]?.completionReason).toBe('retry_requested_by_owner');
-    }, 15000);
-
-    it('should not complete a self-owned step when INCOMPLETE_RETRY conflicts with success signals', async () => {
-      mockSpawnOutputs = [
-        [
-          'OWNER_DECISION: INCOMPLETE_RETRY',
-          'REASON: owner wants another verification pass',
-          'STEP_COMPLETE:step-1',
-          'expected content',
-          'verified locally',
-        ].join('\n'),
-      ];
-
-      const run = await runner.execute(
-        makeConfig({
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'step-1',
-                  agent: 'agent-a',
-                  task: 'Run tests',
-                  retries: 0,
-                  verification: { type: 'output_contains', value: 'expected content' },
-                },
-              ],
-            },
-          ],
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('no retries are configured (maxRetries=0)');
-
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps).toHaveLength(1);
-      expect(steps[0]?.status).toBe('failed');
-      expect(steps[0]?.completionReason).toBe('retry_requested_by_owner');
-      expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(1);
-    }, 15000);
-
-    it('should not let passing verification override INCOMPLETE_RETRY', async () => {
-      mockSpawnOutputs = [
-        'worker output with expected content\n',
-        [
-          'OWNER_DECISION: INCOMPLETE_RETRY',
-          'REASON: missing WORKER_DONE marker',
-          'verified artifacts after inspecting output',
-          'worker finished implementation',
-        ].join('\n'),
-      ];
-
-      const run = await runner.execute(
-        makeSupervisedConfig({
-          verification: { type: 'output_contains', value: 'expected content' },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(2);
-    }, 15000);
-
-    it('should not let passing verification override NEEDS_CLARIFICATION', async () => {
-      mockSpawnOutputs = [
-        'worker output with expected content\n',
-        [
-          'OWNER_DECISION: NEEDS_CLARIFICATION',
-          'REASON: owner needs proof of the channel handoff',
-          'verified artifacts after inspecting output',
-        ].join('\n'),
-      ];
-
-      const run = await runner.execute(
-        makeSupervisedConfig({
-          verification: { type: 'output_contains', value: 'expected content' },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(2);
-    }, 15000);
-  });
-
-  // ── Unit Test 4: Owner rejects AND verification fails ─────────────────
-
-  describe('double failure: owner reject + verification fail', () => {
-    it('should fail step when owner rejects AND verification also fails', async () => {
-      mockSpawnOutputs = [
-        'worker output without expected content\n',
-        'OWNER_DECISION: INCOMPLETE_FAIL\nREASON: work is wrong\n',
-      ];
-
-      const config = makeSupervisedConfig({
-        verification: { type: 'output_contains', value: 'expected output' },
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('failed');
-    }, 15000);
-
-    it('should fail when owner rejects even if verification passes', async () => {
-      mockSpawnOutputs = [
-        'worker output with expected content\n',
-        [
-          'OWNER_DECISION: INCOMPLETE_FAIL',
-          'REASON: work is incomplete without WORKER_DONE proof',
-          'artifacts verified locally',
-          'worker finished implementation',
-        ].join('\n'),
-      ];
-
-      const run = await runner.execute(
-        makeSupervisedConfig({
-          verification: { type: 'output_contains', value: 'expected content' },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(2);
-    }, 15000);
-
-    it('should mark the run failed even with errorHandling.strategy=continue when a step fails', async () => {
-      // Regression: previously `allCompleted` counted failed steps as success
-      // whenever continueOnError was true, so the summary table would render
-      // "FAILED 1 passed, 1 failed" while run.status landed on 'completed'.
-      // Any wrapper that keys off run.status (e.g. the cloud orchestrator's
-      // bootstrap) would then propagate a false success.
-      mockSpawnOutputs = [
-        'worker output\n',
-        'OWNER_DECISION: INCOMPLETE_FAIL\nREASON: relaycast unavailable\n',
-      ];
-
-      const config: RelayYamlConfig = {
-        ...makeSupervisedConfig({}),
-        errorHandling: { strategy: 'continue' },
-      };
-
-      const run = await runner.execute(config, 'default');
-
-      expect(run.status).toBe('failed');
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps[0]?.status).toBe('failed');
-      expect(steps[0]?.completionReason).toBe('failed_owner_decision');
-    }, 15000);
-
-    it('should still complete by owner decision when COMPLETE and verification both pass', async () => {
-      mockSpawnOutputs = [
-        'worker output with expected content\n',
-        'OWNER_DECISION: COMPLETE\nREASON: verified artifacts\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: owner confirmed\n',
-      ];
-
-      const run = await runner.execute(
-        makeSupervisedConfig({
-          verification: { type: 'output_contains', value: 'expected content' },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('completed');
-      const [step] = await db.getStepsByRunId(run.id);
-      expect(step?.completionReason).toBe('completed_by_owner_decision');
-    }, 15000);
-
-    it('should fail verification before accepting OWNER_DECISION COMPLETE', async () => {
-      mockSpawnOutputs = [
-        'worker output without the required token\n',
-        'OWNER_DECISION: COMPLETE\nREASON: verified artifacts\n',
-      ];
-
-      const run = await runner.execute(
-        makeSupervisedConfig({
-          verification: { type: 'output_contains', value: 'expected content' },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(2);
-    }, 15000);
-
-    it('should still complete as verified when no owner decision is provided and verification passes', async () => {
-      mockSpawnOutputs = [
-        'worker output with expected content\n',
-        'Owner checked the output and left no structured decision.\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: verification passed\n',
-      ];
-
-      const run = await runner.execute(
-        makeSupervisedConfig({
-          verification: { type: 'output_contains', value: 'expected content' },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('completed');
-      const [step] = await db.getStepsByRunId(run.id);
-      expect(step?.completionReason).toBe('completed_verified');
-    }, 15000);
-  });
-
-  // ── Unit Test 5: Tolerant review parser ────────────────────────────────
-
-  describe('tolerant review parsing', () => {
-    it('should accept standard REVIEW_DECISION: APPROVE format', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: all good\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'approved' });
-    }, 15000);
-
-    it('should accept standard REVIEW_DECISION: REJECT format', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: REJECT\nREVIEW_REASON: needs work\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review rejected');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    }, 15000);
-
-    // These tests validate the tolerant parser once it's implemented.
-    // The tolerant parser should accept semantic equivalents.
-
-    it('should still fail on review output with no usable approval or rejection signal', async () => {
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'I need more context before deciding.\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review response malformed');
-    }, 15000);
-  });
-
-  // ── Unit Test 6: Channel evidence ─────────────────────────────────────
-
-  describe('channel evidence for completion', () => {
-    it('should capture WORKER_DONE signals from channel messages', async () => {
-      // Worker posts done signal, owner observes and confirms
-      mockSpawnOutputs = [
-        'WORKER_DONE: all tasks completed\n',
-        'Worker reported done on channel, verified artifacts\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: channel evidence confirms\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      // Verify the channel received the worker done signal
-      const channelMessages = (mockRelaycastAgent.send as any).mock.calls.map(
-        ([, text]: [string, string]) => text
-      );
-      expect(channelMessages.some((text: string) => text.includes('WORKER_DONE'))).toBe(true);
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      const workerDoneSignals =
-        evidence?.coordinationSignals.filter(
-          (signal) => signal.kind === 'worker_done' && signal.source === 'channel'
-        ) ?? [];
-      expect(workerDoneSignals.some((signal) => signal.sender === 'specialist')).toBe(true);
-    }, 15000);
-
-    it('should forward worker channel evidence to the owner prompt', async () => {
-      mockSpawnOutputs = [
-        'implementation complete\nWORKER_DONE: finished feature\n',
-        'Observed WORKER_DONE on channel\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-
-    it('should not count lead-authored WORKER_DONE channel posts as worker completion evidence', async () => {
-      waitForExitFn = vi.fn().mockImplementation(async () => {
-        await new Promise((resolve) => setTimeout(resolve, 5));
-        return 'exited';
-      });
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const agent = await defaultSpawnPtyImplementation({ name, task });
-          if (task?.includes('You are the step owner/supervisor for step "step-1".')) {
-            emitRelayChannelMessage({
-              from: agent.name,
-              to: 'completion-provenance',
-              text: 'WORKER_DONE: lead summarized the handoff',
-            });
-          }
-          return agent;
-        }
-      );
-      mockSpawnOutputs = [
-        'worker progress update only\n',
-        'Owner observed the channel but left no decision.\n',
-      ];
-
-      const config = makeSupervisedConfig();
-      config.swarm = { ...config.swarm, channel: 'completion-provenance' };
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('owner completion decision missing');
-      await new Promise((resolve) => setTimeout(resolve, 0));
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      const spoofedPosts =
-        evidence?.channelPosts.filter(
-          (post) => post.sender === 'team-lead' && post.text.includes('WORKER_DONE')
-        ) ?? [];
-      expect(spoofedPosts.length).toBeGreaterThan(0);
-      expect(
-        evidence?.coordinationSignals.filter((signal) => signal.kind === 'worker_done') ?? []
-      ).toHaveLength(0);
-      const spoofedPost = evidence?.channelPosts.find(
-        (post) => post.sender === 'team-lead' && post.text.includes('WORKER_DONE')
-      );
-      expect(spoofedPost?.signals.some((signal) => signal.kind === 'worker_done') ?? false).toBe(false);
-    }, 15000);
-
-    it('should filter wrong-agent coordination signals from the evidence view', async () => {
-      mockSpawnOutputs = [
-        'LEAD_DONE: worker cannot declare lead completion\nWORKER_DONE: all tasks completed\n',
-        'Owner confirmed\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: verified\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      expect(evidence?.coordinationSignals.filter((signal) => signal.kind === 'lead_done')).toHaveLength(0);
-      expect(
-        evidence?.coordinationSignals.some(
-          (signal) => signal.kind === 'worker_done' && signal.sender === 'specialist'
-        )
-      ).toBe(true);
-    }, 15000);
-  });
-
-  describe('happy-path lead-worker workflow proof', () => {
-    it('should complete by evidence when the worker posts WORKER_DONE on the channel', async () => {
-      const channel = 'happy-path-worker-done';
-      waitForExitFn = vi.fn().mockImplementation(async () => {
-        await new Promise((resolve) => setTimeout(resolve, 5));
-        return 'exited';
-      });
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const agent = await defaultSpawnPtyImplementation({ name, task });
-          if (name.includes('step-1-worker')) {
-            emitRelayChannelMessage({
-              from: agent.name,
-              to: channel,
-              text: 'WORKER_DONE: implementation shipped',
-            });
-          }
-          return agent;
-        }
-      );
-      mockSpawnOutputs = [
-        'artifact bundle ready\n',
-        'Lead verified the worker handoff is complete and safe.\n',
-      ];
-
-      const run = await runner.execute(makeChannelSupervisedConfig(channel), 'default');
-
-      expect(run.status).toBe('completed');
-      const step = await getStepRow(db, run.id, 'step-1');
-      expect(step?.completionReason).toBe('completed_by_evidence');
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      expect(
-        evidence?.coordinationSignals.some(
-          (signal) =>
-            signal.kind === 'worker_done' && signal.source === 'channel' && signal.sender === 'specialist'
-        )
-      ).toBe(true);
-      expect(evidence?.coordinationSignals.some((signal) => signal.kind === 'step_complete')).toBe(false);
-    }, 15000);
-
-    it('should capture WORKER_DONE plus LEAD_DONE and complete cleanly', async () => {
-      const channel = 'happy-path-lead-worker-done';
-      waitForExitFn = vi.fn().mockImplementation(async () => {
-        await new Promise((resolve) => setTimeout(resolve, 5));
-        return 'exited';
-      });
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const agent = await defaultSpawnPtyImplementation({ name, task });
-          if (name.includes('step-1-worker')) {
-            emitRelayChannelMessage({
-              from: agent.name,
-              to: channel,
-              text: 'WORKER_DONE: handoff package posted',
-            });
-          }
-          if (name.includes('step-1-owner')) {
-            emitRelayChannelMessage({
-              from: agent.name,
-              to: channel,
-              text: 'LEAD_DONE: lead confirmed the worker handoff',
-            });
-          }
-          return agent;
-        }
-      );
-      mockSpawnOutputs = [
-        'artifact bundle ready\n',
-        'Lead confirmed the handoff is complete and safe for review.\n',
-      ];
-
-      const run = await runner.execute(makeChannelSupervisedConfig(channel), 'default');
-
-      expect(run.status).toBe('completed');
-      const step = await getStepRow(db, run.id, 'step-1');
-      expect(step?.completionReason).toBe('completed_by_evidence');
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      expect(
-        evidence?.coordinationSignals.some(
-          (signal) =>
-            signal.kind === 'worker_done' && signal.source === 'channel' && signal.sender === 'specialist'
-        )
-      ).toBe(true);
-      expect(
-        evidence?.coordinationSignals.some(
-          (signal) =>
-            signal.kind === 'lead_done' && signal.source === 'channel' && signal.sender === 'team-lead'
-        )
-      ).toBe(true);
-    }, 15000);
-
-    it('should complete as verified when lead-worker verification passes without coordination markers', async () => {
-      mockSpawnOutputs = [
-        'worker output with expected content\n',
-        'Lead checked the implementation and found it correct.\n',
-      ];
-
-      const run = await runner.execute(
-        makeSupervisedConfig({ verification: { type: 'output_contains', value: 'expected content' } }),
-        'default'
-      );
-
-      expect(run.status).toBe('completed');
-      const step = await getStepRow(db, run.id, 'step-1');
-      expect(step?.completionReason).toBe('completed_verified');
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      expect(evidence?.coordinationSignals.some((signal) => signal.kind === 'worker_done')).toBe(false);
-      expect(evidence?.coordinationSignals.some((signal) => signal.kind === 'lead_done')).toBe(false);
-    }, 15000);
-
-    it('should complete multiple supervised workers in sequence for a map-reduce style flow', async () => {
-      const channel = 'happy-path-map-reduce';
-      waitForExitFn = vi.fn().mockImplementation(async () => {
-        await new Promise((resolve) => setTimeout(resolve, 5));
-        return 'exited';
-      });
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-          const output = isReview
-            ? 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: map-reduce happy path verified\n'
-            : name.includes('map-1-worker')
-              ? 'map artifact A ready\n'
-              : name.includes('map-1-owner')
-                ? 'Lead verified shard A is complete and safe.\n'
-                : name.includes('map-2-worker')
-                  ? 'map artifact B ready\n'
-                  : name.includes('map-2-owner')
-                    ? 'Lead verified shard B is complete and safe.\n'
-                    : name.includes('reduce-worker')
-                      ? 'reduce artifact ready\n'
-                      : name.includes('reduce-owner')
-                        ? 'Lead verified the reduction is complete and safe.\n'
-                        : 'STEP_COMPLETE:unknown\n';
-
-          queueMicrotask(() => {
-            emitRelayEvent('workerOutput', { name, chunk: output });
-          });
-
-          const agent = { ...mockAgent, name };
-          if (name.includes('map-1-worker')) {
-            emitRelayChannelMessage({
-              from: agent.name,
-              to: channel,
-              text: 'WORKER_DONE: map shard A complete',
-            });
-          }
-          if (name.includes('map-2-worker')) {
-            emitRelayChannelMessage({
-              from: agent.name,
-              to: channel,
-              text: 'WORKER_DONE: map shard B complete',
-            });
-          }
-          if (name.includes('reduce-worker')) {
-            emitRelayChannelMessage({
-              from: agent.name,
-              to: channel,
-              text: 'WORKER_DONE: reduce pass complete',
-            });
-          }
-          return agent;
-        }
-      );
-
-      const config = makeConfig({
-        swarm: { pattern: 'map-reduce', channel },
-        agents: [
-          { name: 'mapper-1', cli: 'claude', role: 'engineer' },
-          { name: 'mapper-2', cli: 'claude', role: 'engineer' },
-          { name: 'reducer', cli: 'claude', role: 'engineer' },
-          { name: 'team-lead', cli: 'claude', role: 'lead coordinator' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'map-1', agent: 'mapper-1', task: 'Process shard A' },
-              { name: 'map-2', agent: 'mapper-2', task: 'Process shard B' },
-              {
-                name: 'reduce',
-                agent: 'reducer',
-                task: 'Combine mapped results',
-                dependsOn: ['map-1', 'map-2'],
-              },
-            ],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-
-      expect(run.status).toBe('completed');
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps.map((step) => step.stepName)).toEqual(['map-1', 'map-2', 'reduce']);
-      expect(steps.map((step) => step.status)).toEqual(['completed', 'completed', 'completed']);
-      expect(steps.map((step) => step.completionReason)).toEqual([
-        'completed_by_evidence',
-        'completed_by_evidence',
-        'completed_by_evidence',
-      ]);
-      expect(
-        runner
-          .getStepCompletionEvidence('reduce')
-          ?.coordinationSignals.some(
-            (signal) =>
-              signal.kind === 'worker_done' && signal.source === 'channel' && signal.sender === 'reducer'
-          )
-      ).toBe(true);
-    }, 15000);
-
-    it('should still complete when WORKER_DONE lands after the lead checks the work', async () => {
-      const channel = 'happy-path-delayed-worker-done';
-      const observedOrder: string[] = [];
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const agent = await defaultSpawnPtyImplementation({ name, task });
-
-          if (name.includes('step-1-worker')) {
-            setTimeout(() => {
-              observedOrder.push('worker-done-message');
-              emitRelayChannelMessage({
-                from: agent.name,
-                to: channel,
-                text: 'WORKER_DONE: delayed handoff posted',
-              });
-            }, 10);
-            return {
-              ...agent,
-              waitForExit: vi.fn().mockImplementation(async () => {
-                await new Promise((resolve) => setTimeout(resolve, 15));
-                return 'exited' as const;
-              }),
-            };
-          }
-
-          if (name.includes('step-1-owner')) {
-            return {
-              ...agent,
-              waitForExit: vi.fn().mockImplementation(async () => {
-                observedOrder.push('owner-finished-check');
-                return 'exited' as const;
-              }),
-            };
-          }
-
-          return agent;
-        }
-      );
-      mockSpawnOutputs = [
-        'artifact bundle ready but handoff signal is delayed\n',
-        'Lead checked the artifacts early and the work still looks complete and safe.\n',
-      ];
-
-      const run = await runner.execute(makeChannelSupervisedConfig(channel), 'default');
-
-      expect(run.status).toBe('completed');
-      expect(observedOrder).toEqual(['owner-finished-check', 'worker-done-message']);
-
-      const step = await getStepRow(db, run.id, 'step-1');
-      expect(step?.completionReason).toBe('completed_by_evidence');
-      expect(
-        runner
-          .getStepCompletionEvidence('step-1')
-          ?.coordinationSignals.some(
-            (signal) =>
-              signal.kind === 'worker_done' &&
-              signal.source === 'channel' &&
-              signal.value === 'delayed handoff posted'
-          )
-      ).toBe(true);
-    }, 15000);
-  });
-
-  // ── Integration Test 1: Codex lead/worker without marker ──────────────
-
-  describe('Codex lead/worker completion', () => {
-    it('should complete when codex lead omits STEP_COMPLETE but owner logic still completes', async () => {
-      // Codex agents use `codex exec` and may not emit the exact marker.
-      // With a verification gate, the step should still complete.
-      mockSpawnOutputs = [
-        'worker: implemented the feature\n',
-        'Lead verified: all changes look correct\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: verified\n',
-      ];
-
-      const config = makeSupervisedConfig();
-      // Override to codex CLI
-      config.agents = [
-        { name: 'specialist', cli: 'codex', role: 'engineer' },
-        { name: 'team-lead', cli: 'codex', role: 'lead coordinator' },
-        { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-      ];
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(
-        mockRelayInstance.spawnPty.mock.calls.some(
-          ([input]) =>
-            input.cli === 'codex' &&
-            Array.isArray(input.args) &&
-            input.args.includes('--dangerously-bypass-approvals-and-sandbox')
-        )
-      ).toBe(true);
-    }, 15000);
-  });
-
-  // ── Integration Test 2: Gemini lead/worker with channel completion ────
-
-  describe('Gemini lead/worker with channel completion', () => {
-    it('should complete when gemini worker posts channel completion and owner finalizes', async () => {
-      mockSpawnOutputs = [
-        'Worker output: feature implemented\nWORKER_DONE: task complete\n',
-        'Observed worker completion on channel\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: channel evidence\n',
-      ];
-
-      const config = makeSupervisedConfig();
-      config.agents = [
-        { name: 'specialist', cli: 'gemini', role: 'engineer' },
-        { name: 'team-lead', cli: 'gemini', role: 'lead coordinator' },
-        { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-      ];
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-  });
-
-  // ── Integration Test 3: Supervisor without exact review sentinel ───────
-
-  describe('Supervisor workflow completion', () => {
-    it('should complete supervised step with standard review flow', async () => {
-      mockSpawnOutputs = [
-        'worker built the feature\n',
-        'Verified: code passes tests\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: correct implementation\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-  });
-
-  // ── Integration Test 4: Map-reduce workflow remains unaffected ─────────
-
-  describe('Map-reduce workflow backward compatibility', () => {
-    it('should complete map-reduce workflow with standard markers', async () => {
-      const config = makeConfig({
-        swarm: { pattern: 'map-reduce' },
-        agents: [
-          { name: 'mapper-1', cli: 'claude' },
-          { name: 'mapper-2', cli: 'claude' },
-          { name: 'reducer', cli: 'claude' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'map-1', agent: 'mapper-1', task: 'Process chunk A' },
-              { name: 'map-2', agent: 'mapper-2', task: 'Process chunk B' },
-              { name: 'reduce', agent: 'reducer', task: 'Combine results', dependsOn: ['map-1', 'map-2'] },
-            ],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-  });
-
-  // ── Integration Test 5: Legacy marker-based workflows ─────────────────
-
-  describe('Legacy marker-based workflows', () => {
-    it('should still complete with explicit STEP_COMPLETE marker (backward compat)', async () => {
-      // The classic marker-based flow should continue to work unchanged
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-
-    it('should still fail when marker, owner decision, and evidence are all missing', async () => {
-      mockSpawnOutputs = ['Did the work but no marker\n'];
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('owner completion decision missing');
-    }, 15000);
-
-    it('should still support explicit REVIEW_DECISION: APPROVE flow', async () => {
-      mockSpawnOutputs = [
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: standard approval\n',
-      ];
-
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: legacy approval\n',
-        'worker finished step 2\n',
-        'STEP_COMPLETE:step-2\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: legacy approval step 2\n',
-      ];
-
-      const run = await runner.execute(makeTwoStepSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'approved' });
-    }, 15000);
-
-    it('should still support explicit REVIEW_DECISION: REJECT flow', async () => {
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: REJECT\nREVIEW_REASON: standard rejection\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review rejected');
-    }, 15000);
-
-    it('should still fail closed on malformed review output', async () => {
-      mockSpawnOutputs = ['worker finished\n', 'STEP_COMPLETE:step-1\n', 'I think this looks ok\n'];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review response malformed');
-    }, 15000);
-
-    it('should preserve owner/specialist separation in supervised workflows', async () => {
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'Owner verified\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: good\n',
-      ];
-
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments).toHaveLength(1);
-      expect(ownerAssignments[0].owner).toBe('team-lead');
-      expect(ownerAssignments[0].specialist).toBe('specialist');
-    }, 15000);
-  });
-
-  // ── Backward compat: event emission ───────────────────────────────────
-
-  describe('backward compatibility: event emission', () => {
-    it('should emit run:started and run:completed events', async () => {
-      const events: string[] = [];
-      runner.on((event) => events.push(event.type));
-
-      await runner.execute(makeConfig(), 'default');
-
-      expect(events).toContain('run:started');
-      expect(events).toContain('run:completed');
-    }, 15000);
-
-    it('should emit step:started and step:completed events in order', async () => {
-      const stepEvents: Array<{ type: string; stepName?: string }> = [];
-      runner.on((event) => {
-        if (event.type.startsWith('step:')) {
-          stepEvents.push({
-            type: event.type,
-            stepName: 'stepName' in event ? event.stepName : undefined,
-          });
-        }
-      });
-
-      await runner.execute(makeConfig(), 'default');
-
-      const startedSteps = stepEvents.filter((e) => e.type === 'step:started');
-      const completedSteps = stepEvents.filter((e) => e.type === 'step:completed');
-      expect(startedSteps).toHaveLength(2);
-      expect(completedSteps).toHaveLength(2);
-    }, 15000);
-
-    it('should emit owner-assigned events for all steps', async () => {
-      const ownerEvents: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerEvents.push(event.stepName);
-        }
-      });
-
-      await runner.execute(makeConfig(), 'default');
-      expect(ownerEvents).toHaveLength(2);
-    }, 15000);
-
-    it('should emit review-completed events for all interactive steps', async () => {
-      const reviewEvents: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          reviewEvents.push(event.stepName);
-        }
-      });
-
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n',
-        'worker finished step 2\n',
-        'STEP_COMPLETE:step-2\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n',
-      ];
-
-      await runner.execute(makeTwoStepSupervisedConfig(), 'default');
-      expect(reviewEvents).toHaveLength(2);
-    }, 15000);
-  });
-
-  // ── Backward compat: DAG execution ordering ───────────────────────────
-
-  describe('backward compatibility: DAG execution', () => {
-    it('should execute steps in dependency order', async () => {
-      const completedSteps: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:completed') {
-          completedSteps.push(event.stepName);
-        }
-      });
-
-      await runner.execute(makeConfig(), 'default');
-
-      const idx1 = completedSteps.indexOf('step-1');
-      const idx2 = completedSteps.indexOf('step-2');
-      expect(idx1).toBeLessThan(idx2);
-    }, 15000);
-
-    it('should run parallel steps concurrently', async () => {
-      const startTimes: Record<string, number> = {};
-      runner.on((event) => {
-        if (event.type === 'step:started') {
-          startTimes[event.stepName] = Date.now();
-        }
-      });
-
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'a', agent: 'agent-a', task: 'Do A' },
-              { name: 'b', agent: 'agent-b', task: 'Do B' },
-              { name: 'c', agent: 'agent-a', task: 'Do C', dependsOn: ['a', 'b'] },
-            ],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-
-      // a and b should start nearly simultaneously (within 100ms)
-      const diff = Math.abs((startTimes['a'] ?? 0) - (startTimes['b'] ?? 0));
-      expect(diff).toBeLessThan(1000);
-    }, 15000);
-  });
-
-  // ── Backward compat: CLI command building ─────────────────────────────
-
-  describe('backward compatibility: CLI command building', () => {
-    it('should build claude command correctly', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('claude', 'Task');
-      expect(cmd).toBe('claude');
-      expect(args).toContain('-p');
-    });
-
-    it('should build codex command correctly', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('codex', 'Task');
-      expect(cmd).toBe('codex');
-      expect(args).toContain('exec');
-    });
-
-    it('should build gemini command correctly', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('gemini', 'Task');
-      expect(cmd).toBe('gemini');
-      expect(args).toContain('-p');
-    });
-  });
-
-  // ── Backward compat: variable resolution ──────────────────────────────
-
-  describe('backward compatibility: variable resolution', () => {
-    it('should resolve {{var}} in step tasks', async () => {
-      const config = makeConfig();
-      config.workflows![0].steps[0].task = 'Build {{feature}}';
-      const run = await runner.execute(config, 'default', { feature: 'auth' });
-      expect(run.status, run.error).toBe('completed');
-    }, 15000);
-
-    it('should throw on unresolved variables', () => {
-      const config = makeConfig({
-        agents: [{ name: 'a', cli: 'claude', task: 'Fix {{unknown}}' }],
-      });
-      expect(() => runner.resolveVariables(config, {})).toThrow('Unresolved variable: {{unknown}}');
-    });
-  });
-
-  // ── Backward compat: review PTY echo handling ─────────────────────────
-
-  describe('backward compatibility: review PTY echo handling', () => {
-    it('should parse last REVIEW_DECISION when PTY echoes prompt', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      const echoedPrompt =
-        'Return exactly:\nREVIEW_DECISION: APPROVE or REJECT\nREVIEW_REASON: <one sentence>\n';
-      const actualResponse = 'REVIEW_DECISION: REJECT\nREVIEW_REASON: code has bugs\n';
-      mockSpawnOutputs = ['worker finished\n', 'STEP_COMPLETE:step-1\n', echoedPrompt + actualResponse];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    }, 15000);
-  });
-
-  // ── Backward compat: timeout handling ─────────────────────────────────
-
-  describe('backward compatibility: timeout handling', () => {
-    it('should emit step:owner-timeout on timeout', async () => {
-      const events: Array<{ type: string; stepName?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-timeout') {
-          events.push({ type: event.type, stepName: event.stepName });
-        }
-      });
-
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-      waitForIdleFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(events).toContainEqual({ type: 'step:owner-timeout', stepName: 'step-1' });
-    }, 15000);
-  });
-
-  // ── Phase 1 compatibility mode ────────────────────────────────────────
-
-  describe('Phase 1 compatibility mode', () => {
-    it('should keep markers as fast-path for completion', async () => {
-      // When the marker is present, it should complete immediately without
-      // needing to evaluate the full evidence pipeline
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-
-    it('should accept both old marker format and new OWNER_DECISION format', async () => {
-      // Old format still works
-      mockSpawnOutputs = ['STEP_COMPLETE:step-1\n'];
-      const run1 = await runner.execute(
-        makeConfig({
-          workflows: [{ name: 'default', steps: [{ name: 'step-1', agent: 'agent-a', task: 'Do it' }] }],
-        }),
-        'default'
-      );
-      expect(run1.status).toBe('completed');
-    }, 15000);
-  });
-
-  // ── Evidence interface tests ──────────────────────────────────────────
-
-  describe('evidence collection interface', () => {
-    it('should expose getStepCompletionEvidence() on runner', () => {
-      expect(typeof runner.getStepCompletionEvidence).toBe('function');
-    });
-
-    it('should return undefined for unknown step names', () => {
-      const evidence = runner.getStepCompletionEvidence('nonexistent-step');
-      expect(evidence).toBeUndefined();
-    });
-
-    it('should return evidence with correct shape after step execution', async () => {
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      if (evidence) {
-        // Verify the evidence structure matches StepCompletionEvidence
-        expect(evidence.stepName).toBe('step-1');
-        expect(evidence).toHaveProperty('channelPosts');
-        expect(evidence).toHaveProperty('files');
-        expect(evidence).toHaveProperty('process');
-        expect(evidence).toHaveProperty('toolSideEffects');
-        expect(evidence).toHaveProperty('coordinationSignals');
-        expect(Array.isArray(evidence.channelPosts)).toBe(true);
-        expect(Array.isArray(evidence.files)).toBe(true);
-        expect(Array.isArray(evidence.toolSideEffects)).toBe(true);
-        expect(Array.isArray(evidence.coordinationSignals)).toBe(true);
-      }
-    }, 15000);
-
-    it('should collect evidence for supervised steps', async () => {
-      mockSpawnOutputs = [
-        'worker completed the implementation\n',
-        'Owner verified work\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: good\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      if (evidence) {
-        expect(evidence.stepName).toBe('step-1');
-        // Supervised steps should have channel posts from worker output forwarding
-        expect(evidence.channelPosts.length).toBeGreaterThanOrEqual(0);
-      }
-    }, 15000);
-
-    it('should capture WORKER_DONE as a coordination signal', async () => {
-      mockSpawnOutputs = [
-        'WORKER_DONE: all tasks completed\n',
-        'Owner confirmed\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: verified\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      const evidence = runner.getStepCompletionEvidence('step-1');
-      if (evidence) {
-        const workerDoneSignals = evidence.coordinationSignals.filter((s) => s.kind === 'worker_done');
-        // If the evidence collector detected the WORKER_DONE signal, it should be present
-        if (workerDoneSignals.length > 0) {
-          expect(workerDoneSignals[0].kind).toBe('worker_done');
-        }
-      }
-    }, 15000);
-
-    it('should return a defensive copy (not a live reference)', async () => {
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      const evidence1 = runner.getStepCompletionEvidence('step-1');
-      const evidence2 = runner.getStepCompletionEvidence('step-1');
-      if (evidence1 && evidence2) {
-        expect(evidence1).not.toBe(evidence2); // structuredClone should return a new object
-        expect(evidence1).toEqual(evidence2); // but with the same content
-      }
-    }, 15000);
-  });
-
-  // ── completionReason field on step rows ───────────────────────────────
-
-  describe('completionReason on step rows', () => {
-    it('should set completionReason on completed steps', async () => {
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      const steps = await db.getStepsByRunId(run.id);
-      const completedSteps = steps.filter((s) => s.status === 'completed');
-      expect(completedSteps.length).toBeGreaterThan(0);
-
-      for (const step of completedSteps) {
-        if (step.completionReason) {
-          // completionReason should be a valid value
-          const validReasons: WorkflowStepCompletionReason[] = [
-            'completed_verified',
-            'completed_by_owner_decision',
-            'completed_by_evidence',
-            'completed_by_process_exit',
-            'retry_requested_by_owner',
-            'failed_verification',
-            'failed_owner_decision',
-            'failed_no_evidence',
-          ];
-          expect(validReasons).toContain(step.completionReason);
-        }
-      }
-    }, 15000);
-  });
-
-  describe('process-exit fallback (compliance reduction)', () => {
-    it('should complete step via process exit code 0 when no coordination signal is posted', async () => {
-      // Agent exits cleanly (code 0) but doesn't post STEP_COMPLETE or OWNER_DECISION.
-      // With verification configured (exit_code), the runner should infer completion.
-      const config = makeConfig({
-        swarm: { pattern: 'dag', completionGracePeriodMs: 5000 },
-        agents: [{ name: 'agent-a', cli: 'claude' }],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'silent-worker',
-                agent: 'agent-a',
-                task: 'Do some work silently',
-                verification: { type: 'exit_code', value: '0' },
-              },
-            ],
-          },
-        ],
-      });
-
-      // Output has no STEP_COMPLETE, no OWNER_DECISION — just normal work output
-      mockSpawnOutputs = ['Implemented the auth module. All tests pass.'];
-
-      const localDb = makeDb();
-      runner = new WorkflowRunner({ db: localDb, workspaceId: 'ws-test' });
-      const events: any[] = [];
-      const run = await runner.execute(config, 'default');
-
-      expect(run.status).toBe('completed');
-      const steps = await localDb.getStepsByRunId(run.id);
-      const step = steps.find((s: any) => s.stepName === 'silent-worker');
-      expect(step?.status).toBe('completed');
-      // Should be completed_by_process_exit or completed_verified (exit_code verification)
-      expect(step?.completionReason).toBeDefined();
-    }, 15000);
-
-    it('should fail when process exits with non-zero code and no signal', async () => {
-      // Agent exits with non-zero and no coordination signal — should fail
-      const config = makeConfig({
-        swarm: { pattern: 'dag', completionGracePeriodMs: 5000 },
-        agents: [{ name: 'agent-a', cli: 'claude' }],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'failing-worker',
-                agent: 'agent-a',
-                task: 'Try something',
-              },
-            ],
-          },
-        ],
-      });
-
-      // No STEP_COMPLETE, no OWNER_DECISION, and we'll simulate a non-clean exit
-      // by having the output lack any positive signals
-      mockSpawnOutputs = ['Error: something went wrong'];
-
-      const localDb = makeDb();
-      runner = new WorkflowRunner({ db: localDb, workspaceId: 'ws-test' });
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('failed');
-    }, 15000);
-
-    it('should respect completionGracePeriodMs: 0 to disable fallback', async () => {
-      // With grace period disabled, missing signals should always fail
-      const config = makeConfig({
-        swarm: { pattern: 'dag', completionGracePeriodMs: 0 },
-        agents: [{ name: 'agent-a', cli: 'claude' }],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'strict-worker',
-                agent: 'agent-a',
-                task: 'Do work with strict compliance required',
-              },
-            ],
-          },
-        ],
-      });
-
-      // Output has no signals at all
-      mockSpawnOutputs = ['Work completed but no signal posted.'];
-
-      const localDb = makeDb();
-      runner = new WorkflowRunner({ db: localDb, workspaceId: 'ws-test' });
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('failed');
-    }, 15000);
-
-    it('should complete via evidence when process exits 0 and owner output has positive conclusion', async () => {
-      // Agent posts no explicit signal but says "done" + exit code 0 is captured as evidence
-      const config = makeConfig({
-        swarm: { pattern: 'dag' },
-        agents: [{ name: 'agent-a', cli: 'claude' }],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'wordy-worker',
-                agent: 'agent-a',
-                task: 'Implement the feature',
-                verification: { type: 'exit_code', value: '0' },
-              },
-            ],
-          },
-        ],
-      });
-
-      // Output contains positive conclusion words but no explicit marker
-      mockSpawnOutputs = ['Feature implemented and verified. All artifacts are correct and complete.'];
-
-      const localDb = makeDb();
-      runner = new WorkflowRunner({ db: localDb, workspaceId: 'ws-test' });
-      const run = await runner.execute(config, 'default');
-
-      expect(run.status).toBe('completed');
-    }, 15000);
-  });
-
-  describe('template re-quoting regression (parseOwnerDecision)', () => {
-    it('should not pick COMPLETE from re-quoted template when agent said INCOMPLETE_RETRY', async () => {
-      // Bug repro: agent says INCOMPLETE_RETRY then re-quotes the template format,
-      // causing the last-match heuristic to pick COMPLETE from the template line.
-      mockSpawnOutputs = [
-        'worker did the task\n',
-        [
-          'STEP OWNER CONTRACT:',
-          '- Preferred final decision format:',
-          '  OWNER_DECISION: COMPLETE|INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION',
-          '  REASON: <one sentence>',
-          '',
-          'OWNER_DECISION: INCOMPLETE_RETRY',
-          'REASON: Tests are still failing',
-          '',
-          'I chose INCOMPLETE_RETRY as per the options OWNER_DECISION: COMPLETE|INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION',
-        ].join('\n'),
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig({ retries: 0 }), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('INCOMPLETE_RETRY');
-
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps[0]?.completionReason).toBe('retry_requested_by_owner');
-    }, 15000);
-
-    it('should correctly parse COMPLETE when it is the real decision, not just template text', async () => {
-      // Ensure the fix doesn't break the happy path — agent says COMPLETE after echoed template
-      mockSpawnOutputs = [
-        'worker did the task\n',
-        [
-          'STEP OWNER CONTRACT:',
-          '- Preferred final decision format:',
-          '  OWNER_DECISION: COMPLETE|INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION',
-          '',
-          'OWNER_DECISION: COMPLETE',
-          'REASON: Worker finished the task successfully',
-        ].join('\n'),
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig({ retries: 0 }), 'default');
-      expect(run.status).toBe('completed');
-
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps[0]?.completionReason).toBe('completed_by_owner_decision');
-    }, 15000);
-  });
-
-  describe('fallback guards against explicit retry signals', () => {
-    it('should not complete via evidence fallback when output contains INCOMPLETE_RETRY', async () => {
-      // Bug repro: parseOwnerDecision returns null (garbled PTY), but raw output
-      // contains INCOMPLETE_RETRY. judgeOwnerCompletionByEvidence should refuse
-      // to infer completion.
-      mockSpawnOutputs = [
-        'worker completed locally\n',
-        [
-          'I reviewed the worker output. The task looks done but tests are failing.',
-          'OW NER_DECISION: INCOMPLETE_RETRY', // garbled by PTY line wrap
-          'REASON: tests failing',
-          'The worker completed the implementation but verification failed.',
-          'OWNER_DECISION: INCOMPLETE_RETRY', // clear signal in raw output
-        ].join('\n'),
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig({ retries: 0 }), 'default');
-      expect(run.status).toBe('failed');
-    }, 15000);
-
-    it('should not complete via process-exit fallback when output contains INCOMPLETE_RETRY', async () => {
-      const config = makeConfig({
-        swarm: { pattern: 'dag', completionGracePeriodMs: 5000 },
-        agents: [{ name: 'agent-a', cli: 'claude' }],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'retried-worker',
-                agent: 'agent-a',
-                task: 'Do work',
-                verification: { type: 'exit_code', value: '0' },
-              },
-            ],
-          },
-        ],
-      });
-
-      // Agent exits code 0 and verification passes, BUT output contains INCOMPLETE_RETRY
-      mockSpawnOutputs = [
-        'Implemented the feature.\nOWNER_DECISION: INCOMPLETE_RETRY\nREASON: needs more tests\n',
-      ];
-
-      const localDb = makeDb();
-      runner = new WorkflowRunner({ db: localDb, workspaceId: 'ws-test' });
-      const run = await runner.execute(config, 'default');
-
-      // Should NOT complete — the explicit retry signal should prevent fallback
-      expect(run.status).toBe('failed');
-    }, 15000);
-  });
-});
diff --git a/packages/sdk/src/__tests__/e2e-owner-review.test.ts b/packages/sdk/src/__tests__/e2e-owner-review.test.ts
deleted file mode 100644
index da47d9c95..000000000
--- a/packages/sdk/src/__tests__/e2e-owner-review.test.ts
+++ /dev/null
@@ -1,758 +0,0 @@
-/**
- * E2E test harness for PR #511: auto step owner + per-step review gating.
- *
- * Validates:
- * 1. Hub-role agent auto-assigned as owner (lead matches)
- * 2. "github-integration" agent NOT matched as hub (word-boundary)
- * 3. Review gating — approval flow
- * 4. Review gating — rejection flow (PTY echo handling)
- * 5. Review timeout budgeting
- * 6. Owner timeout emission
- * 7. Lead + workers team with owner assignment
- * 8. YAML workflow parsing of e2e-owner-review.yaml
- * 9. Owner completion marker validation
- */
-
-import { describe, it, expect, vi, beforeEach } from 'vitest';
-import { readFileSync } from 'node:fs';
-import { resolve } from 'node:path';
-import type { WorkflowDb } from '../workflows/runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../workflows/types.js';
-
-// ── Mock fetch ──────────────────────────────────────────────────────────────
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_live_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-// ── Mock RelayCast SDK ──────────────────────────────────────────────────────
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: { register: vi.fn().mockResolvedValue({ token: 'token-1' }) },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-class MockRelayError extends Error {
-  code: string;
-  constructor(code: string, message: string, status = 400) {
-    super(message);
-    this.code = code;
-    this.name = 'RelayError';
-    (this as any).status = status;
-  }
-}
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: MockRelayError,
-}));
-
-// ── Mock AgentRelay ─────────────────────────────────────────────────────────
-
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-let waitForIdleFn: (ms?: number) => Promise<'idle' | 'timeout' | 'exited'>;
-let mockSpawnOutputs: string[] = [];
-
-const mockAgent = {
-  name: 'test-agent-abc',
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return waitForIdleFn;
-  },
-  release: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-const defaultSpawnPtyImplementation = async ({ name, task }: { name: string; task?: string }) => {
-  const queued = mockSpawnOutputs.shift();
-  const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-  const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-  const output =
-    queued ??
-    (isReview
-      ? 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n'
-      : stepComplete
-        ? `STEP_COMPLETE:${stepComplete}\n`
-        : 'STEP_COMPLETE:unknown\n');
-
-  queueMicrotask(() => emitRelayEvent('workerOutput', { name, chunk: output }));
-
-  return { ...mockAgent, name };
-};
-
-// Listener registry for the AgentRelay mock — the production AgentRelay
-// uses addListener('eventName', handler), so the mock captures handlers
-// here keyed by event name. Tests fire events via `emitRelayEvent`.
-const relayListeners = new Map<string, Set<(...args: unknown[]) => void>>();
-function emitRelayEvent(event: string, payload: unknown): void {
-  for (const handler of relayListeners.get(event) ?? []) {
-    handler(payload);
-  }
-}
-
-const mockRelayInstance = {
-  spawnPty: vi.fn().mockImplementation(defaultSpawnPtyImplementation),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  addListener: vi.fn((event: string, handler: (...args: unknown[]) => void) => {
-    let set = relayListeners.get(event);
-    if (!set) {
-      set = new Set();
-      relayListeners.set(event, set);
-    }
-    set.add(handler);
-    return () => set!.delete(handler);
-  }),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-};
-
-vi.mock('../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-// Import after mocking
-const { WorkflowRunner } = await import('../workflows/runner.js');
-
-// ── Helpers ─────────────────────────────────────────────────────────────────
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((s) => s.runId === runId);
-    }),
-  };
-}
-
-function makeConfig(overrides: Partial<RelayYamlConfig> = {}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'e2e-owner-review-test',
-    swarm: { pattern: 'dag' },
-    agents: [
-      { name: 'agent-a', cli: 'claude' },
-      { name: 'agent-b', cli: 'claude' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-1', agent: 'agent-a', task: 'Do step 1' },
-          { name: 'step-2', agent: 'agent-b', task: 'Do step 2', dependsOn: ['step-1'] },
-        ],
-      },
-    ],
-    trajectories: false,
-    ...overrides,
-  };
-}
-
-function never<T>(): Promise<T> {
-  return new Promise(() => {});
-}
-
-type WorkflowStepOverride = Partial<NonNullable<RelayYamlConfig['workflows']>[number]['steps'][number]>;
-
-function makeSupervisedConfig(stepOverrides: WorkflowStepOverride = {}): RelayYamlConfig {
-  return makeConfig({
-    swarm: { pattern: 'hub-spoke' },
-    agents: [
-      { name: 'specialist', cli: 'claude', role: 'engineer' },
-      { name: 'team-lead', cli: 'claude', role: 'Lead coordinator for the workflow' },
-      { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-1', agent: 'specialist', task: 'Implement the requested change', ...stepOverrides },
-        ],
-      },
-    ],
-  });
-}
-
-// ── E2E Scenarios ───────────────────────────────────────────────────────────
-
-describe('PR #511 E2E: Auto Step Owner + Review Gating', () => {
-  let db: WorkflowDb;
-  let runner: InstanceType<typeof WorkflowRunner>;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    waitForExitFn = vi.fn().mockResolvedValue('exited');
-    waitForIdleFn = vi.fn().mockImplementation(() => never());
-    mockSpawnOutputs = [];
-    mockAgent.release.mockResolvedValue(undefined);
-    mockRelayInstance.spawnPty.mockImplementation(defaultSpawnPtyImplementation);
-    relayListeners.clear();
-    db = makeDb();
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test' });
-  });
-
-  // ── Scenario 1: Hub-role agent auto-assigned as owner ───────────────────
-
-  describe('Scenario 1: Hub-role auto-ownership', () => {
-    it('should auto-assign lead agent as owner for specialist steps', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke' },
-        agents: [
-          { name: 'impl-worker', cli: 'claude', role: 'implementer' },
-          { name: 'team-lead', cli: 'claude', role: 'Lead coordinator for the workflow' },
-          { name: 'quality-reviewer', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'hub-owner-test', agent: 'impl-worker', task: 'List 3 benefits' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments).toHaveLength(1);
-      expect(ownerAssignments[0].owner).toBe('team-lead');
-      expect(ownerAssignments[0].specialist).toBe('impl-worker');
-    }, 15000);
-
-    it('should prioritize lead over coordinator in owner resolution', async () => {
-      const ownerAssignments: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') ownerAssignments.push(event.ownerName);
-      });
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke' },
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'coord-bot', cli: 'claude', role: 'coordinator' },
-          { name: 'lead-bot', cli: 'claude', role: 'lead' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'specialist', task: 'Do work' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments[0]).toBe('lead-bot');
-    }, 15000);
-
-    it('should spawn a separate worker and supervisor for dedicated owner steps', async () => {
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'Observed progress on channel\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      const spawnCalls = (mockRelayInstance.spawnPty as any).mock.calls;
-      expect(spawnCalls[0][0].name).toContain('step-1-worker');
-      expect(spawnCalls[1][0].name).toContain('step-1-owner');
-      expect(spawnCalls[0][0].task).not.toContain('STEP_COMPLETE:step-1');
-      expect(spawnCalls[1][0].task).toContain('You are the step owner/supervisor for step "step-1".');
-    }, 15000);
-  });
-
-  // ── Scenario 2: github-integration NOT matched as hub ───────────────────
-
-  describe('Scenario 2: Hub word-boundary matching', () => {
-    it('should NOT match "github-integration" as hub-role agent', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke' },
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'github-integration', cli: 'claude', role: 'GitHub integration agent' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'github-no-hub', agent: 'specialist', task: 'Test word boundary' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments[0].owner).not.toBe('github-integration');
-      expect(ownerAssignments[0].owner).toBe('specialist');
-    }, 15000);
-
-    it('should NOT match "github-bot" with role "github integration" as hub', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke' },
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'github-bot', cli: 'claude', role: 'github integration' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'specialist', task: 'Do work' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments[0].owner).not.toBe('github-bot');
-      expect(ownerAssignments[0].owner).toBe('specialist');
-    }, 15000);
-  });
-
-  // ── Scenario 3: Review gating — approval flow ──────────────────────────
-
-  describe('Scenario 3: Review gating approval', () => {
-    it('should emit step:review-completed with approved decision', async () => {
-      const reviewEvents: Array<{ decision: string; reviewerName: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          reviewEvents.push({ decision: event.decision, reviewerName: event.reviewerName });
-        }
-      });
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-      expect(reviewEvents.length).toBeGreaterThanOrEqual(1);
-      expect(reviewEvents[0].decision).toBe('approved');
-    }, 15000);
-
-    it('should gate step completion on review approval', async () => {
-      const stepEvents: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:completed' || event.type === 'step:review-completed') {
-          stepEvents.push(event.type);
-        }
-      });
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-      const reviewIdx = stepEvents.indexOf('step:review-completed');
-      const completedIdx = stepEvents.indexOf('step:completed');
-      expect(reviewIdx).toBeGreaterThanOrEqual(0);
-      expect(reviewIdx).toBeLessThan(completedIdx);
-    }, 15000);
-
-    it('should complete review from streamed REVIEW_DECISION before normal exit', async () => {
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-          const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-          const output = isReview
-            ? 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: streamed completion\n'
-            : stepComplete
-              ? `STEP_COMPLETE:${stepComplete}\n`
-              : 'STEP_COMPLETE:unknown\n';
-
-          queueMicrotask(() => emitRelayEvent('workerOutput', { name, chunk: output }));
-
-          if (!isReview) {
-            return { ...mockAgent, name };
-          }
-
-          let released = false;
-          let resolveExit: ((result: 'released') => void) | undefined;
-          const waitForExit = vi.fn().mockImplementation(() => {
-            if (released) {
-              return Promise.resolve<'released'>('released');
-            }
-            return new Promise<'released'>((resolve) => {
-              resolveExit = resolve;
-            });
-          });
-          const release = vi.fn().mockImplementation(async () => {
-            released = true;
-            resolveExit?.('released');
-          });
-
-          return {
-            name,
-            waitForExit,
-            waitForIdle: vi.fn().mockImplementation(() => never()),
-            release,
-          };
-        }
-      );
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-
-      expect(run.status).toBe('completed');
-      const spawnResults = (mockRelayInstance.spawnPty as any).mock.results;
-      const reviewAgent = await spawnResults[spawnResults.length - 1].value;
-      expect(reviewAgent.name).toContain('step-1-review');
-      expect(reviewAgent.release).toHaveBeenCalledTimes(1);
-    }, 15000);
-
-    it('should mirror worker output to the channel for owner observation', async () => {
-      mockSpawnOutputs = [
-        'worker progress update\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n',
-      ];
-
-      const run = await runner.execute(
-        makeSupervisedConfig({ verification: { type: 'output_contains', value: 'worker progress update' } }),
-        'default'
-      );
-      expect(run.status).toBe('completed');
-
-      const channelMessages = (mockRelaycastAgent.send as any).mock.calls.map(
-        ([, text]: [string, string]) => text
-      );
-      expect(channelMessages.some((text: string) => text.includes('worker progress update'))).toBe(true);
-      expect(channelMessages.some((text: string) => text.includes('Worker `step-1-worker'))).toBe(true);
-    }, 15000);
-  });
-
-  // ── Scenario 4: Review gating — rejection flow ─────────────────────────
-
-  describe('Scenario 4: Review gating rejection', () => {
-    it('should fail the step when reviewer rejects', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: REJECT\nREVIEW_REASON: output is incomplete\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review rejected');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    }, 15000);
-
-    it('should fail closed when review output is malformed (no REVIEW_DECISION)', async () => {
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_REASON: this is missing the decision line\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review response malformed');
-    }, 15000);
-
-    it('should use last REVIEW_DECISION match when PTY echoes prompt (reject)', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      const echoedPrompt =
-        'Return exactly:\nREVIEW_DECISION: APPROVE or REJECT\nREVIEW_REASON: <one sentence>\n';
-      const actualResponse = 'REVIEW_DECISION: REJECT\nREVIEW_REASON: code has critical bugs\n';
-      mockSpawnOutputs = ['worker finished\n', 'STEP_COMPLETE:step-1\n', echoedPrompt + actualResponse];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    }, 15000);
-  });
-
-  // ── Scenario 5: Review timeout budgeting ───────────────────────────────
-
-  describe('Scenario 5: Review timeout budgeting', () => {
-    it('should use the full remaining step timeout as the review safety backstop', async () => {
-      const config = makeSupervisedConfig({ timeoutMs: 90_000 });
-
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-          const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-          const output = isReview
-            ? ''
-            : stepComplete
-              ? `STEP_COMPLETE:${stepComplete}\n`
-              : 'worker finished\n';
-
-          if (output) {
-            queueMicrotask(() => emitRelayEvent('workerOutput', { name, chunk: output }));
-          }
-
-          return {
-            name,
-            waitForExit: vi.fn().mockResolvedValue(isReview ? 'timeout' : 'exited'),
-            waitForIdle: vi.fn().mockImplementation(() => never()),
-            release: vi.fn().mockResolvedValue(undefined),
-          };
-        }
-      );
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review safety backstop timed out');
-
-      const spawnResults = (mockRelayInstance.spawnPty as any).mock.results;
-      const reviewAgent = await spawnResults[spawnResults.length - 1].value;
-      const reviewTimeout = reviewAgent.waitForExit.mock.calls[0][0];
-      expect(reviewTimeout).toBeGreaterThan(60_000);
-      expect(reviewTimeout).toBeLessThanOrEqual(90_000);
-    }, 15000);
-
-    it('should default the review safety backstop to 10 minutes when no step timeout is set', async () => {
-      const config = makeSupervisedConfig();
-
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-          const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-          const output = isReview
-            ? ''
-            : stepComplete
-              ? `STEP_COMPLETE:${stepComplete}\n`
-              : 'worker finished\n';
-
-          if (output) {
-            queueMicrotask(() => emitRelayEvent('workerOutput', { name, chunk: output }));
-          }
-
-          return {
-            name,
-            waitForExit: vi.fn().mockResolvedValue(isReview ? 'timeout' : 'exited'),
-            waitForIdle: vi.fn().mockImplementation(() => never()),
-            release: vi.fn().mockResolvedValue(undefined),
-          };
-        }
-      );
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review safety backstop timed out after 600000ms');
-
-      const spawnResults = (mockRelayInstance.spawnPty as any).mock.results;
-      const reviewAgent = await spawnResults[spawnResults.length - 1].value;
-      expect(reviewAgent.waitForExit).toHaveBeenCalledWith(600_000);
-    }, 15000);
-  });
-
-  // ── Scenario 6: Owner timeout emission ─────────────────────────────────
-
-  describe('Scenario 6: Owner timeout events', () => {
-    it('should emit step:owner-timeout when owner exceeds time limit', async () => {
-      const events: Array<{ type: string; stepName?: string; ownerName?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-timeout') {
-          events.push({ type: event.type, stepName: event.stepName, ownerName: event.ownerName });
-        }
-      });
-
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-      waitForIdleFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('timed out');
-      expect(events.length).toBeGreaterThanOrEqual(1);
-      expect(events[0].type).toBe('step:owner-timeout');
-      expect(events[0].stepName).toBe('step-1');
-    }, 15000);
-
-    it('should NOT emit step:owner-timeout for successful reviews', async () => {
-      const ownerTimeouts: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-timeout') ownerTimeouts.push(event.stepName);
-      });
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerTimeouts).toHaveLength(0);
-    }, 15000);
-  });
-
-  // ── Scenario 7: Multi-agent team with owner assignment ─────────────────
-
-  describe('Scenario 7: Lead + workers team pattern', () => {
-    it('should assign lead as owner for worker steps in a team', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string; step: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({
-            owner: event.ownerName,
-            specialist: event.specialistName,
-            step: event.stepName,
-          });
-        }
-      });
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke' },
-        agents: [
-          { name: 'team-lead', cli: 'claude', role: 'Lead coordinator' },
-          { name: 'worker-1', cli: 'claude', role: 'implementer' },
-          { name: 'worker-2', cli: 'claude', role: 'implementer' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'work-1', agent: 'worker-1', task: 'Do task A' },
-              { name: 'work-2', agent: 'worker-2', task: 'Do task B' },
-              {
-                name: 'lead-coord',
-                agent: 'team-lead',
-                task: 'Coordinate workers',
-                dependsOn: ['work-1', 'work-2'],
-              },
-            ],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments.length).toBeGreaterThanOrEqual(3);
-
-      const worker1Owner = ownerAssignments.find((a) => a.step === 'work-1');
-      const worker2Owner = ownerAssignments.find((a) => a.step === 'work-2');
-      expect(worker1Owner?.owner).toBe('team-lead');
-      expect(worker2Owner?.owner).toBe('team-lead');
-
-      const leadOwner = ownerAssignments.find((a) => a.step === 'lead-coord');
-      expect(leadOwner?.owner).toBe('team-lead');
-    }, 30000);
-  });
-
-  // ── Scenario 8: YAML workflow parsing ──────────────────────────────────
-
-  describe('Scenario 8: E2E workflow YAML validation', () => {
-    it('should parse the e2e-owner-review.yaml without errors', () => {
-      const yamlPath = resolve(__dirname, '../../../../tests/workflows/e2e-owner-review.yaml');
-      const yamlContent = readFileSync(yamlPath, 'utf-8');
-
-      // parseYamlString is an instance method
-      const config = runner.parseYamlString(yamlContent);
-      expect(config.name).toBe('e2e-owner-review');
-      expect(config.agents).toHaveLength(5);
-      expect(config.workflows).toHaveLength(1);
-
-      const agentNames = config.agents!.map((a: any) => a.name);
-      expect(agentNames).toContain('team-lead');
-      expect(agentNames).toContain('github-integration');
-      expect(agentNames).toContain('impl-worker');
-      expect(agentNames).toContain('quality-reviewer');
-      expect(agentNames).toContain('coordinator-bot');
-
-      const steps = config.workflows![0].steps;
-      const stepNames = steps.map((s: any) => s.name);
-      expect(stepNames).toContain('hub-owner-test');
-      expect(stepNames).toContain('github-no-hub-match');
-      expect(stepNames).toContain('review-approval-gate');
-      expect(stepNames).toContain('deliberate-bad-output');
-      expect(stepNames).toContain('tight-timeout-step');
-      expect(stepNames).toContain('team-lead-coord');
-      expect(stepNames).toContain('merge-results');
-    });
-
-    it('should detect hub-role agents correctly from YAML', () => {
-      const yamlPath = resolve(__dirname, '../../../../tests/workflows/e2e-owner-review.yaml');
-      const yamlContent = readFileSync(yamlPath, 'utf-8');
-      const config = runner.parseYamlString(yamlContent);
-
-      const teamLead = config.agents!.find((a: any) => a.name === 'team-lead');
-      expect(teamLead?.role).toMatch(/\blead\b/i);
-
-      const githubAgent = config.agents!.find((a: any) => a.name === 'github-integration');
-      expect(githubAgent?.role).not.toMatch(/\bhub\b/i);
-      expect(githubAgent?.name).not.toMatch(/\bhub\b/i);
-
-      const coordBot = config.agents!.find((a: any) => a.name === 'coordinator-bot');
-      expect(coordBot?.role).toMatch(/\bcoordinator\b/i);
-    });
-  });
-
-  // ── Scenario 9: Owner completion marker validation ─────────────────────
-
-  describe('Scenario 9: Owner completion marker', () => {
-    it('should fail when owner does not provide a marker, decision, or evidence', async () => {
-      mockSpawnOutputs = ['The work is done but I forgot the sentinel.\n'];
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('owner completion decision missing');
-    }, 15000);
-
-    it('should succeed when owner produces correct STEP_COMPLETE:step-name', async () => {
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-  });
-});
diff --git a/packages/sdk/src/__tests__/error-scenarios.test.ts b/packages/sdk/src/__tests__/error-scenarios.test.ts
deleted file mode 100644
index 531b6ce0d..000000000
--- a/packages/sdk/src/__tests__/error-scenarios.test.ts
+++ /dev/null
@@ -1,693 +0,0 @@
-/**
- * Error scenario tests across all swarm workflow services.
- *
- * Tests failure modes, edge cases, and error propagation in
- * StateStore, BarrierManager, SwarmCoordinator, and WorkflowRunner.
- */
-
-import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
-import { StateStore } from '../workflows/state.js';
-import { BarrierManager } from '../workflows/barrier.js';
-import { SwarmCoordinator } from '../workflows/coordinator.js';
-import type { DbClient } from '../workflows/coordinator.js';
-import type { BarrierRow } from '../workflows/barrier.js';
-import type { StateEntry } from '../workflows/state.js';
-
-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-function makeDb(): DbClient {
-  return {
-    query: vi.fn().mockResolvedValue({ rows: [] }),
-  };
-}
-
-// ── StateStore error scenarios ───────────────────────────────────────────────
-
-describe('StateStore error scenarios', () => {
-  let db: DbClient;
-  let store: StateStore;
-
-  beforeEach(() => {
-    db = makeDb();
-    store = new StateStore(db);
-  });
-
-  describe('consensus gating', () => {
-    it('should reject writes when consensus gate returns false', async () => {
-      store.setConsensusGate(async () => false);
-
-      await expect(store.set('run_1', 'key', 'value', 'agent-1')).rejects.toThrow(
-        'rejected by consensus gate'
-      );
-    });
-
-    it('should emit state:gated event on rejection', async () => {
-      const spy = vi.fn();
-      store.on('state:gated', spy);
-      store.setConsensusGate(async () => false);
-
-      await store.set('run_1', 'key', 'value', 'agent-1').catch(() => {});
-
-      expect(spy).toHaveBeenCalledWith('run_1', 'key', 'agent-1');
-    });
-
-    it('should allow writes when consensus gate returns true', async () => {
-      const entry: StateEntry = {
-        id: 'st_1',
-        runId: 'run_1',
-        namespace: 'default',
-        key: 'key',
-        value: 'value',
-        expiresAt: null,
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      };
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [entry] });
-      store.setConsensusGate(async () => true);
-
-      const result = await store.set('run_1', 'key', 'value', 'agent-1');
-      expect(result).toEqual(entry);
-    });
-
-    it('should clear consensus gate', async () => {
-      store.setConsensusGate(async () => false);
-      store.clearConsensusGate();
-
-      const entry: StateEntry = {
-        id: 'st_1',
-        runId: 'run_1',
-        namespace: 'default',
-        key: 'key',
-        value: 'value',
-        expiresAt: null,
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      };
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [entry] });
-
-      await expect(store.set('run_1', 'key', 'value', 'agent-1')).resolves.toBeDefined();
-    });
-  });
-
-  describe('DB failures', () => {
-    it('should propagate DB errors on set', async () => {
-      vi.mocked(db.query).mockRejectedValueOnce(new Error('connection lost'));
-      await expect(store.set('run_1', 'key', 'v', 'agent')).rejects.toThrow('connection lost');
-    });
-
-    it('should propagate DB errors on get', async () => {
-      vi.mocked(db.query).mockRejectedValueOnce(new Error('timeout'));
-      await expect(store.get('run_1', 'key')).rejects.toThrow('timeout');
-    });
-
-    it('should propagate DB errors on delete', async () => {
-      vi.mocked(db.query).mockRejectedValueOnce(new Error('disk full'));
-      await expect(store.delete('run_1', 'key')).rejects.toThrow('disk full');
-    });
-  });
-
-  describe('namespace isolation', () => {
-    it('should use custom namespace when provided', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await store.get('run_1', 'key', { namespace: 'custom' });
-      expect(db.query).toHaveBeenCalledWith(expect.any(String), ['run_1', 'custom', 'key']);
-    });
-
-    it('should use default namespace when not provided', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await store.get('run_1', 'key');
-      expect(db.query).toHaveBeenCalledWith(expect.any(String), ['run_1', 'default', 'key']);
-    });
-  });
-
-  describe('TTL', () => {
-    it('should set expiresAt when ttlMs provided', async () => {
-      const entry: StateEntry = {
-        id: 'st_1',
-        runId: 'run_1',
-        namespace: 'default',
-        key: 'key',
-        value: 'v',
-        expiresAt: new Date(Date.now() + 5000).toISOString(),
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      };
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [entry] });
-
-      const result = await store.set('run_1', 'key', 'v', 'agent', { ttlMs: 5000 });
-      expect(result.expiresAt).not.toBeNull();
-    });
-  });
-
-  describe('event emission', () => {
-    it('should emit state:set on successful write', async () => {
-      const entry: StateEntry = {
-        id: 'st_1',
-        runId: 'run_1',
-        namespace: 'default',
-        key: 'key',
-        value: 'v',
-        expiresAt: null,
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      };
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [entry] });
-
-      const spy = vi.fn();
-      store.on('state:set', spy);
-
-      await store.set('run_1', 'key', 'v', 'agent');
-      expect(spy).toHaveBeenCalledWith(entry);
-    });
-
-    it('should emit state:deleted on successful delete', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [{ id: 'st_1' }] });
-
-      const spy = vi.fn();
-      store.on('state:deleted', spy);
-
-      await store.delete('run_1', 'key');
-      expect(spy).toHaveBeenCalledWith('run_1', 'key', 'default');
-    });
-
-    it('should not emit state:deleted when key not found', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-
-      const spy = vi.fn();
-      store.on('state:deleted', spy);
-
-      await store.delete('run_1', 'key');
-      expect(spy).not.toHaveBeenCalled();
-    });
-  });
-
-  describe('snapshot', () => {
-    it('should return empty object for no entries', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      const snapshot = await store.snapshot('run_1');
-      expect(snapshot).toEqual({});
-    });
-
-    it('should build key-value map from entries', async () => {
-      const entries: StateEntry[] = [
-        {
-          id: '1',
-          runId: 'run_1',
-          namespace: 'default',
-          key: 'a',
-          value: 1,
-          expiresAt: null,
-          createdAt: '',
-          updatedAt: '',
-        },
-        {
-          id: '2',
-          runId: 'run_1',
-          namespace: 'default',
-          key: 'b',
-          value: 'hello',
-          expiresAt: null,
-          createdAt: '',
-          updatedAt: '',
-        },
-      ];
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: entries });
-
-      const snapshot = await store.snapshot('run_1');
-      expect(snapshot).toEqual({ a: 1, b: 'hello' });
-    });
-  });
-});
-
-// ── BarrierManager error scenarios ───────────────────────────────────────────
-
-describe('BarrierManager error scenarios', () => {
-  let db: DbClient;
-  let manager: BarrierManager;
-
-  beforeEach(() => {
-    db = makeDb();
-    manager = new BarrierManager(db);
-  });
-
-  afterEach(() => {
-    manager.cleanup();
-  });
-
-  describe('barrier creation', () => {
-    it('should create barrier and emit barrier:created', async () => {
-      const barrier: BarrierRow = {
-        id: 'bar_1',
-        runId: 'run_1',
-        barrierName: 'test-barrier',
-        waitFor: ['agent-a', 'agent-b'],
-        resolved: [],
-        isSatisfied: false,
-        timeoutMs: null,
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      };
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [barrier] });
-
-      const spy = vi.fn();
-      manager.on('barrier:created', spy);
-
-      const result = await manager.createBarrier('run_1', {
-        name: 'test-barrier',
-        waitFor: ['agent-a', 'agent-b'],
-      });
-
-      expect(result.barrierName).toBe('test-barrier');
-      expect(spy).toHaveBeenCalledWith(barrier);
-    });
-
-    it('should create multiple barriers in batch', async () => {
-      const barrier: BarrierRow = {
-        id: 'bar_1',
-        runId: 'run_1',
-        barrierName: 'b1',
-        waitFor: ['a'],
-        resolved: [],
-        isSatisfied: false,
-        timeoutMs: null,
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      };
-      vi.mocked(db.query).mockResolvedValue({ rows: [barrier] });
-
-      const results = await manager.createBarriers('run_1', [
-        { name: 'b1', waitFor: ['a'] },
-        { name: 'b2', waitFor: ['b'] },
-      ]);
-
-      expect(results).toHaveLength(2);
-    });
-  });
-
-  describe('barrier resolution', () => {
-    it('should resolve barrier and check satisfaction (all mode)', async () => {
-      const barrier: BarrierRow = {
-        id: 'bar_1',
-        runId: 'run_1',
-        barrierName: 'b1',
-        waitFor: ['agent-a', 'agent-b'],
-        resolved: ['agent-a'],
-        isSatisfied: false,
-        timeoutMs: null,
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      };
-
-      // First, create the barrier to set the mode
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [barrier] });
-      await manager.createBarrier('run_1', {
-        name: 'b1',
-        waitFor: ['agent-a', 'agent-b'],
-        mode: 'all',
-      });
-
-      // Now resolve with partial (not satisfied yet)
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [barrier] });
-      const result = await manager.resolve('run_1', 'b1', 'agent-a');
-      expect(result.satisfied).toBe(false);
-    });
-
-    it('should satisfy barrier in any mode with single resolution', async () => {
-      const barrier: BarrierRow = {
-        id: 'bar_1',
-        runId: 'run_1',
-        barrierName: 'b1',
-        waitFor: ['agent-a', 'agent-b'],
-        resolved: ['agent-a'],
-        isSatisfied: false,
-        timeoutMs: null,
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      };
-
-      // Create barrier in "any" mode
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [barrier] });
-      await manager.createBarrier('run_1', {
-        name: 'b1',
-        waitFor: ['agent-a', 'agent-b'],
-        mode: 'any',
-      });
-
-      // Resolve — should satisfy immediately since mode is "any"
-      vi.mocked(db.query)
-        .mockResolvedValueOnce({ rows: [barrier] }) // resolve UPDATE
-        .mockResolvedValueOnce({ rows: [{ ...barrier, isSatisfied: true }] }); // markSatisfied UPDATE
-
-      const satisfiedSpy = vi.fn();
-      manager.on('barrier:satisfied', satisfiedSpy);
-
-      const result = await manager.resolve('run_1', 'b1', 'agent-a');
-      expect(result.satisfied).toBe(true);
-      expect(satisfiedSpy).toHaveBeenCalled();
-    });
-
-    it('should throw when barrier not found during resolve', async () => {
-      // resolve UPDATE returns empty
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      // getBarrier also returns empty
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-
-      await expect(manager.resolve('run_1', 'nonexistent', 'agent-a')).rejects.toThrow('not found');
-    });
-
-    it('should return existing state when barrier already satisfied', async () => {
-      const barrier: BarrierRow = {
-        id: 'bar_1',
-        runId: 'run_1',
-        barrierName: 'b1',
-        waitFor: ['a'],
-        resolved: ['a'],
-        isSatisfied: true,
-        timeoutMs: null,
-        createdAt: '',
-        updatedAt: '',
-      };
-
-      // resolve UPDATE returns empty (already satisfied, WHERE is_satisfied=FALSE doesn't match)
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      // getBarrier returns the already-satisfied barrier
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [barrier] });
-
-      const result = await manager.resolve('run_1', 'b1', 'a');
-      expect(result.satisfied).toBe(true);
-    });
-  });
-
-  describe('barrier timeout', () => {
-    it('should schedule timeout and emit barrier:timeout', async () => {
-      vi.useFakeTimers();
-
-      const barrier: BarrierRow = {
-        id: 'bar_1',
-        runId: 'run_1',
-        barrierName: 'b1',
-        waitFor: ['a'],
-        resolved: [],
-        isSatisfied: false,
-        timeoutMs: 1000,
-        createdAt: '',
-        updatedAt: '',
-      };
-
-      vi.mocked(db.query).mockResolvedValue({ rows: [barrier] });
-
-      const timeoutSpy = vi.fn();
-      manager.on('barrier:timeout', timeoutSpy);
-
-      await manager.createBarrier('run_1', {
-        name: 'b1',
-        waitFor: ['a'],
-        timeoutMs: 1000,
-      });
-
-      await vi.advanceTimersByTimeAsync(1100);
-
-      expect(timeoutSpy).toHaveBeenCalledWith(barrier);
-
-      vi.useRealTimers();
-    });
-  });
-
-  describe('cleanup', () => {
-    it('should clear all timeout timers', async () => {
-      const barrier: BarrierRow = {
-        id: 'bar_1',
-        runId: 'run_1',
-        barrierName: 'b1',
-        waitFor: ['a'],
-        resolved: [],
-        isSatisfied: false,
-        timeoutMs: 60000,
-        createdAt: '',
-        updatedAt: '',
-      };
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [barrier] });
-
-      await manager.createBarrier('run_1', {
-        name: 'b1',
-        waitFor: ['a'],
-        timeoutMs: 60000,
-      });
-
-      expect(() => manager.cleanup()).not.toThrow();
-    });
-  });
-
-  describe('queries', () => {
-    it('getBarrier should return null for missing barrier', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      const result = await manager.getBarrier('run_1', 'nonexistent');
-      expect(result).toBeNull();
-    });
-
-    it('isSatisfied should return false when barrier does not exist', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      const result = await manager.isSatisfied('run_1', 'missing');
-      expect(result).toBe(false);
-    });
-
-    it('getUnsatisfiedBarriers should query with is_satisfied = FALSE', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await manager.getUnsatisfiedBarriers('run_1');
-      expect(db.query).toHaveBeenCalledWith(expect.stringContaining('is_satisfied = FALSE'), ['run_1']);
-    });
-  });
-});
-
-// ── SwarmCoordinator error scenarios ─────────────────────────────────────────
-
-describe('SwarmCoordinator error scenarios', () => {
-  let db: DbClient;
-  let coordinator: SwarmCoordinator;
-
-  beforeEach(() => {
-    db = makeDb();
-    coordinator = new SwarmCoordinator(db);
-  });
-
-  describe('run lifecycle errors', () => {
-    it('should throw when starting a non-pending run', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.startRun('run_1')).rejects.toThrow('not found or not in pending');
-    });
-
-    it('should throw when completing a non-existent run', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.completeRun('bad')).rejects.toThrow('not found');
-    });
-
-    it('should throw when failing a non-existent run', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.failRun('bad', 'error')).rejects.toThrow('not found');
-    });
-
-    it('should throw when cancelling a non-existent run', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.cancelRun('bad')).rejects.toThrow('not found');
-    });
-  });
-
-  describe('step lifecycle errors', () => {
-    it('should throw when starting a non-pending step', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.startStep('step_bad')).rejects.toThrow('not in pending state');
-    });
-
-    it('should throw when completing a non-running step', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.completeStep('step_bad')).rejects.toThrow('not in running state');
-    });
-
-    it('should throw when failing a non-running step', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.failStep('step_bad', 'err')).rejects.toThrow('not in running state');
-    });
-
-    it('should throw when skipping a non-existent step', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.skipStep('step_bad')).rejects.toThrow('not found');
-    });
-  });
-
-  describe('DB propagation', () => {
-    it('should propagate DB errors from createRun', async () => {
-      vi.mocked(db.query).mockRejectedValueOnce(new Error('connection refused'));
-      await expect(
-        coordinator.createRun('ws-1', {
-          version: '1',
-          name: 'test',
-          swarm: { pattern: 'fan-out' },
-          agents: [{ name: 'a', cli: 'claude' }],
-        })
-      ).rejects.toThrow('connection refused');
-    });
-
-    it('should propagate DB errors from getSteps', async () => {
-      vi.mocked(db.query).mockRejectedValueOnce(new Error('query timeout'));
-      await expect(coordinator.getSteps('run_1')).rejects.toThrow('query timeout');
-    });
-  });
-});
-
-// ── WorkflowRunner error scenarios ───────────────────────────────────────────
-
-describe('WorkflowRunner error scenarios', () => {
-  // Mock AgentRelay for runner tests
-  const mockAgent = {
-    name: 'test-agent',
-    waitForExit: vi.fn().mockResolvedValue(0),
-    release: vi.fn(),
-  };
-
-  vi.mock('@agent-relay/sdk/relay', () => ({
-    AgentRelay: vi.fn().mockImplementation(() => ({
-      spawnPty: vi.fn().mockResolvedValue(mockAgent),
-      human: vi.fn().mockReturnValue({ sendMessage: vi.fn() }),
-      shutdown: vi.fn(),
-    })),
-  }));
-
-  let WorkflowRunner: any;
-  let db: any;
-  let runner: any;
-
-  beforeEach(async () => {
-    const mod = await import('../workflows/runner.js');
-    WorkflowRunner = mod.WorkflowRunner;
-
-    const runs = new Map();
-    const steps = new Map();
-
-    db = {
-      insertRun: vi.fn(async (run: any) => runs.set(run.id, { ...run })),
-      updateRun: vi.fn(async (id: string, patch: any) => {
-        const existing = runs.get(id);
-        if (existing) runs.set(id, { ...existing, ...patch });
-      }),
-      getRun: vi.fn(async (id: string) => runs.get(id) ?? null),
-      insertStep: vi.fn(async (step: any) => steps.set(step.id, { ...step })),
-      updateStep: vi.fn(async (id: string, patch: any) => {
-        const existing = steps.get(id);
-        if (existing) steps.set(id, { ...existing, ...patch });
-      }),
-      getStepsByRunId: vi.fn(async (runId: string) => {
-        return [...steps.values()].filter((s: any) => s.runId === runId);
-      }),
-    };
-
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test' });
-  });
-
-  describe('validation errors', () => {
-    it('should reject non-object config', () => {
-      expect(() => runner.validateConfig('string')).toThrow('non-null object');
-      expect(() => runner.validateConfig(42)).toThrow('non-null object');
-      expect(() => runner.validateConfig(undefined)).toThrow('non-null object');
-    });
-
-    it('should reject config without swarm', () => {
-      expect(() =>
-        runner.validateConfig({ version: '1', name: 'x', agents: [{ name: 'a', cli: 'claude' }] })
-      ).toThrow('missing required field "swarm"');
-    });
-
-    it('should reject config with null swarm', () => {
-      expect(() =>
-        runner.validateConfig({
-          version: '1',
-          name: 'x',
-          swarm: null,
-          agents: [{ name: 'a', cli: 'claude' }],
-        })
-      ).toThrow('missing required field "swarm"');
-    });
-
-    it('should reject workflows with non-object steps', () => {
-      expect(() =>
-        runner.validateConfig({
-          version: '1',
-          name: 'x',
-          swarm: { pattern: 'dag' },
-          agents: [{ name: 'a', cli: 'claude' }],
-          workflows: [{ name: 'wf', steps: ['not-an-object'] }],
-        })
-      ).toThrow('each step must be an object');
-    });
-
-    it('should reject step missing required fields', () => {
-      expect(() =>
-        runner.validateConfig({
-          version: '1',
-          name: 'x',
-          swarm: { pattern: 'dag' },
-          agents: [{ name: 'a', cli: 'claude' }],
-          workflows: [{ name: 'wf', steps: [{ name: 's1', agent: 'a' }] }],
-        })
-      ).toThrow('must have "agent" and "task" string fields');
-    });
-  });
-
-  describe('variable resolution errors', () => {
-    it('should throw on unresolved variable in agent task', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { pattern: 'dag' as const },
-        agents: [{ name: 'a', cli: 'claude' as const, task: 'Fix {{bug}}' }],
-      };
-      expect(() => runner.resolveVariables(config, {})).toThrow('Unresolved variable: {{bug}}');
-    });
-
-    it('should throw on unresolved variable in workflow step task', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { pattern: 'dag' as const },
-        agents: [{ name: 'a', cli: 'claude' as const }],
-        workflows: [
-          {
-            name: 'wf',
-            steps: [{ name: 's1', agent: 'a', task: 'Deploy to {{env}}' }],
-          },
-        ],
-      };
-      expect(() => runner.resolveVariables(config, {})).toThrow('Unresolved variable: {{env}}');
-    });
-  });
-
-  describe('execution errors', () => {
-    it('should fail run when workflow not found by name', async () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { pattern: 'dag' as const },
-        agents: [{ name: 'a', cli: 'claude' as const }],
-        workflows: [{ name: 'wf1', steps: [{ name: 's1', agent: 'a', task: 'x' }] }],
-      };
-
-      await expect(runner.execute(config, 'nonexistent')).rejects.toThrow('not found');
-    });
-
-    it('should fail run when config has no workflows', async () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { pattern: 'dag' as const },
-        agents: [{ name: 'a', cli: 'claude' as const }],
-      };
-
-      await expect(runner.execute(config)).rejects.toThrow('No workflows defined');
-    });
-  });
-
-  describe('resume errors', () => {
-    it('should throw when resuming non-existent run', async () => {
-      await expect(runner.resume('bad_id')).rejects.toThrow('not found');
-    });
-  });
-});
diff --git a/packages/sdk/src/__tests__/file-db.test.ts b/packages/sdk/src/__tests__/file-db.test.ts
deleted file mode 100644
index 7e3de6259..000000000
--- a/packages/sdk/src/__tests__/file-db.test.ts
+++ /dev/null
@@ -1,266 +0,0 @@
-/**
- * Tests for JsonFileWorkflowDb — in-memory cache is authoritative.
- *
- * Regression: before this file existed, `getRun` re-read the jsonl from
- * disk on every call. If a write failed (EACCES in cloud, ENOSPC, etc.)
- * the cache-less implementation would return stale data, which in turn
- * caused `WorkflowRunner.execute()` to report a completed run as
- * `status: 'running'` to callers.
- */
-
-import { afterEach, beforeEach, describe, expect, it } from 'vitest';
-import { chmodSync, existsSync, mkdirSync, mkdtempSync, readFileSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import { JsonFileWorkflowDb } from '../workflows/file-db.js';
-import type { WorkflowRunRow, WorkflowStepRow } from '../workflows/types.js';
-
-function makeRun(overrides: Partial<WorkflowRunRow> = {}): WorkflowRunRow {
-  const now = new Date().toISOString();
-  return {
-    id: 'run_test',
-    workflowName: 'test',
-    status: 'pending',
-    createdAt: now,
-    updatedAt: now,
-    ...overrides,
-  };
-}
-
-function makeStep(overrides: Partial<WorkflowStepRow> = {}): WorkflowStepRow {
-  const now = new Date().toISOString();
-  return {
-    id: 'step_test',
-    runId: 'run_test',
-    stepName: 'test-step',
-    status: 'pending',
-    attempts: 0,
-    createdAt: now,
-    updatedAt: now,
-    ...overrides,
-  };
-}
-
-describe('JsonFileWorkflowDb', () => {
-  let tmpDir: string;
-
-  beforeEach(() => {
-    tmpDir = mkdtempSync(path.join(os.tmpdir(), 'filedb-test-'));
-  });
-
-  afterEach(() => {
-    try {
-      // Restore perms in case a test made the dir read-only.
-      chmodSync(tmpDir, 0o755);
-    } catch {
-      /* no-op */
-    }
-    rmSync(tmpDir, { recursive: true, force: true });
-  });
-
-  it('round-trips a run through cache without re-reading disk', async () => {
-    const dbPath = path.join(tmpDir, 'workflow-runs.jsonl');
-    const db = new JsonFileWorkflowDb(dbPath);
-    expect(db.isWritable()).toBe(true);
-
-    await db.insertRun(makeRun({ id: 'run_1', status: 'running' }));
-    await db.updateRun('run_1', { status: 'completed' });
-
-    const run = await db.getRun('run_1');
-    expect(run?.status).toBe('completed');
-
-    // The new write should also be durable.
-    const raw = readFileSync(dbPath, 'utf8');
-    expect(raw).toContain('"status":"completed"');
-  });
-
-  it('returns the latest run status even when the disk write silently fails', async () => {
-    // Deny writes to the storage directory so appendFileSync throws EACCES.
-    // On directories the mode controls whether new entries can be added —
-    // existing files inside become effectively read-only for append.
-    const dbPath = path.join(tmpDir, 'workflow-runs.jsonl');
-    const db = new JsonFileWorkflowDb(dbPath);
-    await db.insertRun(makeRun({ id: 'run_1', status: 'running' }));
-
-    // Revoke directory write permission AFTER the initial insert so the
-    // next append fails while the cache should still track the update.
-    chmodSync(tmpDir, 0o555);
-
-    await db.updateRun('run_1', { status: 'completed' });
-
-    // The in-memory mirror must reflect the update regardless of disk state.
-    const run = await db.getRun('run_1');
-    expect(run?.status).toBe('completed');
-  });
-
-  it('keeps cache state authoritative when disk writes lazy-fail (default, no fallback)', async () => {
-    // With homeFallback default (false), the constructor is optimistic about
-    // an unwritable directory — writable=true, first append() throws lazily.
-    // The key invariant: cache state is NOT lost even when the durable write
-    // never lands. This is the regression guard for the "workflow passes but
-    // reports status: running" bug.
-    const unwritableDir = path.join(tmpDir, 'unwritable');
-    mkdirSync(unwritableDir, { recursive: true });
-    chmodSync(unwritableDir, 0o555);
-    const blockedPath = path.join(unwritableDir, 'workflow-runs.jsonl');
-
-    const db = new JsonFileWorkflowDb(blockedPath); // default homeFallback: false
-    expect(db.isWritable()).toBe(true);
-
-    await db.insertRun(makeRun({ id: 'run_mem', status: 'running' }));
-    await db.updateRun('run_mem', { status: 'completed' });
-
-    const run = await db.getRun('run_mem');
-    expect(run?.status).toBe('completed');
-    // The jsonl was never created — disk writes all failed.
-    expect(existsSync(blockedPath)).toBe(false);
-  });
-
-  it('opt-in homeFallback: true → unwritable path routes to $HOME/.agent-relay', () => {
-    const unwritableDir = path.join(tmpDir, 'unwritable');
-    mkdirSync(unwritableDir, { recursive: true });
-    chmodSync(unwritableDir, 0o555);
-    const blockedPath = path.join(unwritableDir, 'workflow-runs.jsonl');
-
-    const db = new JsonFileWorkflowDb({
-      filePath: blockedPath,
-      homeFallback: true,
-    });
-
-    const resolved = db.getStoragePath();
-    expect(db.isWritable()).toBe(true);
-    expect(resolved.startsWith(os.homedir())).toBe(true);
-    expect(resolved).toContain(path.join('.agent-relay', 'workflow-runs-workflow-runs.jsonl'));
-  });
-
-  // Regression for PR #757 Codex review feedback: the primary path's
-  // directory can be writable while the jsonl file itself is read-only
-  // (relayfile-mount chmods synced files to 0o444 while leaving the
-  // parent dir at 0o755). The old dir-only probe would accept the
-  // primary path, every append would lazy-fail, and homeFallback
-  // would never kick in despite the caller explicitly opting in.
-  it('opt-in homeFallback: true → read-only file with writable dir still falls back', () => {
-    const writableDir = path.join(tmpDir, 'project');
-    mkdirSync(writableDir, { recursive: true });
-    const primaryPath = path.join(writableDir, 'workflow-runs.jsonl');
-    writeFileSync(primaryPath, ''); // create the file so chmod targets it
-    chmodSync(primaryPath, 0o444); // file read-only; dir still 0o755
-
-    const db = new JsonFileWorkflowDb({
-      filePath: primaryPath,
-      homeFallback: true,
-    });
-
-    const resolved = db.getStoragePath();
-    expect(db.isWritable()).toBe(true);
-    expect(resolved.startsWith(os.homedir())).toBe(true);
-    expect(resolved).not.toBe(primaryPath);
-  });
-
-  it('notifies onWriteFailure on every failed append', async () => {
-    const dbPath = path.join(tmpDir, 'workflow-runs.jsonl');
-    const failures: Array<{ err: unknown; filePath: string }> = [];
-    const db = new JsonFileWorkflowDb({
-      filePath: dbPath,
-      homeFallback: false,
-      onWriteFailure: (err, filePath) => failures.push({ err, filePath }),
-    });
-
-    await db.insertRun(makeRun({ id: 'run_1', status: 'running' }));
-
-    // Making the file itself read-only forces appendFileSync to throw.
-    // (Directory chmod alone is insufficient because appending to an
-    // already-open inode doesn't require directory write.)
-    chmodSync(dbPath, 0o444);
-
-    await db.updateRun('run_1', { status: 'completed' });
-    await db.updateRun('run_1', { status: 'completed' }); // second failure — listener should fire again
-
-    expect(failures.length).toBeGreaterThanOrEqual(2);
-    expect(failures[0].filePath).toBe(dbPath);
-
-    // The cache still reflects the latest state regardless of the write failure.
-    const run = await db.getRun('run_1');
-    expect(run?.status).toBe('completed');
-  });
-
-  it('replays existing jsonl on construction (--resume path)', async () => {
-    const dbPath = path.join(tmpDir, 'workflow-runs.jsonl');
-
-    {
-      const db = new JsonFileWorkflowDb(dbPath);
-      await db.insertRun(makeRun({ id: 'run_replay', status: 'running' }));
-      await db.insertStep(makeStep({ id: 'step_1', runId: 'run_replay', status: 'pending' }));
-      await db.updateStep('step_1', { status: 'completed' });
-      await db.updateRun('run_replay', { status: 'completed' });
-    }
-
-    // Fresh instance should see the replayed state.
-    const reloaded = new JsonFileWorkflowDb(dbPath);
-    const run = await reloaded.getRun('run_replay');
-    expect(run?.status).toBe('completed');
-
-    const steps = await reloaded.getStepsByRunId('run_replay');
-    expect(steps).toHaveLength(1);
-    expect(steps[0].status).toBe('completed');
-  });
-
-  // Regression for PR #757 Devin review: InMemoryWorkflowDb shallow-copies
-  // on insert, JsonFileWorkflowDb previously stored the caller's object by
-  // reference. The runner inserts a row and also keeps it in its own map,
-  // then mutates state.row.status directly before calling updateStep/Run —
-  // if the cache held the same reference, those mutations would silently
-  // bypass updateStep's append + timestamp handling.
-  it('insertRun/insertStep do not alias the caller object into the cache', async () => {
-    const dbPath = path.join(tmpDir, 'workflow-runs.jsonl');
-    const db = new JsonFileWorkflowDb(dbPath);
-
-    const run = makeRun({ id: 'run_alias', status: 'running' });
-    await db.insertRun(run);
-
-    // Mutate the caller's object post-insert — shouldn't reach the cache.
-    run.status = 'failed';
-    run.error = 'direct mutation should not leak into the db';
-
-    const cached = await db.getRun('run_alias');
-    expect(cached?.status).toBe('running');
-    expect(cached?.error).toBeUndefined();
-
-    const step = makeStep({ id: 'step_alias', runId: 'run_alias', status: 'pending' });
-    await db.insertStep(step);
-    step.status = 'failed';
-    step.error = 'same hazard';
-
-    const cachedSteps = await db.getStepsByRunId('run_alias');
-    expect(cachedSteps).toHaveLength(1);
-    expect(cachedSteps[0].status).toBe('pending');
-    expect(cachedSteps[0].error).toBeUndefined();
-  });
-
-  it('cache insert/update is visible to getStepsByRunId without a disk round-trip', async () => {
-    const dbPath = path.join(tmpDir, 'workflow-runs.jsonl');
-    const db = new JsonFileWorkflowDb(dbPath);
-
-    await db.insertStep(makeStep({ id: 's1', runId: 'r1', stepName: 'a', status: 'pending' }));
-    await db.insertStep(makeStep({ id: 's2', runId: 'r1', stepName: 'b', status: 'pending' }));
-    await db.updateStep('s1', { status: 'completed' });
-
-    const steps = await db.getStepsByRunId('r1');
-    expect(steps.map((s) => `${s.stepName}=${s.status}`).sort()).toEqual(['a=completed', 'b=pending']);
-  });
-
-  it('hasStepOutputs still works relative to the resolved storage path', () => {
-    const dbPath = path.join(tmpDir, 'workflow-runs.jsonl');
-    const db = new JsonFileWorkflowDb(dbPath);
-
-    const outputsDir = path.join(tmpDir, 'step-outputs', 'run_x');
-    mkdirSync(outputsDir, { recursive: true });
-    // Drop a file so readdirSync reports length > 0.
-    writeFileSync(path.join(outputsDir, 'out.txt'), 'hi');
-
-    expect(db.hasStepOutputs('run_x')).toBe(true);
-    expect(db.hasStepOutputs('run_y')).toBe(false);
-    expect(existsSync(dbPath)).toBe(false); // no writes happened yet
-  });
-});
diff --git a/packages/sdk/src/__tests__/idle-nudge.test.ts b/packages/sdk/src/__tests__/idle-nudge.test.ts
deleted file mode 100644
index 86b85bedd..000000000
--- a/packages/sdk/src/__tests__/idle-nudge.test.ts
+++ /dev/null
@@ -1,458 +0,0 @@
-/**
- * Idle nudge detection and escalation tests.
- *
- * Covers both modes:
- * - No idleNudge config: idle is treated as completion.
- * - idleNudge config enabled: waitForExit timeout drives nudges/escalation.
- */
-
-import { describe, it, expect, vi, beforeEach } from 'vitest';
-import type { WorkflowDb } from '../workflows/runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../workflows/types.js';
-
-// ── Mock fetch to prevent real HTTP calls (Relaycast provisioning) ───────────
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_live_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-// ── Mock RelayCast SDK ────────────────────────────────────────────────────────
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: {
-    register: vi.fn().mockResolvedValue({ token: 'token-1' }),
-  },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-class MockRelayError extends Error {
-  code: string;
-  constructor(code: string, message: string, status = 400) {
-    super(message);
-    this.code = code;
-    this.name = 'RelayError';
-    (this as any).status = status;
-  }
-}
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: MockRelayError,
-}));
-
-// ── Mock AgentRelay ───────────────────────────────────────────────────────────
-
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-let waitForIdleFn: (ms?: number) => Promise<'idle' | 'timeout' | 'exited'>;
-
-const mockSendMessage = vi.fn().mockResolvedValue(undefined);
-const mockRelease = vi.fn().mockResolvedValue(undefined);
-
-const mockAgent = {
-  name: 'test-agent-abc',
-  exitCode: 0,
-  exitSignal: undefined,
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return waitForIdleFn;
-  },
-  release: mockRelease,
-  sendMessage: mockSendMessage,
-};
-
-const mockHumanSendMessage = vi.fn().mockResolvedValue(undefined);
-const mockHuman = {
-  name: 'workflow-runner',
-  sendMessage: mockHumanSendMessage,
-};
-
-vi.mock('../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => ({
-    spawnPty: vi.fn().mockResolvedValue(mockAgent),
-    human: vi.fn().mockReturnValue(mockHuman),
-    shutdown: vi.fn().mockResolvedValue(undefined),
-    onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-    addListener: vi.fn(() => () => {}),
-    listAgentsRaw: vi.fn().mockResolvedValue([]),
-  })),
-}));
-
-const { WorkflowRunner } = await import('../workflows/runner.js');
-
-// ── Test fixtures ─────────────────────────────────────────────────────────────
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((s) => s.runId === runId);
-    }),
-  };
-}
-
-function makeConfig(overrides: Partial<RelayYamlConfig> = {}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-workflow',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'agent-a', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [{ name: 'step-1', agent: 'agent-a', task: 'Do step 1' }],
-      },
-    ],
-    trajectories: false,
-    ...overrides,
-  };
-}
-
-function never<T>(): Promise<T> {
-  return new Promise(() => {});
-}
-
-describe('Idle Nudge Detection', () => {
-  let db: WorkflowDb;
-  let runner: InstanceType<typeof WorkflowRunner>;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    db = makeDb();
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test' });
-
-    waitForExitFn = vi.fn().mockResolvedValue('exited');
-    waitForIdleFn = vi.fn().mockResolvedValue('timeout');
-  });
-
-  describe('idleNudge enabled', () => {
-    it('sends direct nudge then completes when exit follows', async () => {
-      let exitCallCount = 0;
-      waitForExitFn = vi.fn().mockImplementation(() => {
-        exitCallCount++;
-        return Promise.resolve(exitCallCount === 1 ? 'timeout' : 'exited');
-      });
-
-      const run = await runner.execute(
-        makeConfig({
-          swarm: {
-            pattern: 'mesh',
-            idleNudge: { nudgeAfterMs: 100, escalateAfterMs: 100, maxNudges: 1 },
-          },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('completed');
-      expect(mockHumanSendMessage).toHaveBeenCalledTimes(1);
-      expect(mockHumanSendMessage).toHaveBeenCalledWith(
-        expect.objectContaining({
-          to: 'test-agent-abc',
-          text: expect.stringContaining('/exit'),
-        })
-      );
-      expect(mockRelease).not.toHaveBeenCalled();
-      expect(waitForIdleFn).not.toHaveBeenCalled();
-    });
-
-    it('uses hub fallback behavior without failing when hub is not active', async () => {
-      let exitCallCount = 0;
-      waitForExitFn = vi.fn().mockImplementation(() => {
-        exitCallCount++;
-        return Promise.resolve(exitCallCount === 1 ? 'timeout' : 'exited');
-      });
-
-      const config = makeConfig({
-        swarm: {
-          pattern: 'hub-spoke',
-          idleNudge: { nudgeAfterMs: 100, escalateAfterMs: 100, maxNudges: 1 },
-        },
-        agents: [
-          { name: 'lead', cli: 'claude', role: 'Lead coordinator' },
-          { name: 'worker', cli: 'claude' },
-        ],
-      });
-      const step = { name: 'step-1', agent: 'worker', task: 'Do work' };
-      const agentDef = { name: 'worker', cli: 'claude' };
-
-      (runner as any).currentConfig = config;
-      (runner as any).relay = { human: vi.fn().mockReturnValue(mockHuman) };
-      const result = await (runner as any).waitForExitWithIdleNudging(mockAgent, agentDef, step, 500);
-
-      expect(result).toBe('exited');
-      expect(mockHumanSendMessage).toHaveBeenCalledTimes(1);
-    });
-
-    it('force-releases after maxNudges is exceeded', async () => {
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(
-        makeConfig({
-          swarm: {
-            pattern: 'dag',
-            idleNudge: { nudgeAfterMs: 50, escalateAfterMs: 50, maxNudges: 1 },
-          },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('force-released');
-      expect(mockHumanSendMessage).toHaveBeenCalledTimes(1);
-      expect(mockRelease).toHaveBeenCalledTimes(1);
-      expect(waitForIdleFn).not.toHaveBeenCalled();
-    });
-
-    it('force-releases after multiple nudges', async () => {
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(
-        makeConfig({
-          swarm: {
-            pattern: 'dag',
-            idleNudge: { nudgeAfterMs: 50, escalateAfterMs: 50, maxNudges: 3 },
-          },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('force-released');
-      expect(mockHumanSendMessage).toHaveBeenCalledTimes(3);
-      expect(mockRelease).toHaveBeenCalledTimes(1);
-    });
-
-    it('emits step:nudged event', async () => {
-      let exitCallCount = 0;
-      waitForExitFn = vi.fn().mockImplementation(() => {
-        exitCallCount++;
-        return Promise.resolve(exitCallCount === 1 ? 'timeout' : 'exited');
-      });
-
-      const events: Array<{ type: string }> = [];
-      runner.on((event) => events.push(event));
-
-      await runner.execute(
-        makeConfig({
-          swarm: {
-            pattern: 'dag',
-            idleNudge: { nudgeAfterMs: 50, escalateAfterMs: 50, maxNudges: 1 },
-          },
-        }),
-        'default'
-      );
-
-      expect(events.filter((e) => e.type === 'step:nudged')).toHaveLength(1);
-    });
-
-    it('emits step:force-released event on escalation', async () => {
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-
-      const events: Array<{ type: string }> = [];
-      runner.on((event) => events.push(event));
-
-      await runner.execute(
-        makeConfig({
-          swarm: {
-            pattern: 'dag',
-            idleNudge: { nudgeAfterMs: 50, escalateAfterMs: 50, maxNudges: 1 },
-          },
-        }),
-        'default'
-      );
-
-      expect(events.filter((e) => e.type === 'step:force-released')).toHaveLength(1);
-    });
-
-    it('uses defaults when idleNudge is empty object', async () => {
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(
-        makeConfig({
-          swarm: {
-            pattern: 'dag',
-            idleNudge: {},
-          },
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('force-released');
-      // default maxNudges is 1
-      expect(mockHumanSendMessage).toHaveBeenCalledTimes(1);
-      expect(mockRelease).toHaveBeenCalledTimes(1);
-    });
-
-    it('respects overall timeout during nudge loop', async () => {
-      // Each waitForExit call takes 100ms (real timer), but the overall timeout
-      // is only 80ms. After the first call (~100ms elapsed), the loop detects
-      // that remaining time is exhausted and returns 'timeout'.
-      waitForExitFn = vi
-        .fn()
-        .mockImplementation(
-          () => new Promise<'timeout'>((resolve) => setTimeout(() => resolve('timeout'), 100))
-        );
-
-      const run = await runner.execute(
-        makeConfig({
-          swarm: {
-            pattern: 'dag',
-            idleNudge: { nudgeAfterMs: 10, escalateAfterMs: 10, maxNudges: 10 },
-          },
-          agents: [{ name: 'agent-a', cli: 'claude', constraints: { timeoutMs: 80 } }],
-        }),
-        'default'
-      );
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('timed out');
-    });
-
-    it('keeps a supervising lead alive after idle nudges are exhausted', async () => {
-      let exitCallCount = 0;
-      waitForExitFn = vi.fn().mockImplementation(() => {
-        exitCallCount++;
-        return Promise.resolve(exitCallCount < 3 ? 'timeout' : 'exited');
-      });
-
-      const config = makeConfig({
-        swarm: {
-          pattern: 'hub-spoke',
-          idleNudge: { nudgeAfterMs: 50, escalateAfterMs: 50, maxNudges: 1 },
-          channel: 'lead-supervision',
-        },
-      });
-      const agentDef = { name: 'team-lead', cli: 'claude', role: 'Lead coordinator' };
-      const step = {
-        name: 'step-1',
-        agent: 'team-lead',
-        task: 'Monitor #lead-supervision for WORKER_DONE, wait for the handoff, then exit.',
-      };
-
-      (runner as any).currentConfig = config;
-      expect((runner as any).shouldPreserveIdleSupervisor(agentDef, step)).toBe(true);
-
-      const result = await (runner as any).waitForExitWithIdleNudging(
-        mockAgent,
-        agentDef,
-        step,
-        500,
-        undefined,
-        true
-      );
-
-      expect(result).toBe('exited');
-      expect(waitForExitFn).toHaveBeenCalledTimes(3);
-      expect(mockRelease).not.toHaveBeenCalled();
-    });
-  });
-
-  describe('Idle = done (no idleNudge config)', () => {
-    it('idle fires first: releases agent and completes step', async () => {
-      waitForIdleFn = vi.fn().mockResolvedValue('idle');
-      waitForExitFn = vi.fn().mockImplementation(() => never());
-
-      const run = await runner.execute(makeConfig(), 'default');
-      const steps = await db.getStepsByRunId(run.id);
-
-      expect(run.status).toBe('completed');
-      expect(steps).toHaveLength(1);
-      expect(steps[0]?.status).toBe('completed');
-      expect(mockRelease).toHaveBeenCalledTimes(1);
-    });
-
-    it('exit fires first: completes without idle-based release', async () => {
-      waitForExitFn = vi.fn().mockResolvedValue('exited');
-      waitForIdleFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(makeConfig(), 'default');
-      const steps = await db.getStepsByRunId(run.id);
-
-      expect(run.status).toBe('completed');
-      expect(steps).toHaveLength(1);
-      expect(steps[0]?.status).toBe('completed');
-      expect(mockRelease).not.toHaveBeenCalled();
-    });
-
-    it('does not treat supervisory lead idleness as completion', async () => {
-      waitForExitFn = vi.fn().mockResolvedValue('exited');
-      waitForIdleFn = vi.fn().mockResolvedValue('idle');
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke', channel: 'lead-supervision' },
-      });
-      const agentDef = { name: 'team-lead', cli: 'claude', role: 'Lead coordinator' };
-      const step = {
-        name: 'step-1',
-        agent: 'team-lead',
-        task: 'Wait on #lead-supervision for WORKER_DONE before handing off.',
-      };
-
-      (runner as any).currentConfig = config;
-      expect((runner as any).shouldPreserveIdleSupervisor(agentDef, step)).toBe(true);
-
-      const result = await (runner as any).waitForExitWithIdleNudging(
-        mockAgent,
-        agentDef,
-        step,
-        500,
-        undefined,
-        true
-      );
-
-      expect(result).toBe('exited');
-      expect(waitForExitFn).toHaveBeenCalledTimes(1);
-      expect(waitForIdleFn).not.toHaveBeenCalled();
-      expect(mockRelease).not.toHaveBeenCalled();
-    });
-
-    it('both timeout: fails step with timeout error', async () => {
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-      waitForIdleFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(makeConfig(), 'default');
-      const steps = await db.getStepsByRunId(run.id);
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('timed out');
-      expect(steps).toHaveLength(1);
-      expect(steps[0]?.status).toBe('failed');
-      expect(steps[0]?.error).toContain('timed out');
-    });
-  });
-});
diff --git a/packages/sdk/src/__tests__/provisioner-mount.test.ts b/packages/sdk/src/__tests__/provisioner-mount.test.ts
deleted file mode 100644
index 92d1ccebd..000000000
--- a/packages/sdk/src/__tests__/provisioner-mount.test.ts
+++ /dev/null
@@ -1,126 +0,0 @@
-import { existsSync } from 'node:fs';
-import { mkdtemp, mkdir, rm, writeFile } from 'node:fs/promises';
-import { tmpdir } from 'node:os';
-import path from 'node:path';
-
-import { afterEach, describe, expect, it } from 'vitest';
-
-import { ensureRelayfileMount } from '../provisioner/mount.js';
-import { createLocalJwksKeyPair, provisionWorkflowAgents } from '../provisioner/index.js';
-
-const tempDirs: string[] = [];
-
-async function makeTempDir(prefix: string): Promise<string> {
-  const dir = await mkdtemp(path.join(tmpdir(), prefix));
-  tempDirs.push(dir);
-  return dir;
-}
-
-async function createFakeMountBinary(): Promise<string> {
-  const root = await makeTempDir('relayfile-mount-bin-');
-  const binaryPath = path.join(root, 'relayfile-mount');
-  await writeFile(
-    binaryPath,
-    [
-      '#!/bin/sh',
-      'LOCAL_DIR=""',
-      'ONCE=0',
-      'while [ "$#" -gt 0 ]; do',
-      '  case "$1" in',
-      '    --local-dir)',
-      '      LOCAL_DIR="$2"',
-      '      shift 2',
-      '      ;;',
-      '    --once)',
-      '      ONCE=1',
-      '      shift',
-      '      ;;',
-      '    *)',
-      '      shift',
-      '      ;;',
-      '  esac',
-      'done',
-      'mkdir -p "$LOCAL_DIR"',
-      'if [ "$ONCE" -eq 1 ]; then',
-      '  printf "seeded\\n" > "$LOCAL_DIR/seeded.txt"',
-      '  exit 0',
-      'fi',
-      'printf "live\\n" > "$LOCAL_DIR/live.txt"',
-      'trap "exit 0" TERM INT',
-      'while :; do sleep 1; done',
-      '',
-    ].join('\n'),
-    { mode: 0o755 }
-  );
-  return binaryPath;
-}
-
-async function waitForPath(filePath: string, timeoutMs = 1000): Promise<boolean> {
-  const deadline = Date.now() + timeoutMs;
-  while (Date.now() < deadline) {
-    if (existsSync(filePath)) {
-      return true;
-    }
-    await new Promise((resolve) => setTimeout(resolve, 25));
-  }
-  return existsSync(filePath);
-}
-
-afterEach(async () => {
-  for (const dir of tempDirs.splice(0)) {
-    await rm(dir, { recursive: true, force: true });
-  }
-});
-
-describe('ensureRelayfileMount', () => {
-  it('runs initial sync, starts the watcher, and removes the mount on stop', async () => {
-    const binaryPath = await createFakeMountBinary();
-    const mountPoint = path.join(await makeTempDir('relayfile-mount-target-'), 'workspace');
-
-    const mount = await ensureRelayfileMount({
-      binaryPath,
-      relayfileUrl: 'http://127.0.0.1:8080',
-      workspace: 'rw_test',
-      token: 'test-token',
-      mountPoint,
-    });
-
-    expect(mount.pid).toBeGreaterThan(0);
-    expect(existsSync(path.join(mountPoint, 'seeded.txt'))).toBe(true);
-    expect(await waitForPath(path.join(mountPoint, 'live.txt'))).toBe(true);
-
-    await mount.stop();
-
-    expect(existsSync(mountPoint)).toBe(false);
-  });
-});
-
-describe('provisionWorkflowAgents mount integration', () => {
-  it('starts a per-agent mount and exposes its mount point in the result', async () => {
-    const projectDir = await makeTempDir('relay-provisioner-project-');
-    const binaryPath = await createFakeMountBinary();
-    await mkdir(path.join(projectDir, 'src'), { recursive: true });
-    await writeFile(path.join(projectDir, 'src', 'index.ts'), 'export const value = 1;\n');
-
-    const result = await provisionWorkflowAgents({
-      tokenSigningKey: createLocalJwksKeyPair(),
-      workspace: 'rw_workspace',
-      projectDir,
-      relayfileBaseUrl: 'http://127.0.0.1:8080',
-      agents: {
-        worker: {
-          access: 'readonly',
-        },
-      },
-      skipSeeding: true,
-      mountBinaryPath: binaryPath,
-    });
-
-    const mount = result.mounts.get('worker');
-    expect(mount).toBeDefined();
-    expect(result.agents.worker.mountPoint).toBe(mount?.mountPoint);
-    expect(existsSync(path.join(mount!.mountPoint, 'seeded.txt'))).toBe(true);
-
-    await mount?.stop();
-  });
-});
diff --git a/packages/sdk/src/__tests__/resume-fallback.test.ts b/packages/sdk/src/__tests__/resume-fallback.test.ts
deleted file mode 100644
index dd02769cd..000000000
--- a/packages/sdk/src/__tests__/resume-fallback.test.ts
+++ /dev/null
@@ -1,429 +0,0 @@
-/**
- * Tests for resuming workflow execution from cached step outputs when the JSONL
- * run database is missing or unavailable.
- */
-
-import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
-import { chmodSync, mkdirSync, mkdtempSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import type { WorkflowDb } from '../workflows/runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../workflows/types.js';
-
-// ── Mock fetch ───────────────────────────────────────────────────────────────
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_live_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-// ── Mock RelayCast SDK ───────────────────────────────────────────────────────
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: {
-    register: vi.fn().mockResolvedValue({ token: 'token-1' }),
-  },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-class MockRelayError extends Error {
-  code: string;
-  constructor(code: string, message: string, status = 400) {
-    super(message);
-    this.code = code;
-    this.name = 'RelayError';
-    (this as any).status = status;
-  }
-}
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: MockRelayError,
-}));
-
-// ── Mock AgentRelay ──────────────────────────────────────────────────────────
-
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-
-const mockAgent = {
-  name: 'test-agent-abc',
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return vi.fn().mockImplementation(() => new Promise(() => {}));
-  },
-  release: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockListeners = new Map<string, Set<(...args: any[]) => void>>();
-function emitMockEvent(event: string, ...args: any[]): void {
-  const set = mockListeners.get(event);
-  if (set) for (const cb of set) cb(...args);
-}
-
-const mockRelayInstance = {
-  spawnPty: vi.fn().mockImplementation(async ({ name, task }: { name: string; task?: string }) => {
-    const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-    const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-    const output = isReview
-      ? 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n'
-      : stepComplete
-        ? `STEP_COMPLETE:${stepComplete}\n`
-        : 'STEP_COMPLETE:unknown\n';
-
-    queueMicrotask(() => {
-      emitMockEvent('workerOutput', { name, chunk: output });
-    });
-
-    return { ...mockAgent, name };
-  }),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  addListener: vi.fn((event: string, cb: (...args: any[]) => void) => {
-    let set = mockListeners.get(event);
-    if (!set) {
-      set = new Set();
-      mockListeners.set(event, set);
-    }
-    set.add(cb);
-    return () => set!.delete(cb);
-  }),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-};
-
-vi.mock('../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-// Import after mocking
-const { WorkflowRunner } = await import('../workflows/runner.js');
-const { JsonFileWorkflowDb } = await import('../workflows/file-db.js');
-
-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((s) => s.runId === runId);
-    }),
-  };
-}
-
-function makeResumeConfig(): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-resume-fallback',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'agent-a', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-a', agent: 'agent-a', task: 'Do step A' },
-          { name: 'step-b', agent: 'agent-a', task: 'Do step B', dependsOn: ['step-a'] },
-          { name: 'step-c', agent: 'agent-a', task: 'Do step C', dependsOn: ['step-b'] },
-        ],
-      },
-    ],
-    trajectories: false,
-  };
-}
-
-function makeTemplateConfig(): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-resume-template',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'agent-a', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-a', agent: 'agent-a', task: 'Generate input' },
-          {
-            name: 'step-b',
-            agent: 'agent-a',
-            task: 'Use cached value: {{steps.step-a.output}}',
-            dependsOn: ['step-a'],
-          },
-        ],
-      },
-    ],
-    trajectories: false,
-  };
-}
-
-function makeRunRow(
-  runId: string,
-  config: RelayYamlConfig,
-  status: WorkflowRunRow['status'] = 'failed'
-): WorkflowRunRow {
-  const now = new Date().toISOString();
-  return {
-    id: runId,
-    workspaceId: 'ws-test',
-    workflowName: 'default',
-    pattern: config.swarm.pattern,
-    status,
-    config,
-    startedAt: now,
-    createdAt: now,
-    updatedAt: now,
-  };
-}
-
-function makeStepRow(
-  runId: string,
-  stepName: string,
-  task: string,
-  dependsOn: string[] = [],
-  status: WorkflowStepRow['status'] = 'pending',
-  output?: string
-): WorkflowStepRow {
-  const now = new Date().toISOString();
-  return {
-    id: `${runId}-${stepName}`,
-    runId,
-    stepName,
-    agentName: 'agent-a',
-    stepType: 'agent',
-    status,
-    task,
-    dependsOn,
-    output,
-    retryCount: 0,
-    createdAt: now,
-    updatedAt: now,
-    startedAt: status !== 'pending' ? now : undefined,
-    completedAt: status === 'completed' ? now : undefined,
-  };
-}
-
-function writeCachedOutput(tmpDir: string, runId: string, stepName: string, output: string): void {
-  const outputDir = path.join(tmpDir, '.agent-relay', 'step-outputs', runId);
-  mkdirSync(outputDir, { recursive: true });
-  writeFileSync(path.join(outputDir, `${stepName}.md`), output);
-}
-
-// ── Tests ────────────────────────────────────────────────────────────────────
-
-describe('resume fallback to step-output cache', () => {
-  let db: WorkflowDb;
-  let runner: InstanceType<typeof WorkflowRunner>;
-  let tmpDir: string;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    waitForExitFn = vi.fn().mockResolvedValue('exited');
-    mockListeners.clear();
-    tmpDir = mkdtempSync(path.join(os.tmpdir(), 'resume-fallback-'));
-    db = makeDb();
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test', cwd: tmpDir });
-  });
-
-  afterEach(() => {
-    try {
-      rmSync(tmpDir, { recursive: true, force: true });
-    } catch {
-      /* noop */
-    }
-  });
-
-  it('should reconstruct run from step-output cache when JSONL missing', async () => {
-    const runId = 'resume-cache-run';
-    const config = makeResumeConfig();
-    writeCachedOutput(tmpDir, runId, 'step-a', 'cached-a');
-    writeCachedOutput(tmpDir, runId, 'step-b', 'cached-b');
-
-    const events: Array<{ type: string; stepName?: string }> = [];
-    runner.on((event) => {
-      if ('stepName' in event) {
-        events.push({ type: event.type, stepName: event.stepName });
-      }
-    });
-
-    const run = await (runner as any).resume(runId, undefined, config);
-    expect(run.status, run.error).toBe('completed');
-
-    const startedSteps = events.filter((e) => e.type === 'step:started').map((e) => e.stepName);
-    expect(startedSteps).not.toContain('step-a');
-    expect(startedSteps).not.toContain('step-b');
-    expect(startedSteps).toContain('step-c');
-  });
-
-  it('should throw "not found" when neither JSONL nor cache exists', async () => {
-    const config = makeResumeConfig();
-
-    await expect((runner as any).resume('nonexistent-id', undefined, config)).rejects.toThrow('not found');
-  });
-
-  it('should prefer JSONL database over step-output cache', async () => {
-    const runId = 'resume-db-run';
-    const config = makeResumeConfig();
-    const dbPath = path.join(tmpDir, '.agent-relay', 'workflow-runs.jsonl');
-    const fileDb = new JsonFileWorkflowDb(dbPath);
-    const dbRunner = new WorkflowRunner({ db: fileDb, workspaceId: 'ws-test', cwd: tmpDir });
-
-    await fileDb.insertRun(makeRunRow(runId, config));
-    await fileDb.insertStep(makeStepRow(runId, 'step-a', 'Do step A', [], 'failed'));
-    await fileDb.insertStep(makeStepRow(runId, 'step-b', 'Do step B', ['step-a'], 'pending'));
-    await fileDb.insertStep(makeStepRow(runId, 'step-c', 'Do step C', ['step-b'], 'pending'));
-
-    writeCachedOutput(tmpDir, runId, 'step-a', 'cached-a-from-fallback');
-
-    const events: Array<{ type: string; stepName?: string }> = [];
-    dbRunner.on((event) => {
-      if ('stepName' in event) {
-        events.push({ type: event.type, stepName: event.stepName });
-      }
-    });
-
-    const run = await dbRunner.resume(runId);
-    expect(run.status, run.error).toBe('completed');
-
-    const startedSteps = events.filter((e) => e.type === 'step:started').map((e) => e.stepName);
-    expect(startedSteps).toContain('step-a');
-    expect(startedSteps).toContain('step-b');
-    expect(startedSteps).toContain('step-c');
-  });
-
-  it('should handle empty step-output directory gracefully', async () => {
-    const runId = 'resume-empty-cache';
-    const config = makeResumeConfig();
-    mkdirSync(path.join(tmpDir, '.agent-relay', 'step-outputs', runId), { recursive: true });
-
-    const events: Array<{ type: string; stepName?: string }> = [];
-    runner.on((event) => {
-      if ('stepName' in event) {
-        events.push({ type: event.type, stepName: event.stepName });
-      }
-    });
-
-    const run = await (runner as any).resume(runId, undefined, config);
-    expect(run.status, run.error).toBe('completed');
-
-    const startedSteps = events.filter((e) => e.type === 'step:started').map((e) => e.stepName);
-    expect(startedSteps).toContain('step-a');
-    expect(startedSteps).toContain('step-b');
-    expect(startedSteps).toContain('step-c');
-  });
-
-  it('should load cached output into step template variables', async () => {
-    const runId = 'resume-template-cache';
-    const config = makeTemplateConfig();
-    writeCachedOutput(tmpDir, runId, 'step-a', 'hello world');
-
-    const run = await (runner as any).resume(runId, undefined, config);
-    expect(run.status, run.error).toBe('completed');
-
-    const spawnedTasks = mockRelayInstance.spawnPty.mock.calls.map(
-      ([args]) => (args as { task?: string }).task ?? ''
-    );
-    expect(spawnedTasks.some((task) => task.includes('Use cached value: hello world'))).toBe(true);
-  });
-
-  it('should skip .report.json files when scanning step outputs', async () => {
-    const runId = 'resume-report-cache';
-    const config = makeResumeConfig();
-    const outputDir = path.join(tmpDir, '.agent-relay', 'step-outputs', runId);
-    mkdirSync(outputDir, { recursive: true });
-    writeFileSync(path.join(outputDir, 'step-a.md'), 'cached-a');
-    writeFileSync(path.join(outputDir, 'step-a.report.json'), '{"summary":"done"}');
-    writeFileSync(path.join(outputDir, 'step-b.report.json'), '{"summary":"metadata only"}');
-
-    const events: Array<{ type: string; stepName?: string }> = [];
-    runner.on((event) => {
-      if ('stepName' in event) {
-        events.push({ type: event.type, stepName: event.stepName });
-      }
-    });
-
-    const run = await (runner as any).resume(runId, undefined, config);
-    expect(run.status, run.error).toBe('completed');
-
-    const startedSteps = events.filter((e) => e.type === 'step:started').map((e) => e.stepName);
-    expect(startedSteps).not.toContain('step-a');
-    expect(startedSteps).toContain('step-b');
-    expect(startedSteps).toContain('step-c');
-  });
-});
-
-describe('file-db append diagnostics', () => {
-  let tmpDir: string;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    tmpDir = mkdtempSync(path.join(os.tmpdir(), 'file-db-warn-'));
-  });
-
-  afterEach(() => {
-    try {
-      chmodSync(path.join(tmpDir, 'readonly'), 0o755);
-    } catch {
-      /* noop */
-    }
-    try {
-      rmSync(tmpDir, { recursive: true, force: true });
-    } catch {
-      /* noop */
-    }
-  });
-
-  it('should warn once when append fails', async () => {
-    const readonlyDir = path.join(tmpDir, 'readonly');
-    mkdirSync(readonlyDir, { recursive: true });
-    chmodSync(readonlyDir, 0o555);
-
-    const dbPath = path.join(readonlyDir, 'workflow-runs.jsonl');
-    const fileDb = new JsonFileWorkflowDb(dbPath);
-    const warnSpy = vi.spyOn(console, 'warn').mockImplementation(() => {});
-    const config = makeResumeConfig();
-
-    await fileDb.insertRun(makeRunRow('warn-run-1', config));
-    await fileDb.insertRun(makeRunRow('warn-run-2', config));
-
-    expect(warnSpy).toHaveBeenCalledTimes(1);
-
-    warnSpy.mockRestore();
-  });
-});
diff --git a/packages/sdk/src/__tests__/start-from.test.ts b/packages/sdk/src/__tests__/start-from.test.ts
deleted file mode 100644
index 657ff327d..000000000
--- a/packages/sdk/src/__tests__/start-from.test.ts
+++ /dev/null
@@ -1,357 +0,0 @@
-/**
- * Tests for the startFrom workflow execution feature.
- *
- * Validates that callers can start a workflow from a specific step,
- * skipping all predecessor steps and loading cached outputs when available.
- */
-
-import { afterEach, describe, it, expect, vi, beforeEach } from 'vitest';
-import { existsSync, mkdirSync, mkdtempSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import type { WorkflowDb } from '../workflows/runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../workflows/types.js';
-
-// ── Mock fetch ───────────────────────────────────────────────────────────────
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_live_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-// ── Mock RelayCast SDK ───────────────────────────────────────────────────────
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: {
-    register: vi.fn().mockResolvedValue({ token: 'token-1' }),
-  },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-class MockRelayError extends Error {
-  code: string;
-  constructor(code: string, message: string, status = 400) {
-    super(message);
-    this.code = code;
-    this.name = 'RelayError';
-    (this as any).status = status;
-  }
-}
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: MockRelayError,
-}));
-
-// ── Mock AgentRelay ──────────────────────────────────────────────────────────
-
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-
-const mockAgent = {
-  name: 'test-agent-abc',
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return vi.fn().mockImplementation(() => new Promise(() => {}));
-  },
-  release: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-// Listener registry for the AgentRelay mock — production AgentRelay uses
-// addListener('eventName', handler). Tests fire events via emitRelayEvent.
-const relayListeners = new Map<string, Set<(...args: unknown[]) => void>>();
-function emitRelayEvent(event: string, payload: unknown): void {
-  for (const handler of relayListeners.get(event) ?? []) {
-    handler(payload);
-  }
-}
-
-const mockRelayInstance = {
-  spawnPty: vi.fn().mockImplementation(async ({ name, task }: { name: string; task?: string }) => {
-    const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-    const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-    const output = isReview
-      ? 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n'
-      : stepComplete
-        ? `STEP_COMPLETE:${stepComplete}\n`
-        : 'STEP_COMPLETE:unknown\n';
-
-    queueMicrotask(() => emitRelayEvent('workerOutput', { name, chunk: output }));
-
-    return { ...mockAgent, name };
-  }),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  addListener: vi.fn((event: string, handler: (...args: unknown[]) => void) => {
-    let set = relayListeners.get(event);
-    if (!set) {
-      set = new Set();
-      relayListeners.set(event, set);
-    }
-    set.add(handler);
-    return () => set!.delete(handler);
-  }),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-};
-
-vi.mock('../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-// Import after mocking
-const { WorkflowRunner } = await import('../workflows/runner.js');
-const { workflow } = await import('../workflows/builder.js');
-
-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((s) => s.runId === runId);
-    }),
-  };
-}
-
-function makeLinearConfig(): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-start-from',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'agent-a', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-1', agent: 'agent-a', task: 'Do step 1' },
-          { name: 'step-2', agent: 'agent-a', task: 'Do step 2', dependsOn: ['step-1'] },
-          { name: 'step-3', agent: 'agent-a', task: 'Do step 3', dependsOn: ['step-2'] },
-        ],
-      },
-    ],
-    trajectories: false,
-  };
-}
-
-function makeDiamondConfig(): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-diamond',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'agent-a', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'root', agent: 'agent-a', task: 'Root step' },
-          { name: 'left', agent: 'agent-a', task: 'Left branch', dependsOn: ['root'] },
-          { name: 'right', agent: 'agent-a', task: 'Right branch', dependsOn: ['root'] },
-          { name: 'merge', agent: 'agent-a', task: 'Merge', dependsOn: ['left', 'right'] },
-        ],
-      },
-    ],
-    trajectories: false,
-  };
-}
-
-// ── Tests ────────────────────────────────────────────────────────────────────
-
-describe('startFrom', () => {
-  let db: WorkflowDb;
-  let runner: InstanceType<typeof WorkflowRunner>;
-  let tmpDir: string;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    waitForExitFn = vi.fn().mockResolvedValue('exited');
-    relayListeners.clear();
-    tmpDir = mkdtempSync(path.join(os.tmpdir(), 'start-from-'));
-    db = makeDb();
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test', cwd: tmpDir });
-  });
-
-  it('should throw when startFrom step does not exist', async () => {
-    const config = makeLinearConfig();
-    await expect(runner.execute(config, 'default', undefined, { startFrom: 'nonexistent' })).rejects.toThrow(
-      'startFrom step "nonexistent" not found in workflow'
-    );
-  });
-
-  it('should skip predecessor steps in a linear chain', async () => {
-    const config = makeLinearConfig();
-    const events: Array<{ type: string; stepName?: string }> = [];
-    runner.on((event) => {
-      if ('stepName' in event) {
-        events.push({ type: event.type, stepName: event.stepName });
-      }
-    });
-
-    const run = await runner.execute(config, 'default', undefined, { startFrom: 'step-3' });
-    expect(run.status, run.error).toBe('completed');
-
-    // step-1 and step-2 should NOT have step:started events (they were pre-completed)
-    const startedSteps = events.filter((e) => e.type === 'step:started').map((e) => e.stepName);
-    expect(startedSteps).not.toContain('step-1');
-    expect(startedSteps).not.toContain('step-2');
-    expect(startedSteps).toContain('step-3');
-  });
-
-  it('should skip all transitive deps in a diamond DAG', async () => {
-    const config = makeDiamondConfig();
-    const events: Array<{ type: string; stepName?: string }> = [];
-    runner.on((event) => {
-      if ('stepName' in event) {
-        events.push({ type: event.type, stepName: event.stepName });
-      }
-    });
-
-    const run = await runner.execute(config, 'default', undefined, { startFrom: 'merge' });
-    expect(run.status, run.error).toBe('completed');
-
-    const startedSteps = events.filter((e) => e.type === 'step:started').map((e) => e.stepName);
-    expect(startedSteps).not.toContain('root');
-    expect(startedSteps).not.toContain('left');
-    expect(startedSteps).not.toContain('right');
-    expect(startedSteps).toContain('merge');
-  });
-
-  it('should load cached output from disk for skipped steps', async () => {
-    const config = makeLinearConfig();
-
-    // Pre-create cached output for step-1 (simulating a prior run)
-    // We need to intercept the runId to write to the correct path.
-    // Instead, we'll verify updateStep was called with expected output.
-    const run = await runner.execute(config, 'default', undefined, { startFrom: 'step-2' });
-    expect(run.status, run.error).toBe('completed');
-
-    // step-1 should have been marked completed with empty string (no cached output)
-    const updateCalls = (db.updateStep as any).mock.calls as Array<[string, Partial<WorkflowStepRow>]>;
-    const step1Completion = updateCalls.find(
-      ([_, patch]) => patch.status === 'completed' && patch.output === ''
-    );
-    expect(step1Completion).toBeDefined();
-  });
-
-  it('should load cached output when available on disk via previousRunId', async () => {
-    const config = makeLinearConfig();
-
-    // Write cached output for step-1 under a known previous run ID
-    const prevRunId = 'prev-run-abc123';
-    const outputDir = path.join(tmpDir, '.agent-relay', 'step-outputs', prevRunId);
-    mkdirSync(outputDir, { recursive: true });
-    writeFileSync(path.join(outputDir, 'step-1.md'), 'cached-output-from-step-1');
-
-    const run = await runner.execute(config, 'default', undefined, {
-      startFrom: 'step-2',
-      previousRunId: prevRunId,
-    });
-    expect(run.status, run.error).toBe('completed');
-
-    // Verify step-1 was marked completed with the cached output
-    const updateCalls = (db.updateStep as any).mock.calls as Array<[string, Partial<WorkflowStepRow>]>;
-    const step1WithCachedOutput = updateCalls.find(
-      ([_, patch]) => patch.status === 'completed' && patch.output === 'cached-output-from-step-1'
-    );
-    expect(step1WithCachedOutput).toBeDefined();
-  });
-
-  it('should work when startFrom targets the first step (no deps to skip)', async () => {
-    const config = makeLinearConfig();
-    const events: Array<{ type: string; stepName?: string }> = [];
-    runner.on((event) => {
-      if ('stepName' in event) {
-        events.push({ type: event.type, stepName: event.stepName });
-      }
-    });
-
-    const run = await runner.execute(config, 'default', undefined, { startFrom: 'step-1' });
-    expect(run.status, run.error).toBe('completed');
-
-    // All 3 steps should start since step-1 has no deps
-    const startedSteps = events.filter((e) => e.type === 'step:started').map((e) => e.stepName);
-    expect(startedSteps).toContain('step-1');
-    expect(startedSteps).toContain('step-2');
-    expect(startedSteps).toContain('step-3');
-  });
-
-  it('should work with builder .startFrom() chainable method', () => {
-    const config = workflow('test')
-      .agent('worker', { cli: 'claude' })
-      .step('build', { agent: 'worker', task: 'Build' })
-      .step('test', { agent: 'worker', task: 'Test', dependsOn: ['build'] })
-      .step('deploy', { agent: 'worker', task: 'Deploy', dependsOn: ['test'] })
-      .startFrom('deploy')
-      .toConfig();
-
-    // toConfig() should still produce valid config — startFrom is a runtime option
-    expect(config.workflows![0].steps).toHaveLength(3);
-    expect(config.agents).toHaveLength(1);
-  });
-
-  it('should pass startFrom from WorkflowRunOptions', async () => {
-    const config = makeLinearConfig();
-    const events: Array<{ type: string; stepName?: string }> = [];
-
-    // Test via runner.execute directly with options
-    runner.on((event) => {
-      if ('stepName' in event) {
-        events.push({ type: event.type, stepName: event.stepName });
-      }
-    });
-
-    const run = await runner.execute(config, 'default', undefined, { startFrom: 'step-2' });
-    expect(run.status, run.error).toBe('completed');
-
-    const startedSteps = events.filter((e) => e.type === 'step:started').map((e) => e.stepName);
-    expect(startedSteps).not.toContain('step-1');
-    expect(startedSteps).toContain('step-2');
-    expect(startedSteps).toContain('step-3');
-  });
-
-  afterEach(() => {
-    try {
-      rmSync(tmpDir, { recursive: true, force: true });
-    } catch {
-      /* noop */
-    }
-  });
-});
diff --git a/packages/sdk/src/__tests__/swarm-coordinator.test.ts b/packages/sdk/src/__tests__/swarm-coordinator.test.ts
deleted file mode 100644
index b066524ba..000000000
--- a/packages/sdk/src/__tests__/swarm-coordinator.test.ts
+++ /dev/null
@@ -1,904 +0,0 @@
-/**
- * SwarmCoordinator integration tests.
- *
- * Tests pattern selection, topology resolution, run lifecycle,
- * and step management with a mocked DbClient.
- */
-
-import { describe, it, expect, vi, beforeEach } from 'vitest';
-import { SwarmCoordinator } from '../workflows/coordinator.js';
-import type { DbClient } from '../workflows/coordinator.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../workflows/types.js';
-
-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-function makeDb(): DbClient {
-  return {
-    query: vi.fn().mockResolvedValue({ rows: [] }),
-  };
-}
-
-function makeConfig(overrides: Partial<RelayYamlConfig> = {}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-workflow',
-    swarm: { pattern: 'fan-out' },
-    agents: [
-      { name: 'leader', cli: 'claude', role: 'lead' },
-      { name: 'worker-1', cli: 'claude' },
-      { name: 'worker-2', cli: 'codex' },
-    ],
-    trajectories: false,
-    ...overrides,
-  };
-}
-
-function makeRunRow(overrides: Partial<WorkflowRunRow> = {}): WorkflowRunRow {
-  const now = new Date().toISOString();
-  return {
-    id: 'run_test_1',
-    workspaceId: 'ws-1',
-    workflowName: 'test-workflow',
-    pattern: 'fan-out',
-    status: 'pending',
-    config: makeConfig(),
-    startedAt: now,
-    createdAt: now,
-    updatedAt: now,
-    ...overrides,
-  };
-}
-
-function makeStepRow(overrides: Partial<WorkflowStepRow> = {}): WorkflowStepRow {
-  const now = new Date().toISOString();
-  return {
-    id: 'step_test_1',
-    runId: 'run_test_1',
-    stepName: 'step-1',
-    agentName: 'worker-1',
-    status: 'pending',
-    task: 'Do something',
-    dependsOn: [],
-    retryCount: 0,
-    createdAt: now,
-    updatedAt: now,
-    ...overrides,
-  };
-}
-
-// ── Tests ────────────────────────────────────────────────────────────────────
-
-describe('SwarmCoordinator', () => {
-  let db: DbClient;
-  let coordinator: SwarmCoordinator;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    db = makeDb();
-    coordinator = new SwarmCoordinator(db);
-  });
-
-  // ── Pattern selection ──────────────────────────────────────────────────
-
-  describe('selectPattern', () => {
-    it('should return explicit pattern from config', () => {
-      expect(coordinator.selectPattern(makeConfig({ swarm: { pattern: 'pipeline' } }))).toBe('pipeline');
-    });
-
-    it('should auto-select dag when steps have dependencies', () => {
-      const config = makeConfig({
-        swarm: { pattern: undefined as unknown as string } as any,
-        workflows: [
-          {
-            name: 'wf',
-            steps: [
-              { name: 's1', agent: 'worker-1', task: 'x' },
-              { name: 's2', agent: 'worker-2', task: 'y', dependsOn: ['s1'] },
-            ],
-          },
-        ],
-      });
-      // With pattern set explicitly, it returns it; with undefined it falls through heuristics
-      // Since config.swarm.pattern is undefined (truthy check fails), heuristics kick in
-      config.swarm.pattern = '' as any;
-      const pattern = coordinator.selectPattern(config);
-      expect(pattern).toBe('dag');
-    });
-
-    it('should auto-select consensus when consensusStrategy is set', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        coordination: { consensusStrategy: 'majority' },
-      });
-      expect(coordinator.selectPattern(config)).toBe('consensus');
-    });
-
-    // ── Auto-selection heuristic tests ──────────────────────────────────
-
-    it('should auto-select map-reduce when mapper and reducer roles present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'mapper', cli: 'claude', role: 'mapper' },
-          { name: 'reducer', cli: 'claude', role: 'reducer' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('map-reduce');
-    });
-
-    it('should auto-select red-team when attacker and defender roles present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'attacker', cli: 'claude', role: 'attacker' },
-          { name: 'defender', cli: 'claude', role: 'defender' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('red-team');
-    });
-
-    it('should auto-select reflection when critic role present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'producer', cli: 'claude' },
-          { name: 'critic', cli: 'claude', role: 'critic' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('reflection');
-    });
-
-    it('should auto-select escalation when tier-N roles present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 't1', cli: 'claude', role: 'tier-1' },
-          { name: 't2', cli: 'claude', role: 'tier-2' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('escalation');
-    });
-
-    it('should auto-select auction when auctioneer role present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'auctioneer', cli: 'claude', role: 'auctioneer' },
-          { name: 'bidder', cli: 'claude' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('auction');
-    });
-
-    it('should auto-select supervisor when supervisor role present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'supervisor', cli: 'claude', role: 'supervisor' },
-          { name: 'worker', cli: 'claude' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('supervisor');
-    });
-
-    it('should auto-select verifier when verifier role present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'producer', cli: 'claude' },
-          { name: 'verifier', cli: 'claude', role: 'verifier' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('verifier');
-    });
-
-    it('should auto-select swarm when hive-mind role present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'hive', cli: 'claude', role: 'hive-mind' },
-          { name: 'drone', cli: 'claude' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('swarm');
-    });
-
-    it('should auto-select circuit-breaker when fallback role present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'primary', cli: 'claude', role: 'primary' },
-          { name: 'fallback', cli: 'claude', role: 'fallback' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('circuit-breaker');
-    });
-
-    it('should auto-select review-loop when implementer and multiple reviewers present', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'implementer', cli: 'claude', role: 'Senior developer implementing the task' },
-          { name: 'reviewer-diff', cli: 'codex', role: 'Code quality reviewer' },
-          { name: 'reviewer-arch', cli: 'claude', role: 'Architecture reviewer' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('review-loop');
-    });
-
-    it('should auto-select review-loop when agent names contain implementer and reviewer', () => {
-      const config = makeConfig({
-        swarm: { pattern: '' as any },
-        agents: [
-          { name: 'implementer', cli: 'claude' },
-          { name: 'reviewer-1', cli: 'codex' },
-          { name: 'reviewer-2', cli: 'claude' },
-        ],
-      });
-      expect(coordinator.selectPattern(config)).toBe('review-loop');
-    });
-  });
-
-  // ── Topology resolution ────────────────────────────────────────────────
-
-  describe('resolveTopology', () => {
-    it('should build fan-out topology with hub', () => {
-      const topology = coordinator.resolveTopology(makeConfig());
-      expect(topology.pattern).toBe('fan-out');
-      expect(topology.hub).toBe('leader');
-      expect(topology.edges.get('leader')).toEqual(['worker-1', 'worker-2']);
-      expect(topology.edges.get('worker-1')).toEqual(['leader']);
-    });
-
-    it('should build pipeline topology in step order', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'pipeline' },
-        workflows: [
-          {
-            name: 'wf',
-            steps: [
-              { name: 's1', agent: 'worker-1', task: 'step 1' },
-              { name: 's2', agent: 'worker-2', task: 'step 2' },
-              { name: 's3', agent: 'leader', task: 'step 3' },
-            ],
-          },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('pipeline');
-      expect(topology.pipelineOrder).toEqual(['worker-1', 'worker-2', 'leader']);
-      expect(topology.edges.get('worker-1')).toEqual(['worker-2']);
-      expect(topology.edges.get('leader')).toEqual([]);
-    });
-
-    it('should build hub-spoke topology', () => {
-      const config = makeConfig({ swarm: { pattern: 'hub-spoke' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.hub).toBe('leader');
-      expect(topology.edges.get('leader')).toContain('worker-1');
-      expect(topology.edges.get('worker-1')).toEqual(['leader']);
-    });
-
-    it('should build mesh topology for consensus', () => {
-      const config = makeConfig({ swarm: { pattern: 'consensus' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.edges.get('leader')).toContain('worker-1');
-      expect(topology.edges.get('leader')).toContain('worker-2');
-      expect(topology.edges.get('worker-1')).toContain('leader');
-    });
-
-    it('should build DAG topology from step dependencies', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'dag' },
-        workflows: [
-          {
-            name: 'wf',
-            steps: [
-              { name: 's1', agent: 'worker-1', task: 'x' },
-              { name: 's2', agent: 'worker-2', task: 'y', dependsOn: ['s1'] },
-            ],
-          },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('dag');
-      expect(topology.edges.get('worker-1')).toContain('worker-2');
-    });
-
-    it('should build hierarchical topology', () => {
-      const config = makeConfig({ swarm: { pattern: 'hierarchical' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.hub).toBe('leader');
-      expect(topology.edges.get('leader')).toContain('worker-1');
-    });
-
-    it('should build cascade topology', () => {
-      const config = makeConfig({ swarm: { pattern: 'cascade' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pipelineOrder).toEqual(['leader', 'worker-1', 'worker-2']);
-    });
-
-    // ── Additional pattern tests ────────────────────────────────────────
-
-    it('should build map-reduce topology', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'map-reduce' },
-        agents: [
-          { name: 'coordinator', cli: 'claude', role: 'lead' },
-          { name: 'mapper-1', cli: 'claude', role: 'mapper' },
-          { name: 'mapper-2', cli: 'claude', role: 'mapper' },
-          { name: 'reducer', cli: 'claude', role: 'reducer' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('map-reduce');
-      expect(topology.hub).toBe('coordinator');
-      expect(topology.edges.get('coordinator')).toContain('mapper-1');
-      expect(topology.edges.get('mapper-1')).toContain('reducer');
-      expect(topology.edges.get('reducer')).toContain('coordinator');
-    });
-
-    it('should build scatter-gather topology', () => {
-      const config = makeConfig({ swarm: { pattern: 'scatter-gather' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('scatter-gather');
-      expect(topology.hub).toBe('leader');
-      expect(topology.edges.get('leader')).toContain('worker-1');
-      expect(topology.edges.get('worker-1')).toEqual(['leader']);
-    });
-
-    it('should build supervisor topology', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'supervisor' },
-        agents: [
-          { name: 'supervisor', cli: 'claude', role: 'supervisor' },
-          { name: 'worker-1', cli: 'claude' },
-          { name: 'worker-2', cli: 'codex' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('supervisor');
-      expect(topology.hub).toBe('supervisor');
-      expect(topology.edges.get('supervisor')).toContain('worker-1');
-      expect(topology.edges.get('worker-1')).toEqual(['supervisor']);
-    });
-
-    it('should build reflection topology', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'reflection' },
-        agents: [
-          { name: 'producer', cli: 'claude' },
-          { name: 'critic', cli: 'claude', role: 'critic' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('reflection');
-      expect(topology.edges.get('producer')).toContain('critic');
-      expect(topology.edges.get('critic')).toContain('producer');
-    });
-
-    it('should build red-team topology', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'red-team' },
-        agents: [
-          { name: 'attacker', cli: 'claude', role: 'attacker' },
-          { name: 'defender', cli: 'claude', role: 'defender' },
-          { name: 'judge', cli: 'claude', role: 'judge' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('red-team');
-      expect(topology.edges.get('attacker')).toContain('defender');
-      expect(topology.edges.get('defender')).toContain('attacker');
-      expect(topology.edges.get('attacker')).toContain('judge');
-    });
-
-    it('should build verifier topology', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'verifier' },
-        agents: [
-          { name: 'producer', cli: 'claude' },
-          { name: 'verifier', cli: 'claude', role: 'verifier' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('verifier');
-      expect(topology.edges.get('producer')).toContain('verifier');
-      expect(topology.edges.get('verifier')).toContain('producer');
-    });
-
-    it('should build auction topology', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'auction' },
-        agents: [
-          { name: 'auctioneer', cli: 'claude', role: 'auctioneer' },
-          { name: 'bidder-1', cli: 'claude' },
-          { name: 'bidder-2', cli: 'codex' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('auction');
-      expect(topology.hub).toBe('auctioneer');
-      expect(topology.edges.get('auctioneer')).toContain('bidder-1');
-      expect(topology.edges.get('bidder-1')).toEqual(['auctioneer']);
-    });
-
-    it('should build escalation topology', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'escalation' },
-        agents: [
-          { name: 'tier1', cli: 'claude', role: 'tier-1' },
-          { name: 'tier2', cli: 'claude', role: 'tier-2' },
-          { name: 'tier3', cli: 'claude', role: 'tier-3' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('escalation');
-      expect(topology.pipelineOrder).toEqual(['tier1', 'tier2', 'tier3']);
-      expect(topology.edges.get('tier1')).toContain('tier2');
-      expect(topology.edges.get('tier2')).toContain('tier3');
-    });
-
-    it('should build saga topology', () => {
-      const config = makeConfig({ swarm: { pattern: 'saga' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('saga');
-      expect(topology.hub).toBe('leader');
-      expect(topology.edges.get('leader')).toContain('worker-1');
-      expect(topology.edges.get('worker-1')).toEqual(['leader']);
-    });
-
-    it('should build circuit-breaker topology', () => {
-      const config = makeConfig({ swarm: { pattern: 'circuit-breaker' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('circuit-breaker');
-      expect(topology.pipelineOrder).toEqual(['leader', 'worker-1', 'worker-2']);
-      expect(topology.edges.get('leader')).toEqual(['worker-1']);
-      expect(topology.edges.get('worker-2')).toEqual([]);
-    });
-
-    it('should build blackboard topology', () => {
-      const config = makeConfig({ swarm: { pattern: 'blackboard' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('blackboard');
-      // Full mesh for blackboard
-      expect(topology.edges.get('leader')).toContain('worker-1');
-      expect(topology.edges.get('worker-1')).toContain('leader');
-    });
-
-    it('should build swarm topology with neighbor communication', () => {
-      const config = makeConfig({ swarm: { pattern: 'swarm' } });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('swarm');
-      // Middle agent should have two neighbors
-      expect(topology.edges.get('worker-1')).toContain('leader');
-      expect(topology.edges.get('worker-1')).toContain('worker-2');
-    });
-
-    // ── Edge case tests ─────────────────────────────────────────────────
-
-    it('should handle map-reduce with no reducers (fallback to coordinator)', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'map-reduce' },
-        agents: [
-          { name: 'coordinator', cli: 'claude', role: 'lead' },
-          { name: 'mapper-1', cli: 'claude', role: 'mapper' },
-          { name: 'mapper-2', cli: 'claude', role: 'mapper' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('map-reduce');
-      // Mappers should fallback to coordinator when no reducers
-      expect(topology.edges.get('mapper-1')).toContain('coordinator');
-    });
-
-    it('should handle verifier with no verifiers (empty edges)', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'verifier' },
-        agents: [
-          { name: 'producer-1', cli: 'claude' },
-          { name: 'producer-2', cli: 'claude' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('verifier');
-      // Producers have no one to send to
-      expect(topology.edges.get('producer-1')).toEqual([]);
-    });
-
-    it('should handle escalation with no tier roles (use agent order)', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'escalation' },
-        agents: [
-          { name: 'agent-1', cli: 'claude' },
-          { name: 'agent-2', cli: 'claude' },
-          { name: 'agent-3', cli: 'claude' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('escalation');
-      expect(topology.pipelineOrder).toEqual(['agent-1', 'agent-2', 'agent-3']);
-    });
-
-    it('should handle reflection with no critic (fallback to mesh)', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'reflection' },
-        agents: [
-          { name: 'agent-1', cli: 'claude' },
-          { name: 'agent-2', cli: 'claude' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('reflection');
-      // Falls back to full mesh when no critic
-      expect(topology.edges.get('agent-1')).toContain('agent-2');
-      expect(topology.edges.get('agent-2')).toContain('agent-1');
-    });
-
-    it('should handle swarm with hive-mind role', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'swarm' },
-        agents: [
-          { name: 'hive', cli: 'claude', role: 'hive-mind' },
-          { name: 'drone-1', cli: 'claude' },
-          { name: 'drone-2', cli: 'claude' },
-          { name: 'drone-3', cli: 'claude' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('swarm');
-      expect(topology.hub).toBe('hive');
-      // All drones should connect to hive mind
-      expect(topology.edges.get('drone-1')).toContain('hive');
-      expect(topology.edges.get('drone-2')).toContain('hive');
-    });
-
-    it('should exclude non-interactive agents from message edges', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'fan-out' },
-        agents: [
-          { name: 'leader', cli: 'claude', role: 'lead' },
-          { name: 'worker-1', cli: 'codex', interactive: false },
-          { name: 'worker-2', cli: 'claude' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('fan-out');
-      // leader should only message worker-2 (not worker-1 which is non-interactive)
-      expect(topology.edges.get('leader')).toEqual(['worker-2']);
-      // worker-1 should have empty edges (non-interactive)
-      expect(topology.edges.get('worker-1')).toEqual([]);
-      // worker-2 should only message leader
-      expect(topology.edges.get('worker-2')).toEqual(['leader']);
-      // All agents should still be in the topology
-      expect(topology.agents).toHaveLength(3);
-    });
-
-    it('should exclude non-interactive agents from DAG topology edges', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'dag' },
-        agents: [
-          { name: 'leader', cli: 'claude', role: 'lead' },
-          { name: 'worker-1', cli: 'codex', interactive: false },
-          { name: 'worker-2', cli: 'claude' },
-        ],
-        workflows: [
-          {
-            name: 'wf',
-            steps: [
-              { name: 's1', agent: 'worker-1', task: 'x' },
-              { name: 's2', agent: 'worker-2', task: 'y', dependsOn: ['s1'] },
-              { name: 's3', agent: 'leader', task: 'z', dependsOn: ['s2'] },
-            ],
-          },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('dag');
-      // worker-1 is non-interactive — should have empty edges even though s2 depends on s1
-      expect(topology.edges.get('worker-1')).toEqual([]);
-      // worker-2 should NOT have worker-1 as a target (non-interactive)
-      const worker2Targets = topology.edges.get('worker-2') ?? [];
-      expect(worker2Targets).not.toContain('worker-1');
-      // worker-2 should still point to leader
-      expect(worker2Targets).toContain('leader');
-    });
-
-    it('should handle all non-interactive agents gracefully', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'fan-out' },
-        agents: [
-          { name: 'leader', cli: 'claude', role: 'lead' },
-          { name: 'worker-1', cli: 'codex', interactive: false },
-          { name: 'worker-2', cli: 'codex', interactive: false },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      // leader is the only interactive agent, so it fans out to no one
-      expect(topology.edges.get('leader')).toEqual([]);
-      expect(topology.edges.get('worker-1')).toEqual([]);
-      expect(topology.edges.get('worker-2')).toEqual([]);
-    });
-
-    it('should handle red-team with multiple attackers and defenders', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'red-team' },
-        agents: [
-          { name: 'attacker-1', cli: 'claude', role: 'attacker' },
-          { name: 'attacker-2', cli: 'claude', role: 'attacker' },
-          { name: 'defender-1', cli: 'claude', role: 'defender' },
-          { name: 'defender-2', cli: 'claude', role: 'defender' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('red-team');
-      // Attackers should reach all defenders
-      expect(topology.edges.get('attacker-1')).toContain('defender-1');
-      expect(topology.edges.get('attacker-1')).toContain('defender-2');
-      // Defenders should reach all attackers
-      expect(topology.edges.get('defender-1')).toContain('attacker-1');
-      expect(topology.edges.get('defender-1')).toContain('attacker-2');
-    });
-
-    it('should build review-loop topology with implementer as hub and reviewer collaboration', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'review-loop' },
-        agents: [
-          { name: 'implementer', cli: 'claude', role: 'Senior developer implementing the task' },
-          { name: 'reviewer-diff', cli: 'codex', role: 'Code quality reviewer' },
-          { name: 'reviewer-arch', cli: 'claude', role: 'Architecture reviewer' },
-          { name: 'reviewer-security', cli: 'codex', role: 'Security reviewer' },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('review-loop');
-      expect(topology.hub).toBe('implementer');
-      // Implementer can message all reviewers
-      expect(topology.edges.get('implementer')).toContain('reviewer-diff');
-      expect(topology.edges.get('implementer')).toContain('reviewer-arch');
-      expect(topology.edges.get('implementer')).toContain('reviewer-security');
-      // Reviewers can message implementer AND other reviewers (collaborative review)
-      expect(topology.edges.get('reviewer-diff')).toContain('implementer');
-      expect(topology.edges.get('reviewer-diff')).toContain('reviewer-arch');
-      expect(topology.edges.get('reviewer-diff')).toContain('reviewer-security');
-      expect(topology.edges.get('reviewer-arch')).toContain('implementer');
-      expect(topology.edges.get('reviewer-arch')).toContain('reviewer-diff');
-      expect(topology.edges.get('reviewer-security')).toContain('implementer');
-      expect(topology.edges.get('reviewer-security')).toContain('reviewer-diff');
-    });
-
-    it('should build review-loop topology with non-interactive reviewers', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'review-loop' },
-        agents: [
-          { name: 'implementer', cli: 'claude', role: 'Senior developer implementing the task' },
-          { name: 'reviewer-diff', cli: 'codex', role: 'Code quality reviewer', interactive: false },
-          { name: 'reviewer-arch', cli: 'claude', role: 'Architecture reviewer', interactive: false },
-        ],
-      });
-      const topology = coordinator.resolveTopology(config);
-      expect(topology.pattern).toBe('review-loop');
-      expect(topology.hub).toBe('implementer');
-      // Non-interactive reviewers have empty edges
-      expect(topology.edges.get('reviewer-diff')).toEqual([]);
-      expect(topology.edges.get('reviewer-arch')).toEqual([]);
-      // Implementer should not have non-interactive agents in edges
-      expect(topology.edges.get('implementer')).toEqual([]);
-    });
-  });
-
-  // ── Run lifecycle ──────────────────────────────────────────────────────
-
-  describe('createRun', () => {
-    it('should insert a run and emit run:created', async () => {
-      const run = makeRunRow();
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [run] });
-
-      const spy = vi.fn();
-      coordinator.on('run:created', spy);
-
-      const result = await coordinator.createRun('ws-1', makeConfig());
-      expect(result).toEqual(run);
-      expect(spy).toHaveBeenCalledWith(run);
-      expect(db.query).toHaveBeenCalledOnce();
-    });
-  });
-
-  describe('startRun', () => {
-    it('should transition pending run to running', async () => {
-      const run = makeRunRow({ status: 'running' });
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [run] });
-
-      const spy = vi.fn();
-      coordinator.on('run:started', spy);
-
-      const result = await coordinator.startRun('run_test_1');
-      expect(result.status).toBe('running');
-      expect(spy).toHaveBeenCalledWith(run);
-    });
-
-    it('should throw when run not found', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.startRun('nonexistent')).rejects.toThrow('not found or not in pending state');
-    });
-  });
-
-  describe('completeRun', () => {
-    it('should transition run to completed and emit event', async () => {
-      const run = makeRunRow({ status: 'completed' });
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [run] });
-
-      const spy = vi.fn();
-      coordinator.on('run:completed', spy);
-
-      const result = await coordinator.completeRun('run_test_1', { result: 'ok' });
-      expect(result.status).toBe('completed');
-      expect(spy).toHaveBeenCalledWith(run);
-    });
-
-    it('should throw when run not found', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.completeRun('nonexistent')).rejects.toThrow('not found');
-    });
-  });
-
-  describe('failRun', () => {
-    it('should transition run to failed with error', async () => {
-      const run = makeRunRow({ status: 'failed', error: 'boom' });
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [run] });
-
-      const spy = vi.fn();
-      coordinator.on('run:failed', spy);
-
-      await coordinator.failRun('run_test_1', 'boom');
-      expect(spy).toHaveBeenCalledWith(run);
-    });
-  });
-
-  describe('cancelRun', () => {
-    it('should transition run to cancelled', async () => {
-      const run = makeRunRow({ status: 'cancelled' });
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [run] });
-
-      const spy = vi.fn();
-      coordinator.on('run:cancelled', spy);
-
-      const result = await coordinator.cancelRun('run_test_1');
-      expect(result.status).toBe('cancelled');
-    });
-  });
-
-  // ── Step management ────────────────────────────────────────────────────
-
-  describe('createSteps', () => {
-    it('should create steps from workflow config', async () => {
-      const step = makeStepRow();
-      vi.mocked(db.query).mockResolvedValue({ rows: [step] });
-
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'wf',
-            steps: [
-              { name: 's1', agent: 'worker-1', task: 'x' },
-              { name: 's2', agent: 'worker-2', task: 'y' },
-            ],
-          },
-        ],
-      });
-
-      const steps = await coordinator.createSteps('run_1', config);
-      expect(steps).toHaveLength(2);
-      expect(db.query).toHaveBeenCalledTimes(2);
-    });
-  });
-
-  describe('startStep', () => {
-    it('should transition step to running and emit event', async () => {
-      const step = makeStepRow({ status: 'running' });
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [step] });
-
-      const spy = vi.fn();
-      coordinator.on('step:started', spy);
-
-      const result = await coordinator.startStep('step_1');
-      expect(result.status).toBe('running');
-      expect(spy).toHaveBeenCalledWith(step);
-    });
-
-    it('should throw for non-pending step', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await expect(coordinator.startStep('bad')).rejects.toThrow('not found or not in pending state');
-    });
-  });
-
-  describe('completeStep', () => {
-    it('should transition step to completed with output', async () => {
-      const step = makeStepRow({ status: 'completed', output: 'result data' });
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [step] });
-
-      const spy = vi.fn();
-      coordinator.on('step:completed', spy);
-
-      const result = await coordinator.completeStep('step_1', 'result data');
-      expect(result.output).toBe('result data');
-      expect(spy).toHaveBeenCalledWith(step);
-    });
-  });
-
-  describe('failStep', () => {
-    it('should transition step to failed with error', async () => {
-      const step = makeStepRow({ status: 'failed', error: 'timeout' });
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [step] });
-
-      const spy = vi.fn();
-      coordinator.on('step:failed', spy);
-
-      const result = await coordinator.failStep('step_1', 'timeout');
-      expect(result.error).toBe('timeout');
-    });
-  });
-
-  describe('skipStep', () => {
-    it('should mark step as skipped', async () => {
-      const step = makeStepRow({ status: 'skipped' });
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [step] });
-
-      const result = await coordinator.skipStep('step_1');
-      expect(result.status).toBe('skipped');
-    });
-  });
-
-  // ── Queries ────────────────────────────────────────────────────────────
-
-  describe('getRun', () => {
-    it('should return run or null', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      expect(await coordinator.getRun('nonexistent')).toBeNull();
-
-      const run = makeRunRow();
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [run] });
-      expect(await coordinator.getRun('run_test_1')).toEqual(run);
-    });
-  });
-
-  describe('getReadySteps', () => {
-    it('should return pending steps with all dependencies completed', async () => {
-      const steps: WorkflowStepRow[] = [
-        makeStepRow({ id: 's1', stepName: 'step-1', status: 'completed', dependsOn: [] }),
-        makeStepRow({ id: 's2', stepName: 'step-2', status: 'pending', dependsOn: ['step-1'] }),
-        makeStepRow({ id: 's3', stepName: 'step-3', status: 'pending', dependsOn: ['step-2'] }),
-      ];
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: steps });
-
-      const ready = await coordinator.getReadySteps('run_test_1');
-      expect(ready).toHaveLength(1);
-      expect(ready[0].stepName).toBe('step-2');
-    });
-
-    it('should return all pending steps with no dependencies', async () => {
-      const steps: WorkflowStepRow[] = [
-        makeStepRow({ id: 's1', stepName: 'a', status: 'pending', dependsOn: [] }),
-        makeStepRow({ id: 's2', stepName: 'b', status: 'pending', dependsOn: [] }),
-      ];
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: steps });
-
-      const ready = await coordinator.getReadySteps('run_test_1');
-      expect(ready).toHaveLength(2);
-    });
-  });
-
-  describe('getRunsByWorkspace', () => {
-    it('should query by workspace with optional status filter', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await coordinator.getRunsByWorkspace('ws-1', 'running');
-      expect(db.query).toHaveBeenCalledWith(expect.stringContaining('status = $2'), ['ws-1', 'running']);
-    });
-
-    it('should query without status filter', async () => {
-      vi.mocked(db.query).mockResolvedValueOnce({ rows: [] });
-      await coordinator.getRunsByWorkspace('ws-1');
-      expect(db.query).toHaveBeenCalledWith(expect.not.stringContaining('status ='), ['ws-1']);
-    });
-  });
-});
diff --git a/packages/sdk/src/__tests__/workflow-runner.test.ts b/packages/sdk/src/__tests__/workflow-runner.test.ts
deleted file mode 100644
index 4444fb7d8..000000000
--- a/packages/sdk/src/__tests__/workflow-runner.test.ts
+++ /dev/null
@@ -1,1344 +0,0 @@
-/**
- * WorkflowRunner integration tests.
- *
- * Tests parsing, validation, variable resolution, and DAG execution
- * with a mocked DB adapter and mocked AgentRelay.
- */
-
-import { describe, it, expect, vi, beforeEach } from 'vitest';
-import {
-  existsSync,
-  mkdirSync,
-  mkdtempSync,
-  readFileSync,
-  readdirSync,
-  rmSync,
-  writeFileSync,
-} from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import type { WorkflowDb } from '../workflows/runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../workflows/types.js';
-
-// ── Mock fetch to prevent real HTTP calls (Relaycast provisioning) ───────────
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_live_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-// ── Mock RelayCast SDK ───────────────────────────────────────────────────────
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: {
-    register: vi.fn().mockResolvedValue({ token: 'token-1' }),
-  },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-class MockRelayError extends Error {
-  code: string;
-  constructor(code: string, message: string, status = 400) {
-    super(message);
-    this.code = code;
-    this.name = 'RelayError';
-    (this as any).status = status;
-  }
-}
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: MockRelayError,
-}));
-
-// ── Mock AgentRelay ──────────────────────────────────────────────────────────
-
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-let waitForIdleFn: (ms?: number) => Promise<'idle' | 'timeout' | 'exited'>;
-let mockSpawnOutputs: string[] = [];
-
-const mockAgent = {
-  name: 'test-agent-abc',
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return waitForIdleFn;
-  },
-  release: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockListeners = new Map<string, Set<(...args: any[]) => void>>();
-function emitMockEvent(event: string, ...args: any[]): void {
-  const set = mockListeners.get(event);
-  if (set) for (const cb of set) cb(...args);
-}
-
-const defaultSpawnPtyImplementation = async ({ name, task }: { name: string; task?: string }) => {
-  const queued = mockSpawnOutputs.shift();
-  const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-  const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-  const output =
-    queued ??
-    (isReview
-      ? 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n'
-      : stepComplete
-        ? `STEP_COMPLETE:${stepComplete}\n`
-        : 'STEP_COMPLETE:unknown\n');
-
-  queueMicrotask(() => {
-    emitMockEvent('workerOutput', { name, chunk: output });
-  });
-
-  return { ...mockAgent, name };
-};
-
-const mockRelayInstance = {
-  spawnPty: vi.fn().mockImplementation(defaultSpawnPtyImplementation),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  addListener: vi.fn((event: string, cb: (...args: any[]) => void) => {
-    let set = mockListeners.get(event);
-    if (!set) {
-      set = new Set();
-      mockListeners.set(event, set);
-    }
-    set.add(cb);
-    return () => set!.delete(cb);
-  }),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-};
-
-vi.mock('../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-// Import after mocking
-const { WorkflowRunner } = await import('../workflows/runner.js');
-
-// ── Test fixtures ────────────────────────────────────────────────────────────
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((s) => s.runId === runId);
-    }),
-  };
-}
-
-function makeConfig(overrides: Partial<RelayYamlConfig> = {}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-workflow',
-    swarm: { pattern: 'dag' },
-    agents: [
-      { name: 'agent-a', cli: 'claude' },
-      { name: 'agent-b', cli: 'claude' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-1', agent: 'agent-a', task: 'Do step 1' },
-          { name: 'step-2', agent: 'agent-b', task: 'Do step 2', dependsOn: ['step-1'] },
-        ],
-      },
-    ],
-    trajectories: false,
-    ...overrides,
-  };
-}
-
-function never<T>(): Promise<T> {
-  return new Promise(() => {});
-}
-
-type WorkflowStepOverride = Partial<NonNullable<RelayYamlConfig['workflows']>[number]['steps'][number]>;
-
-function makeSupervisedConfig(stepOverrides: WorkflowStepOverride = {}): RelayYamlConfig {
-  return makeConfig({
-    swarm: { pattern: 'hub-spoke' },
-    agents: [
-      { name: 'specialist', cli: 'claude', role: 'engineer' },
-      { name: 'team-lead', cli: 'claude', role: 'lead coordinator' },
-      { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'step-1',
-            agent: 'specialist',
-            task: 'Implement the requested change',
-            ...stepOverrides,
-          },
-        ],
-      },
-    ],
-  });
-}
-
-function readCompletedTrajectoryFile(dir: string): any {
-  const completedDir = path.join(dir, '.trajectories', 'completed');
-  if (!existsSync(completedDir)) return null;
-
-  const jsonFile = readdirSync(completedDir).find((file) => file.endsWith('.json'));
-  if (!jsonFile) return null;
-
-  return JSON.parse(readFileSync(path.join(completedDir, jsonFile), 'utf-8'));
-}
-
-// ── Tests ────────────────────────────────────────────────────────────────────
-
-describe('WorkflowRunner', () => {
-  let db: WorkflowDb;
-  let runner: InstanceType<typeof WorkflowRunner>;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    waitForExitFn = vi.fn().mockResolvedValue('exited');
-    waitForIdleFn = vi.fn().mockImplementation(() => never());
-    mockSpawnOutputs = [];
-    mockAgent.release.mockResolvedValue(undefined);
-    mockRelayInstance.spawnPty.mockImplementation(defaultSpawnPtyImplementation);
-    mockListeners.clear();
-    db = makeDb();
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test' });
-  });
-
-  // ── Parsing & validation ───────────────────────────────────────────────
-
-  describe('parseYamlString', () => {
-    it('should parse valid YAML config', () => {
-      const yaml = `
-version: "1"
-name: test
-swarm:
-  pattern: fan-out
-agents:
-  - name: a1
-    cli: claude
-`;
-      const config = runner.parseYamlString(yaml);
-      expect(config.name).toBe('test');
-      expect(config.swarm.pattern).toBe('fan-out');
-      expect(config.agents).toHaveLength(1);
-    });
-
-    it('should throw on null YAML', () => {
-      expect(() => runner.parseYamlString('null')).toThrow('config must be a non-null object');
-    });
-
-    it('should throw on invalid YAML syntax', () => {
-      expect(() => runner.parseYamlString('not: valid: yaml: []')).toThrow();
-    });
-  });
-
-  describe('validateConfig', () => {
-    it('should accept valid config', () => {
-      expect(() => runner.validateConfig(makeConfig())).not.toThrow();
-    });
-
-    it('should reject null config', () => {
-      expect(() => runner.validateConfig(null)).toThrow('non-null object');
-    });
-
-    it('should reject missing version', () => {
-      expect(() =>
-        runner.validateConfig({
-          name: 'x',
-          swarm: { pattern: 'dag' },
-          agents: [{ name: 'a', cli: 'claude' }],
-        })
-      ).toThrow('missing required field "version"');
-    });
-
-    it('should reject missing name', () => {
-      expect(() =>
-        runner.validateConfig({
-          version: '1',
-          swarm: { pattern: 'dag' },
-          agents: [{ name: 'a', cli: 'claude' }],
-        })
-      ).toThrow('missing required field "name"');
-    });
-
-    it('should reject empty agents array', () => {
-      expect(() =>
-        runner.validateConfig({ version: '1', name: 'x', swarm: { pattern: 'dag' }, agents: [] })
-      ).not.toThrow();
-    });
-
-    it('should reject agent without cli', () => {
-      expect(() =>
-        runner.validateConfig({
-          version: '1',
-          name: 'x',
-          swarm: { pattern: 'dag' },
-          agents: [{ name: 'a' }],
-        })
-      ).toThrow('each agent must have a string "cli"');
-    });
-
-    it('should detect unknown dependencies in workflows', () => {
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'wf',
-            steps: [{ name: 's1', agent: 'agent-a', task: 'do', dependsOn: ['nonexistent'] }],
-          },
-        ],
-      });
-      expect(() => runner.validateConfig(config)).toThrow('depends on unknown step "nonexistent"');
-    });
-
-    it('should detect dependency cycles', () => {
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'wf',
-            steps: [
-              { name: 's1', agent: 'agent-a', task: 'do', dependsOn: ['s2'] },
-              { name: 's2', agent: 'agent-b', task: 'do', dependsOn: ['s1'] },
-            ],
-          },
-        ],
-      });
-      expect(() => runner.validateConfig(config)).toThrow('dependency cycle');
-    });
-  });
-
-  // ── Variable resolution ────────────────────────────────────────────────
-
-  describe('resolveVariables', () => {
-    it('should replace {{var}} in agent tasks', () => {
-      const config = makeConfig({
-        agents: [{ name: 'a', cli: 'claude', task: 'Fix bug {{bugId}}' }],
-      });
-      const resolved = runner.resolveVariables(config, { bugId: '42' });
-      expect(resolved.agents[0].task).toBe('Fix bug 42');
-    });
-
-    it('should replace {{var}} in workflow step tasks', () => {
-      const config = makeConfig();
-      config.workflows![0].steps[0].task = 'Process {{item}}';
-      const resolved = runner.resolveVariables(config, { item: 'test-item' });
-      expect(resolved.workflows![0].steps[0].task).toBe('Process test-item');
-    });
-
-    it('should throw on unresolved variables', () => {
-      const config = makeConfig({
-        agents: [{ name: 'a', cli: 'claude', task: 'Fix {{unknown}}' }],
-      });
-      expect(() => runner.resolveVariables(config, {})).toThrow('Unresolved variable: {{unknown}}');
-    });
-
-    it('should not mutate original config', () => {
-      const config = makeConfig({
-        agents: [{ name: 'a', cli: 'claude', task: 'Fix {{id}}' }],
-      });
-      runner.resolveVariables(config, { id: '1' });
-      expect(config.agents[0].task).toBe('Fix {{id}}');
-    });
-  });
-
-  // ── Execution ──────────────────────────────────────────────────────────
-
-  describe('execute', () => {
-    it('should create run and steps in DB', async () => {
-      const config = makeConfig();
-      const run = await runner.execute(config, 'default');
-
-      expect(db.insertRun).toHaveBeenCalledTimes(1);
-      expect(db.insertStep).toHaveBeenCalledTimes(2);
-      expect(run.status, run.error).toBe('completed');
-    });
-
-    it('should throw when workflow not found', async () => {
-      const config = makeConfig();
-      await expect(runner.execute(config, 'nonexistent')).rejects.toThrow('Workflow "nonexistent" not found');
-    });
-
-    it('should throw when no workflows defined', async () => {
-      const config = makeConfig({ workflows: undefined });
-      await expect(runner.execute(config)).rejects.toThrow('No workflows defined');
-    });
-
-    it('should emit run:started and run:completed events', async () => {
-      const events: string[] = [];
-      runner.on((event) => events.push(event.type));
-
-      await runner.execute(makeConfig(), 'default');
-
-      expect(events).toContain('run:started');
-      expect(events).toContain('run:completed');
-    });
-
-    it('should emit step events in order', async () => {
-      const stepEvents: Array<{ type: string; stepName?: string }> = [];
-      runner.on((event) => {
-        if (event.type.startsWith('step:')) {
-          stepEvents.push({
-            type: event.type,
-            stepName: 'stepName' in event ? event.stepName : undefined,
-          });
-        }
-      });
-
-      await runner.execute(makeConfig(), 'default');
-
-      const startedSteps = stepEvents.filter((e) => e.type === 'step:started');
-      expect(startedSteps).toHaveLength(2);
-    });
-
-    it('should emit owner assignment and review completion events for interactive steps', async () => {
-      const events: Array<{ type: string; stepName?: string }> = [];
-      runner.on((event) =>
-        events.push({ type: event.type, stepName: 'stepName' in event ? event.stepName : undefined })
-      );
-
-      await runner.execute(makeSupervisedConfig(), 'default');
-
-      const ownerAssigned = events.filter((e) => e.type === 'step:owner-assigned');
-      const reviewCompleted = events.filter((e) => e.type === 'step:review-completed');
-      expect(ownerAssigned).toHaveLength(1);
-      expect(reviewCompleted).toHaveLength(1);
-    });
-
-    it('should prioritize lead owner when multiple hub-role candidates exist', async () => {
-      const ownerAssignments: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') ownerAssignments.push(event.ownerName);
-      });
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke' },
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'coord-1', cli: 'claude', role: 'coordinator' },
-          { name: 'lead-1', cli: 'claude', role: 'lead' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'specialist', task: 'Do step 1' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments).toEqual(['lead-1']);
-    }, 15000);
-
-    it('should not treat github role text as hub owner signal', async () => {
-      const ownerAssignments: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') ownerAssignments.push(event.ownerName);
-      });
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke' },
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'github-agent', cli: 'claude', role: 'github actions agent' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'specialist', task: 'Do step 1' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments).toEqual(['specialist']);
-    });
-
-    it('should not elect github-role agent as owner (hub word-boundary)', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      const config = makeConfig({
-        swarm: { pattern: 'hub-spoke' },
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'github-bot', cli: 'claude', role: 'github integration' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'specialist', task: 'Do step 1' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      // github-bot should NOT be elected as owner (role contains "hub" substring but not word)
-      expect(ownerAssignments[0].owner).not.toBe('github-bot');
-      // specialist should be its own owner since no hub-role agent exists
-      expect(ownerAssignments[0].owner).toBe('specialist');
-    }, 15000);
-
-    it('should parse REJECT from PTY-echoed review output', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      // Simulate PTY output that echoes the review prompt before the actual response
-      const echoedPrompt =
-        'Return exactly:\nREVIEW_DECISION: APPROVE or REJECT\nREVIEW_REASON: <one sentence>\n';
-      const actualResponse = 'REVIEW_DECISION: REJECT\nREVIEW_REASON: code has bugs\n';
-      mockSpawnOutputs = ['worker finished\n', 'STEP_COMPLETE:step-1\n', echoedPrompt + actualResponse];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review rejected');
-      // Should parse REJECT from actual response, not APPROVE from echoed instruction
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    }, 15000);
-
-    it('should resolve variables during execution', async () => {
-      const config = makeConfig();
-      config.workflows![0].steps[0].task = 'Build {{feature}}';
-      const run = await runner.execute(config, 'default', { feature: 'auth' });
-      expect(run.status, run.error).toBe('completed');
-    });
-
-    it('repairs a failed deterministic gate with a workflow agent before retrying', async () => {
-      const tmpDir = mkdtempSync(path.join(os.tmpdir(), 'relay-deterministic-repair-'));
-      const stepDir = path.join(tmpDir, 'step-cwd');
-      mkdirSync(stepDir);
-      const artifactPath = path.join(stepDir, 'repaired.txt');
-      const repairAgent = vi.fn(async (step) => {
-        writeFileSync(path.join(step.cwd!, 'repaired.txt'), 'fixed\n', 'utf-8');
-        return 'wrote repaired.txt';
-      });
-      runner = new WorkflowRunner({
-        db,
-        workspaceId: 'ws-test',
-        cwd: tmpDir,
-        executor: {
-          executeAgentStep: repairAgent,
-        },
-      });
-
-      try {
-        const run = await runner.execute(
-          makeConfig({
-            errorHandling: { strategy: 'retry', repairRetries: 1, retryDelayMs: 1 },
-            agents: [{ name: 'fixer', cli: 'claude', role: 'implementation engineer' }],
-            workflows: [
-              {
-                name: 'default',
-                steps: [
-                  {
-                    name: 'verify-artifact',
-                    type: 'deterministic',
-                    cwd: 'step-cwd',
-                    command: `node -e "require('node:fs').accessSync('repaired.txt')"`,
-                  },
-                ],
-              },
-            ],
-          }),
-          'default'
-        );
-
-        expect(run.status, run.error).toBe('completed');
-        expect(repairAgent).toHaveBeenCalledTimes(1);
-        expect(repairAgent.mock.calls[0][0]).toMatchObject({ cwd: stepDir, workdir: undefined });
-        expect(repairAgent.mock.calls[0][2]).toContain('A deterministic workflow gate failed');
-        expect(repairAgent.mock.calls[0][2]).toContain('verify-artifact');
-        expect(readFileSync(artifactPath, 'utf-8')).toBe('fixed\n');
-      } finally {
-        rmSync(tmpDir, { recursive: true, force: true });
-      }
-    });
-
-    it('does not spawn deterministic repair agents unless repair retries are explicitly enabled', async () => {
-      const tmpDir = mkdtempSync(path.join(os.tmpdir(), 'relay-deterministic-no-implicit-repair-'));
-      const repairAgent = vi.fn(async () => 'unexpected repair');
-      runner = new WorkflowRunner({
-        db,
-        workspaceId: 'ws-test',
-        cwd: tmpDir,
-        executor: {
-          executeAgentStep: repairAgent,
-        },
-      });
-
-      try {
-        const run = await runner.execute(
-          makeConfig({
-            agents: [{ name: 'fixer', cli: 'claude', role: 'implementation engineer' }],
-            workflows: [
-              {
-                name: 'default',
-                steps: [
-                  {
-                    name: 'verify-artifact',
-                    type: 'deterministic',
-                    command: `node -e "require('node:fs').accessSync('missing.txt')"`,
-                  },
-                ],
-              },
-            ],
-          }),
-          'default'
-        );
-
-        expect(run.status).toBe('failed');
-        expect(repairAgent).not.toHaveBeenCalled();
-      } finally {
-        rmSync(tmpDir, { recursive: true, force: true });
-      }
-    });
-
-    it('should fail when owner response provides no decision, marker, or evidence', async () => {
-      mockSpawnOutputs = ['Owner completed work but forgot sentinel\n'];
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('owner completion decision missing');
-    });
-
-    it('should run specialist work in a separate process and mirror worker output to the channel', async () => {
-      mockSpawnOutputs = [
-        'worker progress update\nworker finished\n',
-        'Observed worker progress on the channel\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-
-      expect(run.status).toBe('completed');
-      const spawnCalls = (mockRelayInstance.spawnPty as any).mock.calls;
-      expect(spawnCalls[0][0].name).toContain('step-1-worker');
-      expect(spawnCalls[1][0].name).toContain('step-1-owner');
-      expect(spawnCalls[0][0].task).not.toContain('STEP_COMPLETE:step-1');
-      expect(spawnCalls[0][0].task).toContain('WORKER COMPLETION CONTRACT');
-      expect(spawnCalls[0][0].task).toContain('WORKER_DONE: <brief summary>');
-      expect(spawnCalls[1][0].task).toContain('You are the step owner/supervisor for step "step-1".');
-      expect(spawnCalls[1][0].task).toContain('runtime: step-1-worker');
-      expect(spawnCalls[1][0].task).toContain('LEAD_DONE: <brief summary>');
-
-      const channelMessages = (mockRelaycastAgent.send as any).mock.calls.map(
-        ([, text]: [string, string]) => text
-      );
-      expect(channelMessages.some((text: string) => text.includes('Worker `step-1-worker'))).toBe(true);
-      expect(channelMessages.some((text: string) => text.includes('worker finished'))).toBe(true);
-    });
-
-    it('should apply verification fallback for self-owned interactive steps', async () => {
-      mockSpawnOutputs = ['LEAD_DONE\n', 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: verified\n'];
-
-      const run = await runner.execute(
-        makeConfig({
-          agents: [{ name: 'team-lead', cli: 'claude', role: 'Lead coordinator' }],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'lead-step',
-                  agent: 'team-lead',
-                  task: 'Output exactly:\nLEAD_DONE\n/exit',
-                  verification: { type: 'exit_code', value: 0 },
-                },
-              ],
-            },
-          ],
-        }),
-        'default'
-      );
-
-      expect(run.status, run.error).toBe('completed');
-      const steps = await db.getStepsByRunId(run.id);
-      expect(steps[0]?.completionReason).toBe('completed_verified');
-    });
-
-    it('should keep explicit interactive workers self-owned without extra supervisor/reviewer spawns', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      mockSpawnOutputs = ['STEP_COMPLETE:worker-step\nWORKER_DONE_LOCAL\n'];
-
-      const run = await runner.execute(
-        makeConfig({
-          agents: [
-            { name: 'team-lead', cli: 'claude', role: 'Lead coordinator', preset: 'lead' },
-            { name: 'relay-worker', cli: 'codex', preset: 'worker', interactive: true },
-          ],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'worker-step',
-                  agent: 'relay-worker',
-                  task: 'Output exactly:\nWORKER_DONE_LOCAL\n/exit',
-                  verification: { type: 'output_contains', value: 'WORKER_DONE_LOCAL' },
-                },
-              ],
-            },
-          ],
-        }),
-        'default'
-      );
-
-      expect(ownerAssignments).toContainEqual({ owner: 'relay-worker', specialist: 'relay-worker' });
-      expect(run.status, run.error).toBe('completed');
-
-      const spawnCalls = (mockRelayInstance.spawnPty as any).mock.calls;
-      expect(spawnCalls).toHaveLength(1);
-      expect(spawnCalls[0][0].task).toContain('STEP OWNER CONTRACT');
-      expect(spawnCalls[0][0].name).not.toContain('-owner-');
-      expect(spawnCalls[0][0].name).not.toContain('-review-');
-    });
-
-    it('should spill oversized interactive tasks to a temp file before PTY spawn', async () => {
-      const tmpDir = mkdtempSync(path.join(os.tmpdir(), 'relay-pty-task-'));
-      const oversizedBytes = WorkflowRunner.PTY_TASK_ARG_SIZE_LIMIT + 1024;
-      let spawnedTask = '';
-      let taskFilePath = '';
-      let taskFileContents = '';
-      runner = new WorkflowRunner({ db, workspaceId: 'ws-test', cwd: tmpDir });
-
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          spawnedTask = task ?? '';
-          const match = spawnedTask.match(/TASK_FILE:(.+)\n/);
-          if (match) {
-            taskFilePath = match[1].trim();
-            taskFileContents = readFileSync(taskFilePath, 'utf-8');
-          }
-
-          const output = mockSpawnOutputs.shift() ?? 'LEAD_DONE\n';
-          queueMicrotask(() => {
-            emitMockEvent('workerOutput', { name, chunk: output });
-          });
-
-          return { ...mockAgent, name };
-        }
-      );
-
-      try {
-        mockSpawnOutputs = ['LEAD_DONE\n'];
-
-        const run = await runner.execute(
-          makeConfig({
-            agents: [{ name: 'team-lead', cli: 'claude', role: 'Lead coordinator' }],
-            workflows: [
-              {
-                name: 'default',
-                steps: [
-                  {
-                    name: 'prepare',
-                    type: 'deterministic',
-                    command: `node -e "process.stdout.write('A'.repeat(${oversizedBytes}))"`,
-                  },
-                  {
-                    name: 'lead-step',
-                    agent: 'team-lead',
-                    dependsOn: ['prepare'],
-                    task: 'Review the injected context below and then print LEAD_DONE:\n{{steps.prepare.output}}\n/exit',
-                    verification: { type: 'exit_code', value: 0 },
-                  },
-                ],
-              },
-            ],
-          }),
-          'default'
-        );
-
-        expect(run.status, run.error).toBe('completed');
-        expect(spawnedTask).toContain('TASK_FILE:');
-        expect(spawnedTask).not.toContain('{{steps.prepare.output}}');
-        expect(Buffer.byteLength(spawnedTask, 'utf8')).toBeLessThan(2048);
-        expect(taskFilePath).toBeTruthy();
-        expect(Buffer.byteLength(taskFileContents, 'utf8')).toBeGreaterThan(
-          WorkflowRunner.PTY_TASK_ARG_SIZE_LIMIT
-        );
-        expect(taskFileContents).toContain('Review the injected context below');
-        expect(existsSync(taskFilePath)).toBe(false);
-      } finally {
-        rmSync(tmpDir, { recursive: true, force: true });
-      }
-    });
-
-    it('should pass canonical bypass args to interactive codex PTY spawns', async () => {
-      mockSpawnOutputs = ['LEAD_DONE\n', 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: verified\n'];
-
-      const run = await runner.execute(
-        makeConfig({
-          agents: [{ name: 'lead', cli: 'codex', role: 'Lead coordinator' }],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'lead-step',
-                  agent: 'lead',
-                  task: 'Output exactly:\nLEAD_DONE\n/exit',
-                  verification: { type: 'exit_code', value: 0 },
-                },
-              ],
-            },
-          ],
-        }),
-        'default'
-      );
-
-      expect(run.status, run.error).toBe('completed');
-      const spawnCalls = (mockRelayInstance.spawnPty as any).mock.calls;
-      expect(spawnCalls[0][0].args).toEqual(['--dangerously-bypass-approvals-and-sandbox']);
-    });
-
-    it('should let the owner complete after checking file-based artifacts', async () => {
-      const tmpDir = mkdtempSync(path.join(os.tmpdir(), 'relay-owner-file-'));
-      const artifact = path.join(tmpDir, 'artifact.txt');
-      writeFileSync(artifact, 'done\n', 'utf-8');
-      runner = new WorkflowRunner({ db, workspaceId: 'ws-test', cwd: tmpDir });
-
-      try {
-        mockSpawnOutputs = [
-          'worker wrote artifact\n',
-          'Bash(git diff --stat)\nSTEP_COMPLETE:step-1\n',
-          'REVIEW_DECISION: APPROVE\nREVIEW_REASON: artifact verified\n',
-        ];
-
-        const run = await runner.execute(
-          makeSupervisedConfig({ verification: { type: 'file_exists', value: 'artifact.txt' } }),
-          'default'
-        );
-
-        expect(run.status).toBe('completed');
-        const ownerTask = (mockRelayInstance.spawnPty as any).mock.calls[1][0].task as string;
-        expect(ownerTask).toContain('Verification gate: confirm the file exists at "artifact.txt"');
-      } finally {
-        rmSync(tmpDir, { recursive: true, force: true });
-      }
-    });
-
-    it('should keep specialist output for chaining even when the owner signals later', async () => {
-      mockSpawnOutputs = [
-        'specialist deliverable\n',
-        'Worker already exited; artifacts look correct\nSTEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: APPROVE\nREVIEW_REASON: handoff is safe\n',
-      ];
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('completed');
-
-      const stepRows = await db.getStepsByRunId(run.id);
-      expect(stepRows[0].output).toContain('specialist deliverable');
-      expect(stepRows[0].output).not.toContain('Worker already exited; artifacts look correct');
-    });
-
-    it('should fail when review response lacks any usable decision signal', async () => {
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'I need more context before deciding.\n',
-      ];
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review response malformed');
-    });
-
-    it('should fail when review explicitly rejects step output', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({
-            type: event.type,
-            decision: event.decision,
-          });
-        }
-      });
-
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: REJECT\nREVIEW_REASON: missing checks\n',
-      ];
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review rejected');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    });
-
-    it('should parse final review decision when PTY output echoes review instructions', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({
-            type: event.type,
-            decision: event.decision,
-          });
-        }
-      });
-
-      mockSpawnOutputs = [
-        'worker finished\n',
-        'STEP_COMPLETE:step-1\n',
-        'Return exactly:\nREVIEW_DECISION: APPROVE or REJECT\nREVIEW_REASON: <one sentence>\nREVIEW_DECISION: REJECT\nREVIEW_REASON: insufficient evidence\n',
-      ];
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review rejected');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    });
-
-    it('should record review completion in trajectory with decision and reason', async () => {
-      const tmpDir = mkdtempSync(path.join(os.tmpdir(), 'relay-review-traj-'));
-      runner = new WorkflowRunner({ db, workspaceId: 'ws-test', cwd: tmpDir });
-
-      try {
-        mockSpawnOutputs = [
-          'worker finished\n',
-          'STEP_COMPLETE:step-1\n',
-          'REVIEW_DECISION: APPROVE\nREVIEW_REASON: durable review record\n',
-        ];
-
-        const config = makeSupervisedConfig();
-        config.trajectories = {};
-        const run = await runner.execute(config, 'default');
-        expect(run.status).toBe('completed');
-
-        const trajectory = readCompletedTrajectoryFile(tmpDir);
-        const events = trajectory.chapters.flatMap((chapter: any) => chapter.events);
-        const reviewEvent = events.find((event: any) => event.type === 'review-completed');
-
-        expect(reviewEvent).toBeTruthy();
-        expect(reviewEvent.raw).toMatchObject({
-          stepName: 'step-1',
-          reviewer: 'reviewer-1',
-          decision: 'approved',
-          reason: 'durable review record',
-        });
-      } finally {
-        rmSync(tmpDir, { recursive: true, force: true });
-      }
-    });
-
-    it('should not double release the worker when the owner fails after worker completion', async () => {
-      const workerRelease = vi.fn().mockResolvedValue(undefined);
-      const ownerRelease = vi.fn().mockResolvedValue(undefined);
-
-      mockRelayInstance.spawnPty.mockImplementation(
-        async ({ name, task }: { name: string; task?: string }) => {
-          const isOwner = name.includes('-owner-');
-          const output = isOwner ? 'owner checking\n' : 'worker finished\n';
-
-          queueMicrotask(() => {
-            emitMockEvent('workerOutput', { name, chunk: output });
-          });
-
-          if (isOwner) {
-            return {
-              name,
-              waitForExit: vi.fn().mockImplementation(async () => {
-                await Promise.resolve();
-                return 'timeout';
-              }),
-              waitForIdle: vi.fn().mockResolvedValue('timeout'),
-              release: ownerRelease,
-            };
-          }
-
-          return {
-            name,
-            waitForExit: vi.fn().mockImplementation(async () => {
-              await workerRelease();
-              return 'released';
-            }),
-            waitForIdle: vi.fn().mockImplementation(() => never()),
-            release: workerRelease,
-          };
-        }
-      );
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('owner timed out');
-      expect(workerRelease).toHaveBeenCalledTimes(1);
-      expect(ownerRelease).toHaveBeenCalledTimes(1);
-    });
-
-    it('should emit owner-timeout when owner times out', async () => {
-      const events: Array<{ type: string; stepName?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-timeout') {
-          events.push({
-            type: event.type,
-            stepName: event.stepName,
-          });
-        }
-      });
-
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-      waitForIdleFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('timed out');
-      expect(events).toContainEqual({ type: 'step:owner-timeout', stepName: 'step-1' });
-    });
-
-    it('should emit owner-timeout for a dedicated supervisor when the worker is stuck', async () => {
-      const events: Array<{ type: string; stepName?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-timeout') {
-          events.push({ type: event.type, stepName: event.stepName });
-        }
-      });
-
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-      waitForIdleFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(makeSupervisedConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('owner timed out');
-      expect(events).toContainEqual({ type: 'step:owner-timeout', stepName: 'step-1' });
-    });
-
-    it('should preserve self-completion when no dedicated owner is available', async () => {
-      mockSpawnOutputs = ['STEP_COMPLETE:step-1\n', 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n'];
-
-      const config = makeConfig({
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'specialist', task: 'Do step 1' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-
-      expect(run.status).toBe('completed');
-      const spawnCalls = (mockRelayInstance.spawnPty as any).mock.calls;
-      expect(spawnCalls[0][0].name).toContain('step-1-');
-      expect(spawnCalls[0][0].name).not.toContain('worker');
-      expect(spawnCalls[0][0].task).toContain('STEP OWNER CONTRACT');
-      expect(spawnCalls[0][0].task).toContain('STEP_COMPLETE:step-1');
-    });
-
-    it('should use the full remaining timeout as the review safety backstop', async () => {
-      const config = makeSupervisedConfig({ timeoutMs: 90_000 });
-      const run = await runner.execute(config, 'default');
-
-      expect(run.status).toBe('completed');
-      const waitCalls = (waitForExitFn as any).mock?.calls ?? [];
-      expect(waitCalls.length).toBeGreaterThanOrEqual(2);
-      const reviewWaitMs = waitCalls[waitCalls.length - 1][0];
-      expect(reviewWaitMs).toBeGreaterThan(60_000);
-      expect(reviewWaitMs).toBeLessThanOrEqual(90_000);
-    });
-  });
-
-  // ── Event subscription ─────────────────────────────────────────────────
-
-  describe('on / event subscription', () => {
-    it('should return unsubscribe function', async () => {
-      const events: string[] = [];
-      const unsub = runner.on((event) => events.push(event.type));
-
-      await runner.execute(makeConfig(), 'default');
-      const count = events.length;
-
-      unsub();
-      // Events after unsubscribe are not captured (no second execute needed to prove this,
-      // just verify the unsub function works without error)
-      expect(count).toBeGreaterThan(0);
-    });
-  });
-
-  // ── Pause / abort ──────────────────────────────────────────────────────
-
-  describe('pause and abort', () => {
-    it('should support pause/unpause without error', () => {
-      expect(() => runner.pause()).not.toThrow();
-      expect(() => runner.unpause()).not.toThrow();
-    });
-
-    it('should support abort without error', () => {
-      expect(() => runner.abort()).not.toThrow();
-    });
-  });
-
-  // ── Resume ─────────────────────────────────────────────────────────────
-
-  describe('resume', () => {
-    it('should throw when run not found', async () => {
-      await expect(runner.resume('nonexistent')).rejects.toThrow('Run "nonexistent" not found');
-    });
-  });
-
-  // ── Non-interactive command builder ────────────────────────────────────
-
-  describe('buildNonInteractiveCommand', () => {
-    it('should build claude command with -p flag', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('claude', 'Do the thing');
-      expect(cmd).toBe('claude');
-      expect(args).toEqual(['-p', '--dangerously-skip-permissions', 'Do the thing']);
-    });
-
-    it('should build codex command with exec subcommand and bypass flag', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('codex', 'Build it');
-      expect(cmd).toBe('codex');
-      expect(args).toEqual(['exec', '--dangerously-bypass-approvals-and-sandbox', 'Build it']);
-    });
-
-    it('should build gemini command with -p flag', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('gemini', 'Analyze');
-      expect(cmd).toBe('gemini');
-      expect(args).toEqual(['-p', 'Analyze']);
-    });
-
-    it('should build opencode command with run subcommand', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('opencode', 'Fix bug');
-      expect(cmd).toBe('opencode');
-      expect(args).toEqual(['run', 'Fix bug']);
-    });
-
-    it('should build droid command with exec subcommand', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('droid', 'Deploy');
-      expect(cmd).toBe('droid');
-      expect(args).toEqual(['exec', 'Deploy']);
-    });
-
-    it('should build aider command with --message and safety flags', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('aider', 'Refactor');
-      expect(cmd).toBe('aider');
-      expect(args).toEqual(['--message', 'Refactor', '--yes-always', '--no-git']);
-    });
-
-    it('should build goose command with run subcommand', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('goose', 'Test it');
-      expect(cmd).toBe('goose');
-      expect(args).toEqual(['run', '--text', 'Test it', '--no-session']);
-    });
-
-    it('should append extra args after CLI-specific args', () => {
-      const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand('claude', 'Task', ['--model', 'opus']);
-      expect(cmd).toBe('claude');
-      expect(args).toEqual(['-p', '--dangerously-skip-permissions', 'Task', '--model', 'opus']);
-    });
-  });
-
-  // ── Dry run ─────────────────────────────────────────────────────────────
-
-  describe('dryRun', () => {
-    it('should compute correct waves for a simple DAG', () => {
-      const config = makeConfig();
-      const report = runner.dryRun(config);
-
-      expect(report.valid).toBe(true);
-      expect(report.errors).toHaveLength(0);
-      expect(report.totalSteps).toBe(2);
-      expect(report.estimatedWaves).toBe(2);
-      expect(report.waves[0].wave).toBe(1);
-      expect(report.waves[0].steps).toHaveLength(1);
-      expect(report.waves[0].steps[0].name).toBe('step-1');
-      expect(report.waves[1].wave).toBe(2);
-      expect(report.waves[1].steps).toHaveLength(1);
-      expect(report.waves[1].steps[0].name).toBe('step-2');
-    });
-
-    it('should compute parallel steps in the same wave', () => {
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'parallel',
-            steps: [
-              { name: 'a', agent: 'agent-a', task: 'Do A' },
-              { name: 'b', agent: 'agent-b', task: 'Do B' },
-              { name: 'c', agent: 'agent-a', task: 'Do C', dependsOn: ['a', 'b'] },
-            ],
-          },
-        ],
-      });
-
-      const report = runner.dryRun(config, 'parallel');
-
-      expect(report.valid).toBe(true);
-      expect(report.estimatedWaves).toBe(2);
-      expect(report.waves[0].steps).toHaveLength(2);
-      expect(report.waves[0].steps.map((s) => s.name).sort()).toEqual(['a', 'b']);
-      expect(report.waves[1].steps).toHaveLength(1);
-      expect(report.waves[1].steps[0].name).toBe('c');
-    });
-
-    it('should report agent step counts', () => {
-      const config = makeConfig();
-      const report = runner.dryRun(config);
-
-      const agentA = report.agents.find((a) => a.name === 'agent-a');
-      const agentB = report.agents.find((a) => a.name === 'agent-b');
-      expect(agentA?.stepCount).toBe(1);
-      expect(agentB?.stepCount).toBe(1);
-    });
-
-    it('should include resolved permissions without provisioning tokens', () => {
-      const tmpDir = mkdtempSync(path.join(os.tmpdir(), 'workflow-dry-run-perms-'));
-      try {
-        writeFileSync(path.join(tmpDir, 'readme.md'), '# readme\n');
-        writeFileSync(path.join(tmpDir, 'notes.txt'), 'notes\n');
-        writeFileSync(path.join(tmpDir, '.agentreadonly'), 'readme.md\n');
-
-        const dryRunRunner = new WorkflowRunner({ db, workspaceId: 'ws-test', cwd: tmpDir });
-        const report = dryRunRunner.dryRun(
-          makeConfig({
-            agents: [
-              {
-                name: 'agent-a',
-                cli: 'claude',
-                permissions: {
-                  access: 'readonly',
-                  files: {
-                    write: ['notes.txt'],
-                  },
-                  scopes: ['relay:custom'],
-                },
-              },
-              { name: 'agent-b', cli: 'claude' },
-            ],
-          })
-        );
-
-        const agentA = report.permissions?.find((entry) => entry.agent === 'agent-a');
-        const agentB = report.permissions?.find((entry) => entry.agent === 'agent-b');
-
-        expect(agentA?.agent).toBe('agent-a');
-        expect(agentA?.access).toBe('readonly');
-        expect(agentA?.writePaths).toBe(1);
-        expect(agentA?.denyPaths).toBe(0);
-        expect(agentA?.readPaths).toBeGreaterThanOrEqual(1);
-        expect(agentA?.source).toBe('yaml');
-        expect(agentA?.scopes).toBeGreaterThan(1);
-
-        expect(agentB).toMatchObject({
-          agent: 'agent-b',
-          access: 'readwrite',
-          source: 'preset',
-        });
-      } finally {
-        rmSync(tmpDir, { recursive: true, force: true });
-      }
-    });
-
-    it('should warn when step references unknown agent', () => {
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'nonexistent', task: 'Do stuff' }],
-          },
-        ],
-      });
-
-      const report = runner.dryRun(config);
-
-      expect(report.valid).toBe(true);
-      expect(report.warnings.some((w) => w.includes('nonexistent'))).toBe(true);
-    });
-
-    it('should warn when wave exceeds maxConcurrency', () => {
-      const config = makeConfig({
-        swarm: { pattern: 'dag', maxConcurrency: 1 },
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'a', agent: 'agent-a', task: 'Do A' },
-              { name: 'b', agent: 'agent-b', task: 'Do B' },
-            ],
-          },
-        ],
-      });
-
-      const report = runner.dryRun(config);
-
-      expect(report.valid).toBe(true);
-      expect(report.warnings.some((w) => w.includes('maxConcurrency'))).toBe(true);
-    });
-
-    it('should return errors for invalid config', () => {
-      const report = runner.dryRun({} as any);
-
-      expect(report.valid).toBe(false);
-      expect(report.errors.length).toBeGreaterThan(0);
-    });
-
-    it('should return error when workflow not found', () => {
-      const config = makeConfig();
-      const report = runner.dryRun(config, 'nonexistent');
-
-      expect(report.valid).toBe(false);
-      expect(report.errors[0]).toContain('nonexistent');
-    });
-  });
-});
diff --git a/packages/sdk/src/__tests__/workflow-trajectory.test.ts b/packages/sdk/src/__tests__/workflow-trajectory.test.ts
deleted file mode 100644
index 061ea12cc..000000000
--- a/packages/sdk/src/__tests__/workflow-trajectory.test.ts
+++ /dev/null
@@ -1,466 +0,0 @@
-/**
- * WorkflowTrajectory unit tests.
- *
- * Tests trajectory recording, chapter management, reflections, decisions,
- * confidence computation, and the disabled/enabled toggle.
- */
-
-import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest';
-import { existsSync, readFileSync, readdirSync, rmSync, mkdirSync } from 'node:fs';
-import path from 'node:path';
-import os from 'node:os';
-import { WorkflowTrajectory, type StepOutcome } from '../workflows/trajectory.js';
-
-// ── Test helpers ─────────────────────────────────────────────────────────────
-
-let tmpDir: string;
-let originalTrajectoriesDataDir: string | undefined;
-let originalWorkflowId: string | undefined;
-
-function makeTmpDir(): string {
-  const dir = path.join(os.tmpdir(), `wf-traj-test-${Date.now()}-${Math.random().toString(36).slice(2)}`);
-  mkdirSync(dir, { recursive: true });
-  return dir;
-}
-
-function findFirstJsonFile(dir: string): string | null {
-  if (!existsSync(dir)) return null;
-  for (const entry of readdirSync(dir, { withFileTypes: true })) {
-    const entryPath = path.join(dir, entry.name);
-    if (entry.isDirectory()) {
-      const nested = findFirstJsonFile(entryPath);
-      if (nested) return nested;
-    }
-    if (entry.isFile() && entry.name.endsWith('.json')) return entryPath;
-  }
-  return null;
-}
-
-function readTrajectoryFile(dir: string): any {
-  const file = findFirstJsonFile(path.join(dir, '.trajectories', 'active'));
-  return file ? JSON.parse(readFileSync(file, 'utf-8')) : null;
-}
-
-function readCompletedTrajectoryFile(dir: string): any {
-  const file = findFirstJsonFile(path.join(dir, '.trajectories', 'completed'));
-  return file ? JSON.parse(readFileSync(file, 'utf-8')) : null;
-}
-
-function readTrajectoryFileAt(dataDir: string, status: 'active' | 'completed'): any {
-  const file = findFirstJsonFile(path.join(dataDir, status));
-  return file ? JSON.parse(readFileSync(file, 'utf-8')) : null;
-}
-
-// ── Tests ────────────────────────────────────────────────────────────────────
-
-describe('WorkflowTrajectory', () => {
-  beforeEach(() => {
-    originalTrajectoriesDataDir = process.env.TRAJECTORIES_DATA_DIR;
-    originalWorkflowId = process.env.TRAJECTORIES_WORKFLOW_ID;
-    delete process.env.TRAJECTORIES_DATA_DIR;
-    delete process.env.TRAJECTORIES_WORKFLOW_ID;
-    tmpDir = makeTmpDir();
-  });
-
-  afterEach(() => {
-    if (originalTrajectoriesDataDir === undefined) {
-      delete process.env.TRAJECTORIES_DATA_DIR;
-    } else {
-      process.env.TRAJECTORIES_DATA_DIR = originalTrajectoriesDataDir;
-    }
-    if (originalWorkflowId === undefined) {
-      delete process.env.TRAJECTORIES_WORKFLOW_ID;
-    } else {
-      process.env.TRAJECTORIES_WORKFLOW_ID = originalWorkflowId;
-    }
-    try {
-      rmSync(tmpDir, { recursive: true, force: true });
-    } catch {
-      // cleanup best-effort
-    }
-  });
-
-  // ── Disabled mode ──────────────────────────────────────────────────────
-
-  describe('disabled', () => {
-    it('should not create files when trajectories is false', async () => {
-      const traj = new WorkflowTrajectory(false, 'run-1', tmpDir);
-      await traj.start('test-workflow', 3);
-
-      expect(traj.isEnabled()).toBe(false);
-      expect(traj.getTrajectoryId()).toBeNull();
-      expect(existsSync(path.join(tmpDir, '.trajectories'))).toBe(false);
-    });
-
-    it('should not create files when enabled is false', async () => {
-      const traj = new WorkflowTrajectory({ enabled: false }, 'run-1', tmpDir);
-      await traj.start('test-workflow', 3);
-
-      expect(traj.isEnabled()).toBe(false);
-    });
-
-    it('should be enabled by default', () => {
-      const traj = new WorkflowTrajectory(undefined, 'run-1', tmpDir);
-      expect(traj.isEnabled()).toBe(true);
-    });
-  });
-
-  // ── Lifecycle ──────────────────────────────────────────────────────────
-
-  describe('lifecycle', () => {
-    it('should create a trajectory file on start', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-abc', tmpDir);
-      await traj.start('my-workflow', 5);
-
-      expect(traj.getTrajectoryId()).toBeTruthy();
-      expect(traj.getTrajectoryId()!.startsWith('traj_')).toBe(true);
-
-      const data = readTrajectoryFile(tmpDir);
-      expect(data).toBeTruthy();
-      expect(data.status).toBe('active');
-      expect(data.task.title).toContain('my-workflow');
-      expect(data.agents).toHaveLength(1);
-      expect(data.agents[0].name).toBe('orchestrator');
-      expect(data.commits).toEqual([]);
-      expect(data.filesChanged).toEqual([]);
-      expect(data.tags).toEqual([]);
-    });
-
-    it('should create Planning chapter on start', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-abc', tmpDir);
-      await traj.start('my-workflow', 3, '3 parallel tracks, 2 barriers');
-
-      const data = readTrajectoryFile(tmpDir);
-      expect(data.chapters).toHaveLength(1);
-      expect(data.chapters[0].title).toBe('Planning');
-      expect(data.chapters[0].events.length).toBeGreaterThanOrEqual(1);
-    });
-
-    it('should complete trajectory and move to completed dir', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-abc', tmpDir);
-      await traj.start('my-workflow', 2);
-      await traj.complete('All done', 0.95);
-
-      const active = readTrajectoryFile(tmpDir);
-      expect(active).toBeNull(); // Moved out of active
-
-      const completed = readCompletedTrajectoryFile(tmpDir);
-      expect(completed).toBeTruthy();
-      expect(completed.status).toBe('completed');
-      expect(completed.retrospective.summary).toBe('All done');
-      expect(completed.retrospective.confidence).toBe(0.95);
-    });
-
-    it('should abandon trajectory and move to completed dir', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-abc', tmpDir);
-      await traj.start('my-workflow', 2);
-      await traj.abandon('Something went wrong');
-
-      const completed = readCompletedTrajectoryFile(tmpDir);
-      expect(completed).toBeTruthy();
-      expect(completed.status).toBe('abandoned');
-    });
-
-    it('should stamp workflowId from TRAJECTORIES_WORKFLOW_ID on start', async () => {
-      process.env.TRAJECTORIES_WORKFLOW_ID = 'wf-env-123';
-      const traj = new WorkflowTrajectory({}, 'run-abc', tmpDir);
-      await traj.start('my-workflow', 1);
-
-      const data = readTrajectoryFile(tmpDir);
-      expect(data.workflowId).toBe('wf-env-123');
-    });
-
-    it('should write to TRAJECTORIES_DATA_DIR when set', async () => {
-      const customDataDir = path.join(tmpDir, 'custom-root', '.trajectories');
-      process.env.TRAJECTORIES_DATA_DIR = customDataDir;
-
-      const traj = new WorkflowTrajectory({}, 'run-abc', tmpDir);
-      await traj.start('my-workflow', 1);
-
-      expect(readTrajectoryFile(tmpDir)).toBeNull();
-      expect(readTrajectoryFileAt(customDataDir, 'active')).toBeTruthy();
-    });
-  });
-
-  // ── Step events ────────────────────────────────────────────────────────
-
-  describe('step events', () => {
-    it('should record step started', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 2);
-      await traj.stepStarted({ name: 'build', agent: 'builder', task: 'Build it' }, 'builder-agent');
-
-      const data = readTrajectoryFile(tmpDir);
-      expect(data.agents).toHaveLength(2); // orchestrator + builder-agent
-      const events = data.chapters.flatMap((c: any) => c.events);
-      expect(events.some((e: any) => e.content.includes('build'))).toBe(true);
-    });
-
-    it('should record step completed', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 1);
-      await traj.stepCompleted({ name: 'test', agent: 'tester', task: 'Run tests' }, 'All tests passing', 1);
-
-      const data = readTrajectoryFile(tmpDir);
-      const events = data.chapters.flatMap((c: any) => c.events);
-      expect(events.some((e: any) => e.type === 'finding')).toBe(true);
-    });
-
-    it('should record step failed', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 1);
-      await traj.stepFailed(
-        { name: 'deploy', agent: 'deployer', task: 'Deploy' },
-        'Connection refused',
-        1,
-        3
-      );
-
-      const data = readTrajectoryFile(tmpDir);
-      const events = data.chapters.flatMap((c: any) => c.events);
-      expect(events.some((e: any) => e.type === 'error')).toBe(true);
-    });
-
-    it('should record step skipped', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 2);
-      await traj.stepSkipped({ name: 'integration', agent: 'tester', task: 'Test' }, 'Upstream failed');
-
-      const data = readTrajectoryFile(tmpDir);
-      const events = data.chapters.flatMap((c: any) => c.events);
-      expect(events.some((e: any) => e.content.includes('skipped'))).toBe(true);
-    });
-  });
-
-  // ── Chapters ───────────────────────────────────────────────────────────
-
-  describe('chapters', () => {
-    it('should create track chapters', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 3);
-      await traj.beginTrack('backend');
-
-      const data = readTrajectoryFile(tmpDir);
-      expect(data.chapters.length).toBeGreaterThanOrEqual(2);
-      expect(data.chapters.some((c: any) => c.title === 'Execution: backend')).toBe(true);
-    });
-
-    it('should create convergence chapters', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 3);
-      await traj.beginConvergence('all-tracks-done');
-
-      const data = readTrajectoryFile(tmpDir);
-      expect(data.chapters.some((c: any) => c.title === 'Convergence: all-tracks-done')).toBe(true);
-    });
-
-    it('should close previous chapter when opening new one', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 3);
-      await traj.beginTrack('track-a');
-      await traj.beginTrack('track-b');
-
-      const data = readTrajectoryFile(tmpDir);
-      // Planning chapter should have endedAt
-      expect(data.chapters[0].endedAt).toBeTruthy();
-      // First track chapter should have endedAt
-      expect(data.chapters[1].endedAt).toBeTruthy();
-    });
-  });
-
-  // ── Reflections ────────────────────────────────────────────────────────
-
-  describe('reflections', () => {
-    it('should record reflect events', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 2);
-      await traj.reflect('All parallel tracks complete', 0.85, ['step-a: completed', 'step-b: completed']);
-
-      const data = readTrajectoryFile(tmpDir);
-      const events = data.chapters.flatMap((c: any) => c.events);
-      const reflection = events.find((e: any) => e.type === 'reflection');
-      expect(reflection).toBeTruthy();
-      expect(reflection.significance).toBe('high');
-      expect(reflection.raw.confidence).toBe(0.85);
-      expect(reflection.raw.focalPoints).toHaveLength(2);
-    });
-
-    it('should synthesize and reflect at convergence', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 3);
-
-      const outcomes: StepOutcome[] = [
-        { name: 'step-a', agent: 'a', status: 'completed', attempts: 1 },
-        { name: 'step-b', agent: 'b', status: 'completed', attempts: 2 },
-      ];
-
-      await traj.synthesizeAndReflect('backend-ready', outcomes, ['step-c']);
-
-      const data = readTrajectoryFile(tmpDir);
-      // Should have a convergence chapter
-      expect(data.chapters.some((c: any) => c.title.includes('Convergence'))).toBe(true);
-      const events = data.chapters.flatMap((c: any) => c.events);
-      const reflection = events.find((e: any) => e.type === 'reflection');
-      expect(reflection).toBeTruthy();
-      expect(reflection.content).toContain('backend-ready');
-      expect(reflection.content).toContain('step-b'); // retried
-    });
-  });
-
-  // ── Decisions ──────────────────────────────────────────────────────────
-
-  describe('decisions', () => {
-    it('should record decisions', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 1);
-      await traj.decide('How to handle failure', 'retry', 'Transient error detected');
-
-      const data = readTrajectoryFile(tmpDir);
-      const events = data.chapters.flatMap((c: any) => c.events);
-      const decision = events.find((e: any) => e.type === 'decision');
-      expect(decision).toBeTruthy();
-      expect(decision.raw.chosen).toBe('retry');
-    });
-
-    it('should skip decisions when autoDecisions is false', async () => {
-      const traj = new WorkflowTrajectory({ autoDecisions: false }, 'run-1', tmpDir);
-      await traj.start('wf', 1);
-      await traj.decide('How to handle failure', 'retry', 'Transient error');
-
-      const data = readTrajectoryFile(tmpDir);
-      const events = data.chapters.flatMap((c: any) => c.events);
-      expect(events.filter((e: any) => e.type === 'decision')).toHaveLength(0);
-    });
-  });
-
-  // ── Confidence computation ─────────────────────────────────────────────
-
-  describe('computeConfidence', () => {
-    it('should return 1.0 for all first-attempt verified completions', () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      const outcomes: StepOutcome[] = [
-        { name: 'a', agent: 'a', status: 'completed', attempts: 1, verificationPassed: true },
-        { name: 'b', agent: 'b', status: 'completed', attempts: 1, verificationPassed: true },
-      ];
-      expect(traj.computeConfidence(outcomes)).toBe(1.0);
-    });
-
-    it('should return lower confidence for retried steps', () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      const outcomes: StepOutcome[] = [
-        { name: 'a', agent: 'a', status: 'completed', attempts: 1, verificationPassed: true },
-        { name: 'b', agent: 'b', status: 'completed', attempts: 3, verificationPassed: true },
-      ];
-      const confidence = traj.computeConfidence(outcomes);
-      expect(confidence).toBeLessThan(1.0);
-      expect(confidence).toBeGreaterThan(0.5);
-    });
-
-    it('should return lower confidence for failed steps', () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      const outcomes: StepOutcome[] = [
-        { name: 'a', agent: 'a', status: 'completed', attempts: 1 },
-        { name: 'b', agent: 'b', status: 'failed', attempts: 3 },
-      ];
-      const confidence = traj.computeConfidence(outcomes);
-      expect(confidence).toBeLessThan(0.5);
-    });
-
-    it('should return 0.7 for empty outcomes', () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      expect(traj.computeConfidence([])).toBe(0.7);
-    });
-  });
-
-  // ── Synthesis helpers ──────────────────────────────────────────────────
-
-  describe('buildSynthesis', () => {
-    it('should produce meaningful synthesis text', () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      const outcomes: StepOutcome[] = [
-        { name: 'step-a', agent: 'a', status: 'completed', attempts: 1 },
-        { name: 'step-b', agent: 'b', status: 'completed', attempts: 2 },
-        { name: 'step-c', agent: 'c', status: 'failed', attempts: 3, error: 'timeout' },
-      ];
-
-      const synthesis = traj.buildSynthesis('barrier-1', outcomes, ['step-d']);
-      expect(synthesis).toContain('barrier-1');
-      expect(synthesis).toContain('2/3 steps completed');
-      expect(synthesis).toContain('step-c'); // failed
-      expect(synthesis).toContain('step-b'); // retried
-      expect(synthesis).toContain('step-d'); // unblocked
-    });
-
-    it('should note all-first-attempt when no retries', () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      const outcomes: StepOutcome[] = [
-        { name: 'a', agent: 'a', status: 'completed', attempts: 1 },
-        { name: 'b', agent: 'b', status: 'completed', attempts: 1 },
-      ];
-
-      const synthesis = traj.buildSynthesis('done', outcomes);
-      expect(synthesis).toContain('All steps completed on first attempt');
-    });
-  });
-
-  describe('buildRunSummary', () => {
-    it('should produce run summary with stats', () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      const outcomes: StepOutcome[] = [
-        { name: 'a', agent: 'a', status: 'completed', attempts: 1 },
-        { name: 'b', agent: 'b', status: 'completed', attempts: 2 },
-        { name: 'c', agent: 'c', status: 'failed', attempts: 3 },
-        { name: 'd', agent: 'd', status: 'skipped', attempts: 1 },
-      ];
-
-      const summary = traj.buildRunSummary(outcomes);
-      expect(summary).toContain('Failed at "c"');
-      expect(summary).toContain('2/4 steps completed before failure');
-      expect(summary).toContain('downstream step(s) to be skipped');
-    });
-  });
-
-  // ── Non-blocking behavior ──────────────────────────────────────────────
-
-  describe('non-blocking', () => {
-    it('should not throw on flush errors', async () => {
-      // Use a path that will fail (read-only or invalid)
-      const traj = new WorkflowTrajectory({}, 'run-1', '/dev/null/impossible-path');
-      // Should not throw
-      await expect(traj.start('wf', 1)).resolves.not.toThrow();
-    });
-
-    it('should handle all methods gracefully when not started', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      // Don't call start — all methods should be no-ops
-      await expect(traj.stepStarted({ name: 'x', agent: 'a', task: 't' }, 'a')).resolves.not.toThrow();
-      await expect(traj.reflect('test', 0.5)).resolves.not.toThrow();
-      await expect(traj.decide('q', 'c', 'r')).resolves.not.toThrow();
-      await expect(traj.complete('done', 0.9)).resolves.not.toThrow();
-    });
-
-    it('should save once when completing', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 1);
-
-      const save = vi.fn().mockResolvedValue(undefined);
-      (traj as any).storage = { initialize: vi.fn().mockResolvedValue(undefined), save };
-      (traj as any).storageInit = Promise.resolve();
-
-      await traj.complete('done', 0.9);
-      expect(save).toHaveBeenCalledTimes(1);
-    });
-
-    it('should save once when abandoning', async () => {
-      const traj = new WorkflowTrajectory({}, 'run-1', tmpDir);
-      await traj.start('wf', 1);
-
-      const save = vi.fn().mockResolvedValue(undefined);
-      (traj as any).storage = { initialize: vi.fn().mockResolvedValue(undefined), save };
-      (traj as any).storageInit = Promise.resolve();
-
-      await traj.abandon('nope');
-      expect(save).toHaveBeenCalledTimes(1);
-    });
-  });
-});
diff --git a/packages/sdk/src/__tests__/yaml-validation.test.ts b/packages/sdk/src/__tests__/yaml-validation.test.ts
deleted file mode 100644
index 6fecd8ccc..000000000
--- a/packages/sdk/src/__tests__/yaml-validation.test.ts
+++ /dev/null
@@ -1,916 +0,0 @@
-/**
- * YAML Workflow Template Validation Tests
- *
- * Tests that all built-in workflow templates are valid, parse correctly,
- * and have correct structure. Also tests error handling for invalid YAML.
- *
- * These tests are CI-friendly (no CLI or API keys needed).
- */
-import { describe, it, expect, beforeEach } from 'vitest';
-import { promises as fs } from 'node:fs';
-import path from 'node:path';
-import { fileURLToPath } from 'node:url';
-import { parse as parseYaml } from 'yaml';
-import { TemplateRegistry, BUILT_IN_TEMPLATE_NAMES } from '../workflows/templates.js';
-import { SwarmCoordinator } from '../workflows/coordinator.js';
-import type {
-  RelayYamlConfig,
-  SwarmPattern,
-  WorkflowStep,
-  CustomStepDefinition,
-} from '../workflows/types.js';
-import { isDeterministicStep, isWorktreeStep, isAgentStep, isCustomStep } from '../workflows/types.js';
-import {
-  resolveCustomStep,
-  resolveAllCustomSteps,
-  validateCustomStepsUsage,
-  CustomStepsParseError,
-  CustomStepResolutionError,
-} from '../workflows/custom-steps.js';
-
-const __dirname = path.dirname(fileURLToPath(import.meta.url));
-const TEMPLATES_DIR = path.resolve(__dirname, '../workflows/builtin-templates');
-
-// Mock DB for coordinator tests
-const mockDb = {
-  query: async () => ({ rows: [] }),
-};
-
-describe('YAML Template Validation', () => {
-  let registry: TemplateRegistry;
-  let coordinator: SwarmCoordinator;
-
-  beforeEach(() => {
-    registry = new TemplateRegistry({ builtInTemplatesDir: TEMPLATES_DIR });
-    coordinator = new SwarmCoordinator(mockDb as any);
-  });
-
-  // ── Built-in Template Registration ─────────────────────────────────────────
-
-  describe('Built-in Template Registration', () => {
-    it('should have all expected built-in templates registered', () => {
-      const templates = registry.listBuiltInTemplates();
-      expect(templates).toContain('feature-dev');
-      expect(templates).toContain('bug-fix');
-      expect(templates).toContain('code-review');
-      expect(templates).toContain('security-audit');
-      expect(templates).toContain('refactor');
-      expect(templates).toContain('documentation');
-      expect(templates).toContain('review-loop');
-    });
-
-    it('should have correct number of built-in templates', () => {
-      const templates = registry.listBuiltInTemplates();
-      expect(templates.length).toBeGreaterThanOrEqual(7);
-    });
-  });
-
-  // ── Individual Template Validation ─────────────────────────────────────────
-
-  describe('Template Loading and Validation', () => {
-    for (const templateName of BUILT_IN_TEMPLATE_NAMES) {
-      describe(`${templateName} template`, () => {
-        it('should load successfully', async () => {
-          const config = await registry.loadTemplate(templateName);
-          expect(config).toBeDefined();
-          expect(config.name).toBe(templateName);
-        });
-
-        it('should have required fields', async () => {
-          const config = await registry.loadTemplate(templateName);
-          expect(config.version).toBeDefined();
-          expect(config.name).toBeDefined();
-          expect(config.swarm).toBeDefined();
-          expect(config.swarm.pattern).toBeDefined();
-          expect(config.agents).toBeDefined();
-          expect(config.agents.length).toBeGreaterThan(0);
-        });
-
-        it('should have valid swarm pattern', async () => {
-          const config = await registry.loadTemplate(templateName);
-          const validPatterns: SwarmPattern[] = [
-            'fan-out',
-            'pipeline',
-            'hub-spoke',
-            'consensus',
-            'mesh',
-            'handoff',
-            'cascade',
-            'dag',
-            'debate',
-            'hierarchical',
-            'map-reduce',
-            'scatter-gather',
-            'supervisor',
-            'reflection',
-            'red-team',
-            'verifier',
-            'auction',
-            'escalation',
-            'saga',
-            'circuit-breaker',
-            'blackboard',
-            'swarm',
-            'competitive',
-            'review-loop',
-          ];
-          expect(validPatterns).toContain(config.swarm.pattern);
-        });
-
-        it('should have valid agent definitions', async () => {
-          const config = await registry.loadTemplate(templateName);
-          for (const agent of config.agents) {
-            expect(agent.name).toBeDefined();
-            expect(typeof agent.name).toBe('string');
-            expect(agent.cli).toBeDefined();
-            expect(['claude', 'codex', 'gemini', 'aider', 'goose', 'opencode', 'droid']).toContain(agent.cli);
-          }
-        });
-
-        it('should have unique agent names', async () => {
-          const config = await registry.loadTemplate(templateName);
-          const names = config.agents.map((a) => a.name);
-          const uniqueNames = new Set(names);
-          expect(uniqueNames.size).toBe(names.length);
-        });
-
-        it('should resolve topology without error', async () => {
-          const config = await registry.loadTemplate(templateName);
-          const topology = coordinator.resolveTopology(config);
-          expect(topology).toBeDefined();
-          expect(topology.pattern).toBe(config.swarm.pattern);
-          expect(topology.agents).toEqual(config.agents);
-          expect(topology.edges).toBeInstanceOf(Map);
-        });
-      });
-    }
-  });
-
-  // ── Workflow Steps Validation ──────────────────────────────────────────────
-
-  describe('Workflow Steps Validation', () => {
-    for (const templateName of BUILT_IN_TEMPLATE_NAMES) {
-      it(`${templateName}: workflow steps should be valid`, async () => {
-        const config = await registry.loadTemplate(templateName);
-
-        if (config.workflows && config.workflows.length > 0) {
-          for (const workflow of config.workflows) {
-            expect(workflow.name).toBeDefined();
-            expect(workflow.steps).toBeDefined();
-            expect(Array.isArray(workflow.steps)).toBe(true);
-
-            for (const step of workflow.steps) {
-              expect(step.name).toBeDefined();
-              expect(typeof step.name).toBe('string');
-
-              // Agent steps require agent and task
-              if (step.type !== 'deterministic' && step.type !== 'worktree') {
-                expect(step.agent).toBeDefined();
-                expect(step.task).toBeDefined();
-              }
-
-              // Deterministic steps require command
-              if (step.type === 'deterministic') {
-                expect(step.command).toBeDefined();
-              }
-
-              // Worktree steps require branch
-              if (step.type === 'worktree') {
-                expect(step.branch).toBeDefined();
-              }
-
-              // Check dependsOn is array if present
-              if (step.dependsOn) {
-                expect(Array.isArray(step.dependsOn)).toBe(true);
-              }
-            }
-          }
-        }
-      });
-
-      it(`${templateName}: step dependencies should reference existing steps`, async () => {
-        const config = await registry.loadTemplate(templateName);
-
-        if (config.workflows && config.workflows.length > 0) {
-          for (const workflow of config.workflows) {
-            const stepNames = new Set(workflow.steps.map((s) => s.name));
-
-            for (const step of workflow.steps) {
-              if (step.dependsOn) {
-                for (const dep of step.dependsOn) {
-                  expect(stepNames.has(dep)).toBe(true);
-                }
-              }
-            }
-          }
-        }
-      });
-
-      it(`${templateName}: step agents should reference existing agents`, async () => {
-        const config = await registry.loadTemplate(templateName);
-        const agentNames = new Set(config.agents.map((a) => a.name));
-
-        if (config.workflows && config.workflows.length > 0) {
-          for (const workflow of config.workflows) {
-            for (const step of workflow.steps) {
-              if (step.agent) {
-                expect(agentNames.has(step.agent)).toBe(true);
-              }
-            }
-          }
-        }
-      });
-    }
-  });
-
-  // ── review-loop Template Specific Tests ────────────────────────────────────
-
-  describe('review-loop Template Specifics', () => {
-    it('should have implementer agent', async () => {
-      const config = await registry.loadTemplate('review-loop');
-      const implementer = config.agents.find((a) => a.name.includes('implementer'));
-      expect(implementer).toBeDefined();
-    });
-
-    it('should have multiple reviewer agents', async () => {
-      const config = await registry.loadTemplate('review-loop');
-      const reviewers = config.agents.filter((a) => a.name.includes('reviewer'));
-      expect(reviewers.length).toBeGreaterThanOrEqual(2);
-    });
-
-    it('should have non-interactive reviewers', async () => {
-      const config = await registry.loadTemplate('review-loop');
-      const reviewers = config.agents.filter((a) => a.name.includes('reviewer'));
-      for (const reviewer of reviewers) {
-        expect(reviewer.interactive).toBe(false);
-      }
-    });
-
-    it('should have deterministic git diff step', async () => {
-      const config = await registry.loadTemplate('review-loop');
-      if (config.workflows && config.workflows.length > 0) {
-        const workflow = config.workflows[0];
-        const diffStep = workflow.steps.find((s) => s.name === 'capture-diff');
-        expect(diffStep).toBeDefined();
-        expect(diffStep?.type).toBe('deterministic');
-        expect(diffStep?.command).toContain('git diff');
-      }
-    });
-
-    it('should have review steps depending on implement step', async () => {
-      const config = await registry.loadTemplate('review-loop');
-      if (config.workflows && config.workflows.length > 0) {
-        const workflow = config.workflows[0];
-        const reviewSteps = workflow.steps.filter((s) => s.name.startsWith('review-'));
-        expect(reviewSteps.length).toBeGreaterThan(0);
-      }
-    });
-
-    it('should have consolidate step depending on all reviews', async () => {
-      const config = await registry.loadTemplate('review-loop');
-      if (config.workflows && config.workflows.length > 0) {
-        const workflow = config.workflows[0];
-        const consolidateStep = workflow.steps.find((s) => s.name === 'consolidate');
-        expect(consolidateStep).toBeDefined();
-        expect(consolidateStep?.dependsOn).toBeDefined();
-        expect(consolidateStep?.dependsOn?.length).toBeGreaterThanOrEqual(3);
-      }
-    });
-
-    it('should have address-feedback step', async () => {
-      const config = await registry.loadTemplate('review-loop');
-      if (config.workflows && config.workflows.length > 0) {
-        const workflow = config.workflows[0];
-        const addressStep = workflow.steps.find((s) => s.name === 'address-feedback');
-        expect(addressStep).toBeDefined();
-        expect(addressStep?.dependsOn).toContain('consolidate');
-      }
-    });
-
-    it('should have coordination barriers', async () => {
-      const config = await registry.loadTemplate('review-loop');
-      expect(config.coordination).toBeDefined();
-      expect(config.coordination?.barriers).toBeDefined();
-      expect(config.coordination?.barriers?.length).toBeGreaterThan(0);
-    });
-  });
-
-  // ── Error Handling Tests ───────────────────────────────────────────────────
-
-  describe('Error Handling', () => {
-    it('should reject template with missing version', () => {
-      const invalidYaml = `
-name: test
-swarm:
-  pattern: fan-out
-agents:
-  - name: test
-    cli: claude
-`;
-      const parsed = parseYaml(invalidYaml);
-      expect(() => (registry as any).validateRelayConfig(parsed, 'test')).toThrow(/version/);
-    });
-
-    it('should reject template with missing name', () => {
-      const invalidYaml = `
-version: "1.0"
-swarm:
-  pattern: fan-out
-agents:
-  - name: test
-    cli: claude
-`;
-      const parsed = parseYaml(invalidYaml);
-      expect(() => (registry as any).validateRelayConfig(parsed, 'test')).toThrow(/name/);
-    });
-
-    it('should reject template with empty agents', () => {
-      const invalidYaml = `
-version: "1.0"
-name: test
-swarm:
-  pattern: fan-out
-agents: []
-`;
-      const parsed = parseYaml(invalidYaml);
-      expect(() => (registry as any).validateRelayConfig(parsed, 'test')).toThrow(/agents/);
-    });
-
-    it('should reject template with invalid agent definition', () => {
-      const invalidYaml = `
-version: "1.0"
-name: test
-swarm:
-  pattern: fan-out
-agents:
-  - name: test
-`;
-      const parsed = parseYaml(invalidYaml);
-      expect(() => (registry as any).validateRelayConfig(parsed, 'test')).toThrow(/invalid agent/i);
-    });
-
-    it('should reject non-existent template', async () => {
-      await expect(registry.loadTemplate('non-existent-template')).rejects.toThrow(/not found/i);
-    });
-  });
-
-  // ── Template Override Tests ────────────────────────────────────────────────
-
-  describe('Template Overrides', () => {
-    it('should apply simple override', async () => {
-      const config = await registry.loadTemplate('feature-dev', {
-        overrides: { description: 'Custom description' },
-      });
-      expect(config.description).toBe('Custom description');
-    });
-
-    it('should apply nested override', async () => {
-      const config = await registry.loadTemplate('feature-dev', {
-        overrides: { 'swarm.maxConcurrency': 10 },
-      });
-      expect(config.swarm.maxConcurrency).toBe(10);
-    });
-
-    it('should apply agent override by index', async () => {
-      const config = await registry.loadTemplate('feature-dev', {
-        overrides: { 'agents[0].constraints.model': 'claude-opus' },
-      });
-      expect(config.agents[0].constraints?.model).toBe('claude-opus');
-    });
-  });
-
-  // ── DAG Validation Tests ───────────────────────────────────────────────────
-
-  describe('DAG Dependency Validation', () => {
-    for (const templateName of BUILT_IN_TEMPLATE_NAMES) {
-      it(`${templateName}: should not have circular dependencies`, async () => {
-        const config = await registry.loadTemplate(templateName);
-
-        if (config.workflows && config.workflows.length > 0) {
-          for (const workflow of config.workflows) {
-            const deps = new Map<string, string[]>();
-            for (const step of workflow.steps) {
-              deps.set(step.name, step.dependsOn ?? []);
-            }
-
-            // Check for cycles using DFS
-            const visited = new Set<string>();
-            const recursionStack = new Set<string>();
-
-            const hasCycle = (node: string): boolean => {
-              if (recursionStack.has(node)) return true;
-              if (visited.has(node)) return false;
-
-              visited.add(node);
-              recursionStack.add(node);
-
-              for (const dep of deps.get(node) ?? []) {
-                if (hasCycle(dep)) return true;
-              }
-
-              recursionStack.delete(node);
-              return false;
-            };
-
-            for (const step of workflow.steps) {
-              expect(hasCycle(step.name)).toBe(false);
-            }
-          }
-        }
-      });
-    }
-  });
-
-  // ── Verification Check Tests ───────────────────────────────────────────────
-
-  describe('Verification Check Validation', () => {
-    for (const templateName of BUILT_IN_TEMPLATE_NAMES) {
-      it(`${templateName}: verification checks should be valid`, async () => {
-        const config = await registry.loadTemplate(templateName);
-
-        if (config.workflows && config.workflows.length > 0) {
-          for (const workflow of config.workflows) {
-            for (const step of workflow.steps) {
-              if (step.verification) {
-                expect(['output_contains', 'exit_code', 'file_exists', 'custom']).toContain(
-                  step.verification.type
-                );
-                expect(step.verification.value).toBeDefined();
-              }
-            }
-          }
-        }
-      });
-    }
-  });
-
-  // ── Variable Substitution Tests ────────────────────────────────────────────
-
-  describe('Variable Substitution Patterns', () => {
-    for (const templateName of BUILT_IN_TEMPLATE_NAMES) {
-      it(`${templateName}: variable references should be valid`, async () => {
-        const config = await registry.loadTemplate(templateName);
-
-        if (config.workflows && config.workflows.length > 0) {
-          for (const workflow of config.workflows) {
-            const stepNames = new Set(workflow.steps.map((s) => s.name));
-
-            for (const step of workflow.steps) {
-              if (step.task) {
-                // Check for {{steps.X.output}} references
-                const stepRefs = step.task.match(/\{\{steps\.([^.]+)\.output\}\}/g) ?? [];
-                for (const ref of stepRefs) {
-                  const match = ref.match(/\{\{steps\.([^.]+)\.output\}\}/);
-                  if (match) {
-                    const referencedStep = match[1];
-                    // The referenced step should exist
-                    expect(stepNames.has(referencedStep)).toBe(true);
-                  }
-                }
-              }
-            }
-          }
-        }
-      });
-    }
-  });
-
-  // ── Error Handling Configuration ───────────────────────────────────────────
-
-  describe('Error Handling Configuration', () => {
-    for (const templateName of BUILT_IN_TEMPLATE_NAMES) {
-      it(`${templateName}: error handling should be valid if present`, async () => {
-        const config = await registry.loadTemplate(templateName);
-
-        if (config.errorHandling) {
-          expect(['fail-fast', 'continue', 'retry']).toContain(config.errorHandling.strategy);
-
-          if (config.errorHandling.maxRetries !== undefined) {
-            expect(config.errorHandling.maxRetries).toBeGreaterThanOrEqual(0);
-          }
-
-          if (config.errorHandling.retryDelayMs !== undefined) {
-            expect(config.errorHandling.retryDelayMs).toBeGreaterThanOrEqual(0);
-          }
-        }
-      });
-    }
-  });
-});
-
-// ── Step Type Guard Tests ───────────────────────────────────────────────────
-
-describe('Step Type Guards', () => {
-  it('should identify deterministic steps', () => {
-    const step: WorkflowStep = { name: 'test', type: 'deterministic', command: 'echo hello' };
-    expect(isDeterministicStep(step)).toBe(true);
-    expect(isWorktreeStep(step)).toBe(false);
-    expect(isAgentStep(step)).toBe(false);
-  });
-
-  it('should identify worktree steps', () => {
-    const step: WorkflowStep = { name: 'test', type: 'worktree', branch: 'feature/test' };
-    expect(isDeterministicStep(step)).toBe(false);
-    expect(isWorktreeStep(step)).toBe(true);
-    expect(isAgentStep(step)).toBe(false);
-  });
-
-  it('should identify agent steps (explicit type)', () => {
-    const step: WorkflowStep = { name: 'test', type: 'agent', agent: 'dev', task: 'Do work' };
-    expect(isDeterministicStep(step)).toBe(false);
-    expect(isWorktreeStep(step)).toBe(false);
-    expect(isAgentStep(step)).toBe(true);
-  });
-
-  it('should identify agent steps (implicit type)', () => {
-    const step: WorkflowStep = { name: 'test', agent: 'dev', task: 'Do work' };
-    expect(isDeterministicStep(step)).toBe(false);
-    expect(isWorktreeStep(step)).toBe(false);
-    expect(isAgentStep(step)).toBe(true);
-  });
-
-  it('should identify custom steps', () => {
-    const step: WorkflowStep = { name: 'test', use: 'docker-build' };
-    expect(isCustomStep(step)).toBe(true);
-  });
-
-  it('should not identify non-custom steps as custom', () => {
-    const agentStep: WorkflowStep = { name: 'test', agent: 'dev', task: 'Do work' };
-    const deterministicStep: WorkflowStep = { name: 'test', type: 'deterministic', command: 'echo hello' };
-    expect(isCustomStep(agentStep)).toBe(false);
-    expect(isCustomStep(deterministicStep)).toBe(false);
-  });
-});
-
-// ── Custom Step Resolution Tests ────────────────────────────────────────────
-
-describe('Custom Step Resolution', () => {
-  const customSteps = new Map<string, CustomStepDefinition>([
-    [
-      'docker-build',
-      {
-        params: [
-          { name: 'image', required: true },
-          { name: 'dockerfile', default: 'Dockerfile' },
-        ],
-        command: 'docker build -t {{image}} -f {{dockerfile}} .',
-        captureOutput: true,
-      },
-    ],
-    [
-      'setup-worktree',
-      {
-        type: 'worktree',
-        params: [{ name: 'branch', required: true }],
-        branch: '{{branch}}',
-        baseBranch: 'main',
-        createBranch: true,
-      },
-    ],
-  ]);
-
-  it('should resolve custom step with required param', () => {
-    const step = { name: 'build', use: 'docker-build', image: 'myapp:latest' } as WorkflowStep;
-    const resolved = resolveCustomStep(step, customSteps);
-
-    expect(resolved.type).toBe('deterministic');
-    expect(resolved.command).toBe('docker build -t myapp:latest -f Dockerfile .');
-    expect(resolved.captureOutput).toBe(true);
-  });
-
-  it('should resolve custom step with all params', () => {
-    const step = {
-      name: 'build',
-      use: 'docker-build',
-      image: 'myapp:v2',
-      dockerfile: 'Dockerfile.prod',
-    } as WorkflowStep;
-    const resolved = resolveCustomStep(step, customSteps);
-
-    expect(resolved.command).toBe('docker build -t myapp:v2 -f Dockerfile.prod .');
-  });
-
-  it('should throw on missing required param', () => {
-    const step = { name: 'build', use: 'docker-build' } as WorkflowStep;
-
-    expect(() => resolveCustomStep(step, customSteps)).toThrow(/Missing required parameter/);
-  });
-
-  it('should throw on unknown custom step', () => {
-    const step = { name: 'build', use: 'unknown-step' } as WorkflowStep;
-
-    expect(() => resolveCustomStep(step, customSteps)).toThrow(/Custom step "unknown-step" not found/);
-  });
-
-  it('should resolve worktree custom step', () => {
-    const step = { name: 'setup', use: 'setup-worktree', branch: 'feature/test' } as WorkflowStep;
-    const resolved = resolveCustomStep(step, customSteps);
-
-    expect(resolved.type).toBe('worktree');
-    expect(resolved.branch).toBe('feature/test');
-    expect(resolved.baseBranch).toBe('main');
-    expect(resolved.createBranch).toBe(true);
-  });
-
-  it('should preserve step name and dependsOn', () => {
-    const step = {
-      name: 'my-build',
-      use: 'docker-build',
-      image: 'app:latest',
-      dependsOn: ['setup'],
-    } as WorkflowStep;
-    const resolved = resolveCustomStep(step, customSteps);
-
-    expect(resolved.name).toBe('my-build');
-    expect(resolved.dependsOn).toEqual(['setup']);
-  });
-
-  it('should pass through non-custom steps unchanged', () => {
-    const step: WorkflowStep = { name: 'test', type: 'deterministic', command: 'echo hello' };
-    const resolved = resolveCustomStep(step, customSteps);
-
-    expect(resolved).toBe(step);
-  });
-
-  it('should resolve all custom steps in array', () => {
-    const steps: WorkflowStep[] = [
-      { name: 'build1', use: 'docker-build', image: 'app1:latest' } as WorkflowStep,
-      { name: 'regular', type: 'deterministic', command: 'echo done' },
-      { name: 'build2', use: 'docker-build', image: 'app2:latest' } as WorkflowStep,
-    ];
-
-    const resolved = resolveAllCustomSteps(steps, customSteps);
-
-    expect(resolved).toHaveLength(3);
-    expect(resolved[0].command).toBe('docker build -t app1:latest -f Dockerfile .');
-    expect(resolved[1].command).toBe('echo done');
-    expect(resolved[2].command).toBe('docker build -t app2:latest -f Dockerfile .');
-  });
-});
-
-// ── Custom Step Validation Tests ────────────────────────────────────────────
-
-describe('Custom Step Validation', () => {
-  const customSteps = new Map<string, CustomStepDefinition>([
-    [
-      'docker-build',
-      {
-        params: [
-          { name: 'image', required: true },
-          { name: 'dockerfile', default: 'Dockerfile' },
-        ],
-        command: 'docker build -t {{image}} -f {{dockerfile}} .',
-      },
-    ],
-    [
-      'deploy',
-      {
-        params: [{ name: 'env', required: true }],
-        command: 'deploy --env={{env}}',
-      },
-    ],
-  ]);
-
-  describe('validateCustomStepsUsage', () => {
-    it('should pass validation for correctly configured steps', () => {
-      const steps: WorkflowStep[] = [
-        { name: 'build', use: 'docker-build', image: 'myapp:latest' } as WorkflowStep,
-      ];
-
-      const result = validateCustomStepsUsage(steps, customSteps);
-
-      expect(result.valid).toBe(true);
-      expect(result.errors).toHaveLength(0);
-    });
-
-    it('should report missing custom step definition', () => {
-      const steps: WorkflowStep[] = [{ name: 'build', use: 'unknown-step' } as WorkflowStep];
-
-      const result = validateCustomStepsUsage(steps, customSteps);
-
-      expect(result.valid).toBe(false);
-      expect(result.errors).toHaveLength(1);
-      expect(result.errors[0]).toContain('unknown-step');
-      expect(result.missingSteps).toContain('unknown-step');
-    });
-
-    it('should report missing required parameters', () => {
-      const steps: WorkflowStep[] = [
-        { name: 'build', use: 'docker-build' } as WorkflowStep, // missing 'image'
-      ];
-
-      const result = validateCustomStepsUsage(steps, customSteps);
-
-      expect(result.valid).toBe(false);
-      expect(result.errors).toHaveLength(1);
-      expect(result.errors[0]).toContain('image');
-      expect(result.missingParams).toHaveLength(1);
-      expect(result.missingParams[0]).toEqual({
-        step: 'build',
-        use: 'docker-build',
-        param: 'image',
-      });
-    });
-
-    it('should warn about undefined variables in command', () => {
-      const customStepsWithUndefinedVar = new Map<string, CustomStepDefinition>([
-        [
-          'bad-step',
-          {
-            params: [{ name: 'known' }],
-            command: 'run {{known}} {{unknown}}',
-          },
-        ],
-      ]);
-
-      const steps: WorkflowStep[] = [{ name: 'test', use: 'bad-step', known: 'value' } as WorkflowStep];
-
-      const result = validateCustomStepsUsage(steps, customStepsWithUndefinedVar);
-
-      expect(result.valid).toBe(true); // warnings don't fail validation
-      expect(result.warnings).toHaveLength(1);
-      expect(result.warnings[0]).toContain('unknown');
-      expect(result.unresolvedVariables).toHaveLength(1);
-    });
-
-    it('should warn about extra parameters not in definition', () => {
-      const steps: WorkflowStep[] = [
-        { name: 'build', use: 'docker-build', image: 'app', extraParam: 'ignored' } as WorkflowStep,
-      ];
-
-      const result = validateCustomStepsUsage(steps, customSteps);
-
-      expect(result.valid).toBe(true);
-      expect(result.warnings.some((w) => w.includes('extraParam'))).toBe(true);
-    });
-
-    it('should validate multiple steps with different issues', () => {
-      const steps: WorkflowStep[] = [
-        { name: 'build1', use: 'docker-build' } as WorkflowStep, // missing image
-        { name: 'build2', use: 'missing-step' } as WorkflowStep, // unknown step
-        { name: 'deploy', use: 'deploy', env: 'prod' } as WorkflowStep, // valid
-      ];
-
-      const result = validateCustomStepsUsage(steps, customSteps);
-
-      expect(result.valid).toBe(false);
-      expect(result.errors).toHaveLength(2);
-      expect(result.missingSteps).toContain('missing-step');
-      expect(result.missingParams).toHaveLength(1);
-    });
-
-    it('should skip validation for non-custom steps', () => {
-      const steps: WorkflowStep[] = [
-        { name: 'agent-step', agent: 'dev', task: 'Do work' },
-        { name: 'det-step', type: 'deterministic', command: 'echo hello' },
-      ];
-
-      const result = validateCustomStepsUsage(steps, customSteps);
-
-      expect(result.valid).toBe(true);
-      expect(result.errors).toHaveLength(0);
-      expect(result.warnings).toHaveLength(0);
-    });
-  });
-});
-
-// ── Custom Step Error Classes Tests ─────────────────────────────────────────
-
-describe('Custom Step Error Classes', () => {
-  it('CustomStepsParseError should have helpful message', () => {
-    const error = new CustomStepsParseError(
-      'Missing "steps" key',
-      'Add a "steps" object',
-      '/path/to/steps.yaml'
-    );
-
-    expect(error.name).toBe('CustomStepsParseError');
-    expect(error.issue).toBe('Missing "steps" key');
-    expect(error.suggestion).toBe('Add a "steps" object');
-    expect(error.filePath).toBe('/path/to/steps.yaml');
-    expect(error.message).toContain('Missing "steps" key');
-    expect(error.message).toContain('Add a "steps" object');
-  });
-
-  it('CustomStepResolutionError should have helpful message', () => {
-    const error = new CustomStepResolutionError(
-      'my-step',
-      'Custom step "docker-build" not found',
-      'Add it to .relay/steps.yaml'
-    );
-
-    expect(error.name).toBe('CustomStepResolutionError');
-    expect(error.stepName).toBe('my-step');
-    expect(error.issue).toBe('Custom step "docker-build" not found');
-    expect(error.suggestion).toBe('Add it to .relay/steps.yaml');
-    expect(error.message).toContain('my-step');
-  });
-});
-
-// ── Worktree Step Tests ─────────────────────────────────────────────────────
-
-describe('Worktree Step Validation', () => {
-  it('should accept valid worktree step', () => {
-    const validYaml = `
-version: "1.0"
-name: test-worktree
-swarm:
-  pattern: dag
-agents:
-  - name: developer
-    cli: claude
-workflows:
-  - name: default
-    steps:
-      - name: setup-worktree
-        type: worktree
-        branch: feature/test
-      - name: develop
-        agent: developer
-        task: "Work in worktree"
-        dependsOn: [setup-worktree]
-`;
-    const parsed = parseYaml(validYaml);
-    expect(parsed.workflows[0].steps[0].type).toBe('worktree');
-    expect(parsed.workflows[0].steps[0].branch).toBe('feature/test');
-  });
-
-  it('should accept worktree step with all options', () => {
-    const validYaml = `
-version: "1.0"
-name: test-worktree
-swarm:
-  pattern: dag
-agents:
-  - name: developer
-    cli: claude
-workflows:
-  - name: default
-    steps:
-      - name: setup-worktree
-        type: worktree
-        branch: feature/test
-        baseBranch: main
-        path: .worktrees/dev
-        createBranch: true
-        timeoutMs: 30000
-`;
-    const parsed = parseYaml(validYaml);
-    const step = parsed.workflows[0].steps[0];
-    expect(step.type).toBe('worktree');
-    expect(step.branch).toBe('feature/test');
-    expect(step.baseBranch).toBe('main');
-    expect(step.path).toBe('.worktrees/dev');
-    expect(step.createBranch).toBe(true);
-    expect(step.timeoutMs).toBe(30000);
-  });
-
-  it('should support variable interpolation in worktree branch', () => {
-    const validYaml = `
-version: "1.0"
-name: test-worktree
-swarm:
-  pattern: dag
-agents:
-  - name: developer
-    cli: claude
-workflows:
-  - name: default
-    steps:
-      - name: setup-worktree
-        type: worktree
-        branch: "feature/{{branch-name}}"
-`;
-    const parsed = parseYaml(validYaml);
-    expect(parsed.workflows[0].steps[0].branch).toBe('feature/{{branch-name}}');
-  });
-});
-
-// ── Pattern Selection Tests ──────────────────────────────────────────────────
-
-describe('Pattern Selection for Templates', () => {
-  let registry: TemplateRegistry;
-  let coordinator: SwarmCoordinator;
-
-  beforeEach(() => {
-    registry = new TemplateRegistry({ builtInTemplatesDir: TEMPLATES_DIR });
-    coordinator = new SwarmCoordinator(mockDb as any);
-  });
-
-  it('review-loop should select review-loop pattern', async () => {
-    const config = await registry.loadTemplate('review-loop');
-    const pattern = coordinator.selectPattern(config);
-    expect(pattern).toBe('review-loop');
-  });
-
-  for (const templateName of BUILT_IN_TEMPLATE_NAMES) {
-    it(`${templateName}: selected pattern should match declared pattern`, async () => {
-      const config = await registry.loadTemplate(templateName);
-      // If pattern is explicit, selection should return it
-      if (config.swarm.pattern) {
-        const selected = coordinator.selectPattern(config);
-        expect(selected).toBe(config.swarm.pattern);
-      }
-    });
-  }
-});
diff --git a/packages/sdk/src/cli-registry.ts b/packages/sdk/src/cli-registry.ts
index ec039e26e..4468589e1 100644
--- a/packages/sdk/src/cli-registry.ts
+++ b/packages/sdk/src/cli-registry.ts
@@ -11,7 +11,7 @@
  * in `resolve_command_path()` at crates/broker/src/pty.rs.
  */
 
-import type { AgentCli } from './workflows/types.js';
+import type { AgentCli } from '@agent-relay/cloud';
 
 // ── Types ──────────────────────────────────────────────────────────────────
 
diff --git a/packages/sdk/src/cli-resolver.ts b/packages/sdk/src/cli-resolver.ts
index 7e5d5dcb2..a4624bb72 100644
--- a/packages/sdk/src/cli-resolver.ts
+++ b/packages/sdk/src/cli-resolver.ts
@@ -11,7 +11,7 @@ import { accessSync, constants as constantsSync } from 'node:fs';
 import { join } from 'node:path';
 import { homedir } from 'node:os';
 import { promisify } from 'node:util';
-import type { AgentCli } from './workflows/types.js';
+import type { AgentCli } from '@agent-relay/cloud';
 import { getCliDefinition, COMMON_SEARCH_PATHS } from './cli-registry.js';
 
 const execFileAsync = promisify(execFile);
diff --git a/packages/sdk/src/examples/workflow-superiority.ts b/packages/sdk/src/examples/workflow-superiority.ts
deleted file mode 100644
index ef1e2caf3..000000000
--- a/packages/sdk/src/examples/workflow-superiority.ts
+++ /dev/null
@@ -1,1485 +0,0 @@
-/**
- * Workflow Superiority — Multi-Agent Implementation Campaign
- *
- * A fully specified DAG workflow that orchestrates Claude (lead + reviewer)
- * and Codex workers across five implementation tiers to make the relay
- * broker-sdk workflow system decisively superior to Agno and Swarms AI.
- *
- * Architecture:
- *   - Claude lead: orchestrates each phase, approves trajectories, makes
- *     final architectural decisions
- *   - Codex workers: implement code changes, one per specialization domain
- *   - Claude code-reviewer: independent review after every implementation phase
- *     (separate from lead to avoid confirmation bias)
- *
- * DAG phases:
- *   Phase 0 → Codebase analysis + spec approval
- *   Phase 1 → Type system extension (condition/loop/router/hitl/sub-workflow)
- *   Phase 2 → Execution engine (runner handles new primitives + session)
- *   Phase 3 → Meta-orchestration (parallel with Phase 4)
- *   Phase 4 → Storage backends (parallel with Phase 3)
- *   Phase 5 → Deployment & observability
- *   Phase 6 → Integration validation + final lead sign-off
- *
- * Run:
- *   npx tsx src/examples/workflow-superiority.ts
- *
- * Environment:
- *   RELAY_API_KEY — optional. If absent the runner auto-provisions a
- *   fresh Relaycast workspace for each run (fully isolated, no caching).
- */
-
-import { workflow } from '../workflows/builder.js';
-import type { WorkflowEvent } from '../workflows/runner.js';
-
-// ── Spec constants ────────────────────────────────────────────────────────────
-
-const WORKFLOW_ROOT = 'packages/sdk/src/workflows';
-const TYPES_FILE = `${WORKFLOW_ROOT}/types.ts`;
-const RUNNER_FILE = `${WORKFLOW_ROOT}/runner.ts`;
-const BUILDER_FILE = `${WORKFLOW_ROOT}/builder.ts`;
-const SCHEMA_FILE = `${WORKFLOW_ROOT}/schema.json`;
-const INDEX_FILE = `${WORKFLOW_ROOT}/index.ts`;
-const MEMORY_DB = `${WORKFLOW_ROOT}/memory-db.ts`;
-const COORDINATOR = `${WORKFLOW_ROOT}/coordinator.ts`;
-const BARRIER_FILE = `${WORKFLOW_ROOT}/barrier.ts`;
-const TEMPLATES = `${WORKFLOW_ROOT}/templates.ts`;
-
-// NOTE: No withExit() wrapper needed — the WorkflowRunner automatically
-// appends self-termination instructions in spawnAndWait() with the agent's
-// actual runtime name. Adding a second exit instruction wastes tokens.
-
-// ── Event handler ─────────────────────────────────────────────────────────────
-
-const onEvent = (event: WorkflowEvent): void => {
-  const ts = new Date().toISOString();
-  switch (event.type) {
-    case 'run:started':
-      console.log(`[${ts}] 🚀 run started  runId=${event.runId}`);
-      break;
-    case 'run:completed':
-      console.log(`[${ts}] ✅ run complete runId=${event.runId}`);
-      break;
-    case 'run:failed':
-      console.error(`[${ts}] ❌ run failed  runId=${event.runId} error=${event.error}`);
-      break;
-    case 'step:started':
-      console.log(`[${ts}]   → ${event.stepName}`);
-      break;
-    case 'step:completed':
-      console.log(`[${ts}]   ✓ ${event.stepName}`);
-      break;
-    case 'step:failed':
-      console.error(`[${ts}]   ✗ ${event.stepName}: ${event.error}`);
-      break;
-    case 'step:skipped':
-      console.log(`[${ts}]   ⊘ ${event.stepName} (skipped)`);
-      break;
-    case 'step:retrying':
-      console.log(`[${ts}]   ↺ ${event.stepName} attempt=${event.attempt}`);
-      break;
-  }
-};
-
-// ── Workflow definition ───────────────────────────────────────────────────────
-
-const result = await workflow('broker-sdk-superiority')
-  .description(
-    'Five-phase multi-agent campaign to make relay broker-sdk workflow system ' +
-      'decisively superior to Agno and Swarms AI. Claude leads; Codex implements; ' +
-      'Claude reviews after every phase.'
-  )
-  .pattern('dag')
-  .channel('wf-broker-sdk-superiority')
-  .maxConcurrency(3)
-  .timeout(28_800_000) // 8 hours — this is a large implementation campaign
-
-  // ── Agents ────────────────────────────────────────────────────────────────
-
-  .agent('lead', {
-    cli: 'claude',
-    role:
-      'Lead architect. Sets direction, reviews each phase output, approves ' +
-      'trajectories, and resolves architectural conflicts. Has final say on ' +
-      'all design decisions.',
-    retries: 2,
-  })
-
-  .agent('code-reviewer', {
-    cli: 'claude',
-    role:
-      'Independent code reviewer. Reviews implementation quality, correctness, ' +
-      'TypeScript type safety, test coverage, and integration coherence after ' +
-      'every phase. Catches issues the lead may have missed.',
-    retries: 2,
-  })
-
-  .agent('spec-analyst', {
-    cli: 'codex',
-    role:
-      'Codebase analyst. Reads the existing workflow source files and produces ' +
-      'a precise, file-by-file implementation plan for all five improvement tiers.',
-    retries: 2,
-  })
-
-  .agent('schema-implementer', {
-    cli: 'codex',
-    role:
-      'Type system specialist. Extends TypeScript interfaces and JSON Schema ' +
-      'definitions to support new workflow primitives.',
-    retries: 2,
-  })
-
-  .agent('engine-implementer', {
-    cli: 'codex',
-    role:
-      'Execution engine specialist. Implements new step-type execution logic ' +
-      'inside WorkflowRunner, adds session concept, and expands the event system.',
-    retries: 3,
-  })
-
-  .agent('meta-implementer', {
-    cli: 'codex',
-    role:
-      'Meta-orchestration specialist. Implements sub-workflow composition, ' +
-      'AutoWorkflowBuilder, and semantic pattern selection.',
-    retries: 2,
-  })
-
-  .agent('storage-implementer', {
-    cli: 'codex',
-    role:
-      'Storage backend specialist. Implements PostgresWorkflowDb, ' +
-      'SqliteWorkflowDb, and RedisWorkflowDb adapters.',
-    retries: 2,
-  })
-
-  .agent('deploy-implementer', {
-    cli: 'codex',
-    role:
-      'Deployment and observability specialist. Implements relay workflow serve ' +
-      'HTTP server, OTel tracing integration, and CLI improvements.',
-    retries: 2,
-  })
-
-  .agent('test-validator', {
-    cli: 'codex',
-    role:
-      'Integration test specialist. Validates all phases compile, tests pass, ' + 'and exports are correct.',
-    retries: 2,
-  })
-
-  // ── Phase 0: Codebase Analysis ────────────────────────────────────────────
-
-  .step('codebase-analysis', {
-    agent: 'spec-analyst',
-    task: `
-You are the first step in a large improvement campaign for the relay broker-sdk
-workflow system. Your job is to read the existing source files and produce a
-concrete, file-by-file implementation plan.
-
-READ THESE FILES THOROUGHLY:
-  - ${TYPES_FILE}
-  - ${RUNNER_FILE}
-  - ${BUILDER_FILE}
-  - ${SCHEMA_FILE}
-  - ${INDEX_FILE}
-  - ${MEMORY_DB}
-  - ${COORDINATOR}
-  - ${BARRIER_FILE}
-  - ${TEMPLATES}
-
-PRODUCE A DETAILED PLAN covering the following improvements (in priority order):
-
-TIER 1 — Schema Primitives (new step types in types.ts + schema.json):
-  a) condition step: WorkflowStep gains optional "condition" string (CEL expr)
-     and optional "type" discriminant. When condition evaluates false → skip.
-  b) loop step: new LoopStepGroup interface { type:"loop", name, steps[],
-     until?: string (CEL expr on step outputs), maxIterations: number }
-  c) router step: new RouterStepGroup interface { type:"router", name,
-     selector: string (CEL expr), routes: RouterRoute[], default?: string[] }
-     RouterRoute: { match: string, steps: string[] }
-  d) parallel step group: new ParallelStepGroup interface { type:"parallel",
-     name, barrier?: "all"|"any"|"majority", timeout?: number, steps[] }
-  e) hitl step: new HitlStep interface { type:"hitl", name, message: string,
-     channel?: string, timeout?: number, onTimeout?: "skip"|"fail" }
-  f) flow shorthand: RelayYamlConfig gains optional "flow?: string" field,
-     parsed as "A -> B, C -> D" notation generating dependsOn edges
-  g) sub-workflow step: new SubWorkflowStep interface { type:"sub-workflow",
-     name, workflow: string (path or registry name), vars?: Record<string,string> }
-  h) Promote retries + timeoutMs to top-level WorkflowStep fields (they already
-     exist — verify they are exported and used correctly in runner.ts)
-
-TIER 2 — Execution Engine (runner.ts):
-  a) Condition evaluation: before executing a step, if step.condition is set,
-     evaluate the CEL expression; if false, mark step skipped
-  b) Loop execution: LoopStepGroup runs its steps[].steps repeatedly until
-     until-condition is true or maxIterations reached
-  c) Router execution: evaluate selector, match route, execute branch steps
-  d) Parallel group: run steps concurrently with barrier semantics
-  e) HITL execution: pause run, write hitl-pending file, poll for response file
-  f) Sub-workflow: recursively create a WorkflowRunner and execute the referenced
-     config, return its output as the step output
-  g) Session concept: WorkflowRunner gains optional sessionId param; a session
-     groups multiple runs and shares state across them via SessionStore
-  h) Input schema validation: RelayYamlConfig gains optional inputSchema field
-     (JSON Schema object); validate vars before execution begins
-  i) Fallback agent: WorkflowStep gains optional fallbackAgent?: string;
-     if primary agent fails all retries, retry once with fallbackAgent
-  j) Expanded events: add 15+ new WorkflowEvent union members for loop iterations,
-     condition evaluations, router selections, hitl pauses, session updates
-
-TIER 3 — Meta-Orchestration:
-  a) AutoWorkflowBuilder: new exported class that takes a task string and
-     available CLIs, calls a meta-agent to generate RelayYamlConfig, validates
-     it, and returns it (or optionally executes immediately)
-  b) Workflow registry: simple JSON file-based registry at
-     ~/.agent-relay/workflow-registry.json that maps name→path; CLI commands
-     relay workflow list, search, install, publish
-
-TIER 4 — Storage Backends:
-  a) PostgresWorkflowDb: implements WorkflowDb interface using node-postgres (pg)
-     with schema migration on first connect
-  b) SqliteWorkflowDb: implements WorkflowDb using better-sqlite3 (sync API
-     wrapped in async interface)
-  c) RedisWorkflowDb: implements WorkflowDb using ioredis with JSON serialization
-     and optional TTL on run records
-  All three: exported from packages/sdk/src/workflows/db/ submodule
-
-TIER 5 — Deployment & Observability:
-  a) relay workflow serve: new CLI subcommand that starts an Express/Fastify HTTP
-     server exposing POST /run, GET /runs/:id, GET /runs/:id/events (SSE),
-     POST /runs/:id/hitl/:step, POST /runs/:id/abort, GET /health
-  b) OTel tracing: optional otel?: { exportTo: string, endpoint: string,
-     serviceName: string } in RelayYamlConfig; runner creates spans for
-     run start/end and each step start/end using @opentelemetry/sdk-node
-  c) CLI improvements: relay workflow dry-run, relay workflow inspect,
-     relay workflow replay --from <step>
-
-For each tier, specify:
-  1. Which existing files change and what lines/sections to modify
-  2. Which new files to create and their full path
-  3. New TypeScript interface/type definitions (exact syntax)
-  4. New function signatures with JSDoc
-
-Output a structured plan with clear section headers.
-End your output with: ANALYSIS_COMPLETE
-    `,
-    retries: 2,
-    verification: { type: 'output_contains', value: 'ANALYSIS_COMPLETE' },
-  })
-
-  .step('spec-approval', {
-    agent: 'lead',
-    task: `
-Review the codebase analysis produced by the spec-analyst:
-
-{{steps.codebase-analysis.output}}
-
-Your job:
-1. Validate that the plan covers all five tiers correctly
-2. Identify any architectural risks or conflicts (e.g., breaking changes to
-   WorkflowStep that would break existing templates)
-3. Clarify the execution order for each tier
-4. Approve or amend the plan — note any changes clearly
-5. Establish a non-negotiable constraint: ALL existing tests in
-   packages/sdk/src/__tests__/ must remain passing after each phase
-
-Key architectural decisions to make explicit:
-  - How should WorkflowStep handle the new type discriminant without breaking
-    existing YAML that has no "type" field? (answer: type defaults to "agent")
-  - Should LoopStepGroup and RouterStepGroup be separate from WorkflowStep in
-    the types, or unified via a discriminated union?
-  - Is the session concept stored in the same WorkflowDb or a separate SessionDb?
-  - For the hitl step, what is the polling mechanism? (file-based, HTTP endpoint,
-    or webhook?) Choose the simplest that works without requiring a server.
-
-Output a concise approved plan with your decisions. End with: SPEC_APPROVED
-    `,
-    dependsOn: ['codebase-analysis'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'SPEC_APPROVED' },
-  })
-
-  // ── Phase 1: Type System Extension ────────────────────────────────────────
-
-  .step('p1-type-system', {
-    agent: 'schema-implementer',
-    task: `
-Phase 1a: Extend the TypeScript type system for new workflow primitives.
-
-Approved spec context:
-{{steps.spec-approval.output}}
-
-YOUR TASK: Modify ${TYPES_FILE} to add all new types.
-
-SPECIFIC CHANGES:
-
-1. Add a StepType discriminant:
-   export type StepType = "agent" | "condition" | "loop" | "router" | "parallel" | "hitl" | "sub-workflow";
-
-2. Extend WorkflowStep to include new optional fields:
-   - type?: StepType          (default "agent" when absent)
-   - condition?: string       (CEL expression; step skipped if evaluates false)
-   - fallbackAgent?: string   (agent name to use if primary fails all retries)
-
-3. Add new composite step group interfaces:
-
-   export interface LoopStepGroup {
-     type: "loop";
-     name: string;
-     description?: string;
-     steps: WorkflowStep[];
-     until?: string;        // CEL expression evaluated after each iteration
-     maxIterations: number; // required — prevents runaway loops
-     timeoutMs?: number;
-   }
-
-   export interface RouterRoute {
-     match: string;         // CEL expression or substring match
-     steps: string[];       // names of steps to execute for this route
-   }
-
-   export interface RouterStepGroup {
-     type: "router";
-     name: string;
-     description?: string;
-     selector: string;      // CEL expression producing a string value
-     routes: RouterRoute[];
-     default?: string[];    // step names to run if no route matches
-     timeoutMs?: number;
-   }
-
-   export interface ParallelStepGroup {
-     type: "parallel";
-     name: string;
-     description?: string;
-     barrier?: "all" | "any" | "majority"; // default "all"
-     steps: WorkflowStep[];
-     timeoutMs?: number;
-   }
-
-   export interface HitlStep {
-     type: "hitl";
-     name: string;
-     description?: string;
-     message: string;       // human-readable prompt shown to approver
-     channel?: string;      // notification target e.g. "slack:#approvals"
-     timeoutMs?: number;    // how long to wait before applying onTimeout
-     onTimeout?: "skip" | "fail" | "use-default"; // default "fail"
-     defaultResponse?: string; // used when onTimeout is "use-default"
-   }
-
-   export interface SubWorkflowStep {
-     type: "sub-workflow";
-     name: string;
-     description?: string;
-     workflow: string;      // path to relay.yaml or registry name
-     vars?: Record<string, string>; // variable substitutions for the sub-workflow
-     timeoutMs?: number;
-   }
-
-4. Create a union type for any step or step group:
-   export type AnyWorkflowStep =
-     | WorkflowStep
-     | LoopStepGroup
-     | RouterStepGroup
-     | ParallelStepGroup
-     | HitlStep
-     | SubWorkflowStep;
-
-5. Update WorkflowDefinition.steps to use AnyWorkflowStep[]:
-   steps: AnyWorkflowStep[];
-
-6. Add session types:
-   export interface SessionConfig {
-     persist?: boolean;          // default false
-     historyRuns?: number;       // how many prior runs to inject as context
-     ttlMs?: number;
-   }
-
-   export interface SessionRow {
-     id: string;
-     workflowName: string;
-     runIds: string[];
-     stateSnapshot: Record<string, unknown>;
-     createdAt: string;
-     updatedAt: string;
-   }
-
-7. Add inputSchema to RelayYamlConfig:
-   inputSchema?: Record<string, unknown>; // JSON Schema object
-
-8. Add session to RelayYamlConfig:
-   session?: SessionConfig;
-
-9. Expand WorkflowEvent union in runner.ts — ADD to the existing union
-   (note: WorkflowEvent is defined in runner.ts, not types.ts, so create a
-   comment in types.ts pointing to runner.ts where these will be added):
-   // New events will be added to WorkflowEvent in runner.ts:
-   // loop:iteration-started, loop:iteration-completed, loop:ended,
-   // condition:evaluated, condition:skipped, router:evaluated,
-   // parallel:branch-started, parallel:branch-completed,
-   // hitl:paused, hitl:responded, hitl:timeout,
-   // subworkflow:started, subworkflow:completed,
-   // session:state-updated, validation:failed, fallback:agent-switched
-
-10. Export all new types from ${INDEX_FILE}
-
-Make ALL changes. Run: npx tsc --noEmit to verify no type errors.
-End your output with: TYPES_COMPLETE
-    `,
-    dependsOn: ['spec-approval'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'TYPES_COMPLETE' },
-  })
-
-  .step('p1-json-schema', {
-    agent: 'schema-implementer',
-    task: `
-Phase 1b: Update the JSON Schema to match the new TypeScript types.
-
-Prior type changes:
-{{steps.p1-type-system.output}}
-
-YOUR TASK: Update ${SCHEMA_FILE} to add definitions for all new step group types.
-
-Add new $defs entries:
-  - StepType enum definition
-  - LoopStepGroup object with required: [type, name, steps, maxIterations]
-  - RouterRoute object
-  - RouterStepGroup object with required: [type, name, selector, routes]
-  - ParallelStepGroup object with required: [type, name, steps]
-  - HitlStep object with required: [type, name, message]
-  - SubWorkflowStep object with required: [type, name, workflow]
-  - SessionConfig object
-  - AnyWorkflowStep as oneOf the above plus existing WorkflowStep
-
-Update workflow.steps array to use anyOf: [WorkflowStep, AnyWorkflowStep]
-Update top-level RelayYamlConfig to include inputSchema and session properties.
-
-Also update packages/sdk/src/workflows/builder.ts:
-  - Add a new builder method for sessions:
-    session(config: SessionConfig): this
-  - Add a new builder method for input schema:
-    inputSchema(schema: Record<string, unknown>): this
-
-Verify with: cat ${SCHEMA_FILE} | python3 -m json.tool (or equivalent JSON lint)
-End your output with: SCHEMA_COMPLETE
-    `,
-    dependsOn: ['p1-type-system'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'SCHEMA_COMPLETE' },
-  })
-
-  .step('p1-lead-review', {
-    agent: 'lead',
-    task: `
-Phase 1 Lead Review: Validate the type system and schema changes.
-
-Type system changes:
-{{steps.p1-type-system.output}}
-
-Schema changes:
-{{steps.p1-json-schema.output}}
-
-REVIEW CRITERIA:
-1. Do the new TypeScript interfaces correctly model the intended semantics?
-2. Is the AnyWorkflowStep discriminated union correctly structured? Each variant
-   must have a unique "type" literal so TypeScript can narrow the type.
-3. Does the WorkflowStep backward compatibility hold? (existing YAML with no
-   "type" field should still work — type defaults to "agent")
-4. Are the new fields in RelayYamlConfig (inputSchema, session) properly optional?
-5. Does the builder extension make sense? Are the new methods ergonomic?
-6. Any naming inconsistencies between the TypeScript types and JSON Schema?
-
-If you find issues, describe them specifically with file:line references.
-If the phase is acceptable, state what should be fixed in the engine phase.
-End with: PHASE_1_APPROVED (even if you request minor fixes — fixes go to
-the code-reviewer, who will direct the implementer if needed)
-    `,
-    dependsOn: ['p1-json-schema'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'PHASE_1_APPROVED' },
-  })
-
-  .step('p1-code-review', {
-    agent: 'code-reviewer',
-    task: `
-Phase 1 Independent Code Review: TypeScript type system extension.
-(Running in parallel with lead review — review the code independently.)
-
-JSON Schema changes:
-{{steps.p1-json-schema.output}}
-
-YOUR INDEPENDENT REVIEW of ${TYPES_FILE}, ${SCHEMA_FILE}, ${BUILDER_FILE}:
-
-Check:
-1. TypeScript strict-mode compliance — no implicit any, all fields typed
-2. JSDoc on every exported interface and type
-3. Correct use of discriminated unions (each variant's type field is a
-   string literal, not just string)
-4. AnyWorkflowStep is correctly exported from ${INDEX_FILE}
-5. Builder methods follow existing patterns (return this for chaining)
-6. JSON Schema $defs are correctly referenced in anyOf arrays
-7. No circular references in the type definitions
-8. Run: npx tsc --noEmit from packages/sdk and confirm zero errors
-
-List any issues found. For each: file, line (if known), problem, fix required.
-If zero issues: explicitly state "No issues found."
-End with: CODE_REVIEW_1_COMPLETE
-    `,
-    dependsOn: ['p1-json-schema'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'CODE_REVIEW_1_COMPLETE' },
-  })
-
-  // ── Phase 2: Execution Engine ─────────────────────────────────────────────
-
-  .step('p2-condition-loop', {
-    agent: 'engine-implementer',
-    task: `
-Phase 2a: Implement condition + loop execution in the WorkflowRunner.
-
-Phase 1 review context:
-{{steps.p1-code-review.output}}
-
-YOUR TASK: Modify ${RUNNER_FILE} to handle condition and loop step types.
-
-CONDITION STEP EXECUTION:
-In the executeStep method (or wherever individual steps are dispatched):
-1. Check if step.type === "condition" OR if step.condition is set on a regular step
-2. If step.condition exists, evaluate the CEL expression using a lightweight
-   evaluator. Use the cel-js npm package (add to package.json if not present)
-   OR implement a minimal evaluator that handles:
-     - String contains: "X in Y.output"
-     - String equality: "steps.X.output == 'VALUE'"
-     - Boolean AND/OR
-   The expression context object should include:
-     { steps: Record<name, { output: string, status: string }>,
-       vars: VariableContext }
-3. If condition evaluates to false: mark step as "skipped", emit step:skipped event
-4. If condition evaluates to true (or no condition): proceed normally
-
-Also add to WorkflowEvent union in runner.ts:
-  | { type: "condition:evaluated"; runId: string; stepName: string; result: boolean; expression: string }
-  | { type: "condition:skipped"; runId: string; stepName: string }
-
-LOOP STEP GROUP EXECUTION:
-Add a new method: private async executeLoopGroup(loop: LoopStepGroup, ...): Promise<string>
-1. Run loop.steps sequentially up to loop.maxIterations times
-2. After each iteration, evaluate loop.until CEL expression if provided
-3. If until evaluates to true, break and return last step output
-4. If maxIterations reached without satisfaction, fail with descriptive error
-5. Track step outputs by iteration: steps in context include "loop.STEP.output"
-   for the current iteration
-
-Add to WorkflowEvent:
-  | { type: "loop:iteration-started"; runId: string; loopName: string; iteration: number }
-  | { type: "loop:iteration-completed"; runId: string; loopName: string; iteration: number; continuing: boolean }
-  | { type: "loop:ended"; runId: string; loopName: string; reason: "condition-met" | "max-iterations" }
-
-In the main execution loop (findReadySteps / executeSteps), detect when a step
-is a LoopStepGroup and route it to executeLoopGroup.
-
-Run: npx tsc --noEmit to verify.
-End your output with: CONDITION_LOOP_COMPLETE
-    `,
-    dependsOn: ['p1-code-review'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'CONDITION_LOOP_COMPLETE' },
-  })
-
-  .step('p2-input-validation', {
-    agent: 'schema-implementer',
-    task: `
-Phase 2b: Implement input schema validation (runs in parallel with p2-condition-loop).
-
-Phase 1 review context:
-{{steps.p1-code-review.output}}
-
-YOUR TASK: Add input schema validation to WorkflowRunner before execution starts.
-
-In ${RUNNER_FILE}, in the execute() method, BEFORE the first findReadySteps call:
-
-1. If config.inputSchema is defined:
-   a. Import or inline a minimal JSON Schema validator. Use the ajv npm package
-      (add to package.json dependencies if not present).
-   b. Compile the schema: const validate = ajv.compile(config.inputSchema)
-   c. Validate the vars object against the schema
-   d. If invalid: emit { type: "validation:failed", runId, errors: AjvError[] }
-      and throw WorkflowValidationError with a human-readable message listing
-      each field error
-
-2. Add WorkflowValidationError class (extends Error) to runner.ts:
-   export class WorkflowValidationError extends Error {
-     constructor(public readonly errors: unknown[]) {
-       super("Workflow input validation failed: " + JSON.stringify(errors));
-       this.name = "WorkflowValidationError";
-     }
-   }
-
-3. Add to WorkflowEvent:
-   | { type: "validation:failed"; runId: string; errors: unknown[] }
-   | { type: "validation:passed"; runId: string }
-
-4. Export WorkflowValidationError from ${INDEX_FILE}
-
-5. Update builder.ts: add the inputSchema method to WorkflowBuilder that sets
-   config.inputSchema (this was noted in Phase 1 but implement it now if not done)
-
-Run: npx tsc --noEmit to verify.
-End your output with: INPUT_VALIDATION_COMPLETE
-    `,
-    dependsOn: ['p1-code-review'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'INPUT_VALIDATION_COMPLETE' },
-  })
-
-  .step('p2-router-hitl', {
-    agent: 'engine-implementer',
-    task: `
-Phase 2c: Implement router + HITL step execution.
-
-Condition/loop implementation:
-{{steps.p2-condition-loop.output}}
-
-YOUR TASK: Add router and HITL execution to ${RUNNER_FILE}.
-
-ROUTER STEP GROUP EXECUTION:
-Add: private async executeRouterGroup(router: RouterStepGroup, context, ...): Promise<string>
-1. Evaluate router.selector CEL expression to get a string value
-2. Iterate router.routes, find first route where match expression is true
-   (match can be substring check: selectorValue.includes(route.match) or
-   full CEL evaluation depending on complexity)
-3. Collect the branch step names to execute (from route.steps or router.default)
-4. Execute those steps (they must exist in the parent workflow's step list)
-5. Return concatenated outputs of the executed branch steps
-
-Add to WorkflowEvent:
-  | { type: "router:evaluated"; runId: string; routerName: string; selectorValue: string; matchedRoute: string | null }
-  | { type: "router:branch-started"; runId: string; routerName: string; stepName: string }
-
-HITL STEP EXECUTION:
-Add: private async executeHitlStep(hitl: HitlStep, runId: string, ...): Promise<string>
-1. Write a file: {summaryDir}/{runId}/hitl-{hitl.name}-pending.json containing:
-   { runId, stepName: hitl.name, message: hitl.message, channel: hitl.channel,
-     pendingSince: ISO timestamp, timeoutMs: hitl.timeoutMs }
-2. Emit { type: "hitl:paused", runId, stepName, message, channel }
-3. Poll every 5 seconds for a response file:
-   {summaryDir}/{runId}/hitl-{hitl.name}-response.json
-   The response file should contain: { response: string, respondedBy?: string }
-4. If timeoutMs elapses without response:
-   - If onTimeout === "skip": mark step skipped, emit hitl:timeout, return ""
-   - If onTimeout === "use-default": emit hitl:timeout, return hitl.defaultResponse ?? ""
-   - Otherwise (default "fail"): throw Error("HITL step timed out")
-5. On response: delete pending file, emit hitl:responded, return response.response
-
-Add to WorkflowEvent:
-  | { type: "hitl:paused"; runId: string; stepName: string; message: string; channel?: string }
-  | { type: "hitl:responded"; runId: string; stepName: string; response: string; respondedBy?: string }
-  | { type: "hitl:timeout"; runId: string; stepName: string; action: string }
-
-Run: npx tsc --noEmit
-End your output with: ROUTER_HITL_COMPLETE
-    `,
-    dependsOn: ['p2-condition-loop'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'ROUTER_HITL_COMPLETE' },
-  })
-
-  .step('p2-session-fallback', {
-    agent: 'engine-implementer',
-    task: `
-Phase 2d: Implement session concept and fallback agent switching.
-
-Router/HITL implementation:
-{{steps.p2-router-hitl.output}}
-
-YOUR TASK: Extend WorkflowRunner with session support and fallback agents.
-
-SESSION CONCEPT:
-A session groups multiple workflow runs, shares state across them, and can
-inject prior run outputs as context into new runs.
-
-1. Extend WorkflowRunnerOptions in runner.ts:
-   sessionId?: string;   // if provided, this run joins a named session
-
-2. Add a simple SessionStore (in-memory, backed by WorkflowDb if available):
-   - getSession(sessionId): returns { runIds: string[], stateSnapshot: Record }
-   - addRunToSession(sessionId, runId): appends runId to session run list
-   - getSessionHistory(sessionId, n): returns last n run outputs as context string
-
-3. In execute(), if sessionId is provided:
-   a. Load session history (last config.session?.historyRuns ?? 3 runs)
-   b. Prepend history context to the first step's task:
-      "[Session history - prior runs]\n{history}\n[Current task]\n{task}"
-   c. After run completes, call addRunToSession(sessionId, runId)
-
-4. Add to WorkflowEvent:
-   | { type: "session:run-added"; sessionId: string; runId: string }
-   | { type: "session:history-injected"; sessionId: string; historyRuns: number }
-
-FALLBACK AGENT:
-In the step execution method, after all retries on the primary agent are
-exhausted:
-1. Check if step.fallbackAgent is defined
-2. If yes: look up the fallback agent definition by name from config.agents
-3. Re-attempt execution once with the fallback agent
-4. Emit { type: "fallback:agent-switched"; runId, stepName, fromAgent, toAgent }
-5. If fallback also fails: mark step as failed
-
-Add to WorkflowEvent:
-  | { type: "fallback:agent-switched"; runId: string; stepName: string; fromAgent: string; toAgent: string }
-
-Also implement the flow shorthand parser (if RelayYamlConfig.flow is set):
-  parseFlowString("A -> B, C -> D"): WorkflowStep[]
-  - "A -> B" means B.dependsOn = [A]
-  - "B, C" means B and C are in parallel (no dependency between them)
-  - "A, B -> C" means C.dependsOn = [A, B]
-  - Call this in execute() before building the step graph if config.flow is set
-
-Run: npx tsc --noEmit
-End your output with: SESSION_FALLBACK_COMPLETE
-    `,
-    dependsOn: ['p2-router-hitl'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'SESSION_FALLBACK_COMPLETE' },
-  })
-
-  .step('p2-lead-review', {
-    agent: 'lead',
-    task: `
-Phase 2 Lead Review: Execution engine implementation.
-
-Input validation:
-{{steps.p2-input-validation.output}}
-
-Session + fallback:
-{{steps.p2-session-fallback.output}}
-
-REVIEW:
-1. Is the CEL condition evaluator robust enough? Does it handle the common
-   patterns we need (output contains, equality, AND/OR)?
-2. Is the loop execution correctly isolated — do step names inside a loop
-   conflict with top-level step names in the output context?
-3. Is the HITL polling approach acceptable? (file-based polling every 5s)
-   Or should it use a simple readline/stdin approach instead?
-4. Does the session history injection make sense — will agents be overwhelmed
-   by injected context if historyRuns is large?
-5. Is the flow string parser correct for all cases:
-   "A -> B, C -> D" and "A, B -> C"?
-6. Are all new WorkflowEvent variants added to the union consistently?
-
-Note any critical fixes needed before Phase 3 begins.
-End with: PHASE_2_APPROVED
-    `,
-    dependsOn: ['p2-session-fallback', 'p2-input-validation'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'PHASE_2_APPROVED' },
-  })
-
-  .step('p2-code-review', {
-    agent: 'code-reviewer',
-    task: `
-Phase 2 Independent Code Review: Execution engine.
-
-Lead's review:
-{{steps.p2-lead-review.output}}
-
-INDEPENDENT REVIEW of ${RUNNER_FILE}:
-
-1. Correctness: does the condition evaluator correctly handle edge cases
-   (undefined step output, empty strings, non-boolean CEL results)?
-2. Loop safety: is there a guard against infinite loops if maxIterations is 0?
-3. HITL polling: does the polling correctly clean up pending files on both
-   success and timeout paths? No file handle leaks?
-4. Fallback agent: is the agent definition lookup null-safe? What if
-   fallbackAgent name doesn't exist in config.agents?
-5. Session history injection: is it correctly skipped when sessionId is absent?
-6. Flow parser: does it handle edge cases — empty string, single agent,
-   spaces around arrows?
-7. TypeScript: run npx tsc --noEmit and report results
-8. Existing tests: run npx jest packages/sdk and report pass/fail counts
-
-List all issues with specific fixes. State "No issues" for clean sections.
-End with: CODE_REVIEW_2_COMPLETE
-    `,
-    dependsOn: ['p2-lead-review'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'CODE_REVIEW_2_COMPLETE' },
-  })
-
-  // ── Phase 3: Meta-Orchestration (parallel with Phase 4) ───────────────────
-
-  .step('p3-sub-workflow', {
-    agent: 'meta-implementer',
-    task: `
-Phase 3a: Implement sub-workflow step execution.
-
-Phase 2 review context:
-{{steps.p2-code-review.output}}
-
-YOUR TASK: Add sub-workflow composition to ${RUNNER_FILE}.
-
-SUB-WORKFLOW EXECUTION:
-Add: private async executeSubWorkflow(step: SubWorkflowStep, vars, runId, ...): Promise<string>
-1. Resolve the workflow reference:
-   - If step.workflow starts with "./" or "/": treat as file path
-   - Otherwise: look up in the workflow registry at
-     ~/.agent-relay/workflow-registry.json (create if absent; plain JSON map)
-2. Load and parse the referenced relay.yaml file
-3. Merge step.vars with the current run's vars (step.vars take precedence)
-4. Create a new WorkflowRunner instance (child runner), share the same DB
-5. Execute the sub-workflow config via child runner
-6. Return the sub-workflow's run output (join all step outputs)
-
-Add to WorkflowEvent:
-  | { type: "subworkflow:started"; runId: string; stepName: string; workflowRef: string }
-  | { type: "subworkflow:completed"; runId: string; stepName: string; output: string }
-  | { type: "subworkflow:failed"; runId: string; stepName: string; error: string }
-
-WORKFLOW REGISTRY:
-Create packages/sdk/src/workflows/registry.ts:
-
-  export interface WorkflowRegistryEntry {
-    name: string;
-    path: string;
-    description?: string;
-    tags?: string[];
-    installedAt: string;
-  }
-
-  export class WorkflowRegistry {
-    private readonly registryPath: string;
-    // Load registry from ~/.agent-relay/workflow-registry.json
-    async list(): Promise<WorkflowRegistryEntry[]>
-    async get(name: string): Promise<WorkflowRegistryEntry | null>
-    async register(entry: WorkflowRegistryEntry): Promise<void>
-    async unregister(name: string): Promise<void>
-    async resolvePath(nameOrPath: string): Promise<string>
-    // If starts with ./ or / return as-is; else look up in registry
-  }
-
-Export WorkflowRegistry from ${INDEX_FILE}.
-
-Run: npx tsc --noEmit
-End with: SUB_WORKFLOW_COMPLETE
-    `,
-    dependsOn: ['p2-code-review'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'SUB_WORKFLOW_COMPLETE' },
-  })
-
-  .step('p3-auto-builder', {
-    agent: 'meta-implementer',
-    task: `
-Phase 3b: Implement AutoWorkflowBuilder.
-
-Sub-workflow implementation:
-{{steps.p3-sub-workflow.output}}
-
-YOUR TASK: Create packages/sdk/src/workflows/auto-builder.ts
-
-The AutoWorkflowBuilder analyzes a task description and uses a meta-agent
-to generate a complete RelayYamlConfig automatically.
-
-  export interface AutoBuildOptions {
-    availableClis?: AgentCli[];   // defaults to ["claude", "codex"]
-    maxAgents?: number;           // defaults to 5
-    maxSteps?: number;            // defaults to 10
-    preferredPattern?: SwarmPattern;
-    dryRun?: boolean;             // if true, return config without executing
-    metaCli?: AgentCli;           // CLI to use for the meta-agent (default "claude")
-  }
-
-  export interface AutoBuildResult {
-    config: RelayYamlConfig;
-    yaml: string;
-    reasoning: string;  // why the meta-agent chose this structure
-    run?: WorkflowRunRow; // present if dryRun is false
-  }
-
-  export class AutoWorkflowBuilder {
-    constructor(private readonly options: AutoBuildOptions = {}) {}
-
-    async build(task: string): Promise<AutoBuildResult> {
-      // 1. Construct a meta-prompt that instructs the meta-agent to:
-      //    a. Analyze the task
-      //    b. Select the best swarm pattern
-      //    c. Define agents (using available CLIs)
-      //    d. Define workflow steps with appropriate dependencies
-      //    e. Output a valid relay.yaml string (fenced in \`\`\`yaml...\`\`\`)
-      //    f. Explain its reasoning
-      // 2. Spawn the meta-agent via AgentRelay
-      // 3. Extract the YAML from the response (find \`\`\`yaml ... \`\`\` block)
-      // 4. Parse and validate the config using WorkflowRunner.parseYamlString
-      // 5. If dryRun: return { config, yaml, reasoning }
-      // 6. Else: execute via WorkflowRunner and return { config, yaml, reasoning, run }
-    }
-
-    // Convenience: build and run immediately
-    async run(task: string): Promise<WorkflowRunRow> {
-      const result = await this.build(task);
-      if (!result.run) throw new Error("Set dryRun: false to execute");
-      return result.run;
-    }
-  }
-
-  // Convenience export
-  export async function autoWorkflow(task: string, options?: AutoBuildOptions): Promise<AutoBuildResult> {
-    return new AutoWorkflowBuilder(options).build(task);
-  }
-
-Export AutoWorkflowBuilder and autoWorkflow from ${INDEX_FILE}.
-
-Also add the meta-workflow type to types.ts if not already done:
-  export type MetaWorkflowConfig = RelayYamlConfig & { type: "meta-workflow" };
-  (A meta-workflow is a relay.yaml where steps are sub-workflow steps)
-
-Run: npx tsc --noEmit
-End with: AUTO_BUILDER_COMPLETE
-    `,
-    dependsOn: ['p3-sub-workflow'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'AUTO_BUILDER_COMPLETE' },
-  })
-
-  // ── Phase 4: Storage Backends (parallel with Phase 3) ────────────────────
-
-  .step('p4-db-adapters', {
-    agent: 'storage-implementer',
-    task: `
-Phase 4: Implement production-ready WorkflowDb adapters.
-(Runs in parallel with Phase 3 — no dependency between them.)
-
-Phase 2 review context:
-{{steps.p2-code-review.output}}
-
-Create a new directory: packages/sdk/src/workflows/db/
-
-Create these files:
-
-1. packages/sdk/src/workflows/db/postgres.ts
-   export class PostgresWorkflowDb implements WorkflowDb {
-     constructor(options: { connectionString: string; tablePrefix?: string })
-     // Creates tables on first connect if they don't exist:
-     //   {prefix}workflow_runs, {prefix}workflow_steps
-     // Schema mirrors WorkflowRunRow and WorkflowStepRow
-     // Uses node-postgres (pg) — add to package.json if absent
-     async insertRun(run: WorkflowRunRow): Promise<void>
-     async updateRun(id: string, patch: Partial<WorkflowRunRow>): Promise<void>
-     async getRun(id: string): Promise<WorkflowRunRow | null>
-     async insertStep(step: WorkflowStepRow): Promise<void>
-     async updateStep(id: string, patch: Partial<WorkflowStepRow>): Promise<void>
-     async getStepsByRunId(runId: string): Promise<WorkflowStepRow[]>
-     async close(): Promise<void>
-   }
-
-2. packages/sdk/src/workflows/db/sqlite.ts
-   export class SqliteWorkflowDb implements WorkflowDb {
-     constructor(options: { path: string; tablePrefix?: string })
-     // Uses better-sqlite3 — synchronous API wrapped in async methods
-     // Same schema as PostgresWorkflowDb
-     // Creates tables if they don't exist on construction
-   }
-
-3. packages/sdk/src/workflows/db/redis.ts
-   export class RedisWorkflowDb implements WorkflowDb {
-     constructor(options: {
-       url: string;
-       keyPrefix?: string;  // default "relay:workflow:"
-       runTtlMs?: number;   // optional TTL on run records
-     })
-     // Uses ioredis — add to package.json if absent
-     // Stores runs as JSON strings at key: {prefix}run:{id}
-     // Stores step lists at key: {prefix}steps:{runId} (Redis list)
-     // Stores individual steps at: {prefix}step:{id}
-   }
-
-4. packages/sdk/src/workflows/db/index.ts
-   export { PostgresWorkflowDb } from './postgres.js';
-   export { SqliteWorkflowDb } from './sqlite.js';
-   export { RedisWorkflowDb } from './redis.js';
-
-5. Update packages/sdk/src/workflows/index.ts to export from db/:
-   export * from './db/index.js';
-
-IMPORTANT: Add the three packages to package.json as optional peer dependencies
-with peerDependenciesMeta markings optional: true, so users only need to install
-the adapter they use.
-
-Run: npx tsc --noEmit (adapters will have type errors only if packages are absent;
-mark them as type-only imports with // @ts-expect-error if needed with clear comment)
-End with: DB_ADAPTERS_COMPLETE
-    `,
-    dependsOn: ['p2-code-review'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'DB_ADAPTERS_COMPLETE' },
-  })
-
-  // ── Phase 3+4 Combined Review ─────────────────────────────────────────────
-
-  .step('p34-lead-review', {
-    agent: 'lead',
-    task: `
-Phase 3+4 Lead Review: Meta-orchestration and storage backends.
-
-Phase 3 — AutoBuilder:
-{{steps.p3-auto-builder.output}}
-
-Phase 4 — DB adapters:
-{{steps.p4-db-adapters.output}}
-
-REVIEW:
-
-META-ORCHESTRATION:
-1. Is the sub-workflow execution correctly isolated? (child runner should not
-   share the parent runner's event listeners, but should share the DB)
-2. Does the WorkflowRegistry file path (~/.agent-relay/) correctly use os.homedir()?
-3. Is the AutoWorkflowBuilder meta-prompt clear enough to reliably generate
-   valid relay.yaml configs? What guardrails are needed?
-4. Does the YAML extraction from meta-agent output handle cases where the
-   agent outputs multiple code blocks?
-
-DB ADAPTERS:
-5. Are the SQL schemas in PostgresWorkflowDb and SqliteWorkflowDb correct?
-   (JSON columns for config/stateSnapshot, TEXT for status, ISO timestamps)
-6. Is the Redis adapter correctly handling concurrent updates?
-   (Multiple parallel steps updating the same run record — race condition risk)
-7. Are optional peer dependencies correctly marked in package.json?
-8. Do the adapters correctly handle NULL/missing optional fields?
-
-State fixes needed for the code reviewer to validate.
-End with: PHASE_34_APPROVED
-    `,
-    dependsOn: ['p3-auto-builder', 'p4-db-adapters'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'PHASE_34_APPROVED' },
-  })
-
-  .step('p34-code-review', {
-    agent: 'code-reviewer',
-    task: `
-Phase 3+4 Independent Code Review.
-
-Lead's notes:
-{{steps.p34-lead-review.output}}
-
-REVIEW packages/sdk/src/workflows/registry.ts,
-       packages/sdk/src/workflows/auto-builder.ts,
-       packages/sdk/src/workflows/db/:
-
-1. Registry: does resolvePath correctly return file paths unchanged and look up
-   by name for non-path strings? Is the registry JSON correctly pretty-printed?
-2. AutoBuilder: is the meta-prompt templating safe from injection if the task
-   string contains special characters or YAML-like content?
-3. PostgresWorkflowDb: are SQL queries parameterized? (No string interpolation
-   in SQL — security requirement)
-4. SqliteWorkflowDb: does the sync API wrap correctly without blocking the event
-   loop for extended periods?
-5. RedisWorkflowDb: is the JSON serialization of WorkflowRunRow round-trip safe?
-   (dates become strings, Record<string,unknown> stays correct)
-6. All three adapters: does getStepsByRunId return steps in consistent order?
-7. Run npx tsc --noEmit and report results
-
-List issues with specific file + line references.
-End with: CODE_REVIEW_34_COMPLETE
-    `,
-    dependsOn: ['p34-lead-review'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'CODE_REVIEW_34_COMPLETE' },
-  })
-
-  // ── Phase 5: Deployment and Observability ─────────────────────────────────
-
-  .step('p5-serve-command', {
-    agent: 'deploy-implementer',
-    task: `
-Phase 5a: Implement "relay workflow serve" HTTP server.
-
-Phase 3+4 review context:
-{{steps.p34-code-review.output}}
-
-YOUR TASK: Create packages/sdk/src/workflows/server.ts
-
-Implement a lightweight HTTP server (use Node.js built-in http module — no
-Express/Fastify dependency) that exposes:
-
-  POST /run
-    Body: { workflowPath: string, vars?: VariableContext, sessionId?: string }
-    Response: { runId: string, status: "started" }
-    Behavior: parse the relay.yaml at workflowPath, start execution (non-blocking),
-    return runId immediately
-
-  GET /runs/:runId
-    Response: WorkflowRunRow | { error: "not found" }
-
-  GET /runs/:runId/events
-    Response: text/event-stream (Server-Sent Events)
-    Each WorkflowEvent becomes a SSE data: {json}\n\n line
-    Connection stays open until run completes or client disconnects
-
-  POST /runs/:runId/hitl/:stepName/respond
-    Body: { response: string, respondedBy?: string }
-    Behavior: write {summaryDir}/{runId}/hitl-{stepName}-response.json
-    Response: { ok: true }
-
-  POST /runs/:runId/abort
-    Behavior: call runner.abort(runId) if supported
-    Response: { ok: true }
-
-  GET /health
-    Response: { status: "ok", uptime: process.uptime() }
-
-Also create packages/sdk/src/workflows/serve.ts — the CLI entry point:
-  export async function serveWorkflows(options: {
-    port?: number;     // default 3747
-    host?: string;     // default "0.0.0.0"
-    db?: WorkflowDb;
-  }): Promise<void>
-
-Export serveWorkflows from ${INDEX_FILE}.
-
-The serve command will be integrated into the relay CLI in the next step.
-
-Run: npx tsc --noEmit
-End with: SERVE_COMMAND_COMPLETE
-    `,
-    dependsOn: ['p34-code-review'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'SERVE_COMMAND_COMPLETE' },
-  })
-
-  .step('p5-otel-tracing', {
-    agent: 'deploy-implementer',
-    task: `
-Phase 5b: Implement OpenTelemetry tracing integration.
-(Running in parallel with p5-serve-command — these are independent.)
-
-Phase 3+4 review context:
-{{steps.p34-code-review.output}}
-
-YOUR TASK: Add optional OTel tracing to WorkflowRunner.
-
-1. Add otel config to RelayYamlConfig in types.ts (if not already present):
-   telemetry?: {
-     otel?: boolean;              // enable OTel tracing
-     endpoint?: string;           // OTLP endpoint, default "http://localhost:4318"
-     serviceName?: string;        // default "relay-workflows"
-     exportTo?: "otlp" | "console" | "none";  // default "otlp"
-   }
-
-2. Create packages/sdk/src/workflows/tracing.ts:
-
-   export interface TracingOptions {
-     enabled: boolean;
-     endpoint?: string;
-     serviceName?: string;
-     exportTo?: "otlp" | "console" | "none";
-   }
-
-   export class WorkflowTracer {
-     constructor(options: TracingOptions) {}
-
-     // Create root span for workflow run
-     startRun(runId: string, workflowName: string, pattern: string): Span
-
-     // Create child span for a step
-     startStep(parentSpan: Span, stepName: string, agentName: string): Span
-
-     // Record events on spans
-     recordEvent(span: Span, event: WorkflowEvent): void
-
-     // End spans
-     endSpan(span: Span, status: "ok" | "error", error?: string): void
-
-     // Shutdown exporter cleanly
-     async shutdown(): Promise<void>
-   }
-
-Use @opentelemetry/sdk-node and @opentelemetry/api (add as optional peer deps
-with peerDependenciesMeta optional: true in package.json).
-
-Guard all OTel imports with a try/catch or dynamic import so the runner works
-without OTel installed:
-  let tracer: WorkflowTracer | null = null;
-  try {
-    const { WorkflowTracer } = await import('./tracing.js');
-    tracer = new WorkflowTracer(config.telemetry?.otel ? { enabled: true, ...config.telemetry } : { enabled: false });
-  } catch {
-    // OTel packages not installed — tracing disabled
-  }
-
-3. In WorkflowRunner.execute():
-   - If tracer enabled: create root run span
-   - In executeStep(): create child step span, record start/complete/fail events
-   - On run complete: end root span
-
-Export WorkflowTracer from ${INDEX_FILE}.
-
-Run: npx tsc --noEmit
-End with: OTEL_TRACING_COMPLETE
-    `,
-    dependsOn: ['p34-code-review'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'OTEL_TRACING_COMPLETE' },
-  })
-
-  .step('p5-cli-improvements', {
-    agent: 'deploy-implementer',
-    task: `
-Phase 5c: Implement CLI improvements.
-
-OTel tracing implementation:
-{{steps.p5-otel-tracing.output}}
-
-YOUR TASK: Find the CLI entry point for the relay workflow commands and add:
-
-First, locate the CLI code (likely in packages/sdk/src/workflows/cli.ts):
-  cat packages/sdk/src/workflows/cli.ts
-
-Add these subcommands to the workflow CLI:
-
-1. relay workflow dry-run <yaml-path> [--var KEY=VALUE...]
-   - Parse and validate the YAML (run validateConfig)
-   - Resolve variable templates (show substituted values)
-   - Show the resolved DAG: step names, dependencies, agent assignments
-   - Show which steps can run in parallel
-   - Do NOT actually execute — print "DRY RUN: would execute N steps across M agents"
-
-2. relay workflow inspect <yaml-path>
-   - Show full config parsed and pretty-printed as JSON
-   - Show detected swarm pattern with reason
-   - Show agent topology (edges from SwarmCoordinator)
-   - Show barrier definitions
-   - Show coordination config
-
-3. relay workflow replay <runId> --from <step-name> [--db-path <sqlite-path>]
-   - Load existing run record from DB (requires SqliteWorkflowDb)
-   - Skip steps that completed successfully before the target step
-   - Re-execute from the specified step name onwards
-   - Useful for resuming failed runs without restarting from scratch
-
-4. relay workflow serve [--port <N>] [--db sqlite:<path>|postgres:<url>|redis:<url>]
-   - Starts the HTTP server from p5-serve-command
-   - Accepts DB connection string via --db flag, parses the scheme prefix
-
-Also update the README at packages/sdk/src/workflows/README.md to document
-all new CLI commands with usage examples.
-
-Run: npx tsc --noEmit
-End with: CLI_IMPROVEMENTS_COMPLETE
-    `,
-    dependsOn: ['p5-serve-command', 'p5-otel-tracing'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'CLI_IMPROVEMENTS_COMPLETE' },
-  })
-
-  .step('p5-lead-review', {
-    agent: 'lead',
-    task: `
-Phase 5 Lead Review: Deployment and observability.
-
-Serve command:
-{{steps.p5-serve-command.output}}
-
-OTel tracing:
-{{steps.p5-otel-tracing.output}}
-
-CLI improvements:
-{{steps.p5-cli-improvements.output}}
-
-REVIEW:
-1. HTTP server: is SSE implemented correctly? (headers: Content-Type: text/event-stream,
-   Cache-Control: no-cache, Connection: keep-alive; proper flushing with res.write)
-2. HTTP server: is the HITL respond endpoint correctly writing the response file
-   to the same path the runner is polling?
-3. OTel: is the dynamic import guard (try/catch) robust? Will it work in CJS builds?
-4. OTel: are span hierarchies correct — run span is parent, step spans are children?
-5. CLI dry-run: does it show enough information to be useful for debugging?
-6. CLI replay: what happens if a replay step depends on a step that was NOT
-   completed in the prior run? (Should fail with clear error message.)
-7. Is the README updated with accurate examples?
-
-Note critical fixes. End with: PHASE_5_APPROVED
-    `,
-    dependsOn: ['p5-cli-improvements'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'PHASE_5_APPROVED' },
-  })
-
-  .step('p5-code-review', {
-    agent: 'code-reviewer',
-    task: `
-Phase 5 Independent Code Review: Deployment and observability.
-(Running in parallel with lead review — review the code independently.)
-
-CLI improvements:
-{{steps.p5-cli-improvements.output}}
-
-REVIEW packages/sdk/src/workflows/server.ts,
-       packages/sdk/src/workflows/tracing.ts,
-       packages/sdk/src/workflows/cli.ts:
-
-1. HTTP server: no prototype pollution risk in request body parsing?
-   (Validate Content-Type, parse JSON safely with try/catch)
-2. SSE endpoint: does it correctly handle client disconnect without leaving
-   zombie event listeners on the WorkflowRunner?
-3. HITL respond: path traversal risk? (runId and stepName used in file path —
-   must sanitize to alphanumeric + hyphen only)
-4. OTel: does shutdown() await the exporter flush before process.exit?
-5. CLI replay: is the step-skip logic correct? (A skipped-previously-completed
-   step should return its stored output for downstream template resolution)
-6. Run npx jest packages/sdk and report pass/fail counts
-7. Run npx tsc --noEmit and report results
-
-End with: CODE_REVIEW_5_COMPLETE
-    `,
-    dependsOn: ['p5-cli-improvements'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'CODE_REVIEW_5_COMPLETE' },
-  })
-
-  // ── Phase 6: Integration Validation + Final Sign-Off ─────────────────────
-
-  .step('integration-validation', {
-    agent: 'test-validator',
-    task: `
-Phase 6: Integration validation across all five tiers.
-
-Phase 5 review:
-{{steps.p5-code-review.output}}
-
-YOUR TASK: Run comprehensive validation of the full implementation.
-
-1. TYPE CHECK:
-   cd packages/sdk && npx tsc --noEmit
-   Report: zero errors or list all errors
-
-2. EXISTING TESTS:
-   npx jest packages/sdk/src/__tests__/
-   Report: pass count, fail count, any failures
-
-3. BUILD:
-   cd packages/sdk && npm run build
-   Report: success or errors
-
-4. INTEGRATION SMOKE TESTS — run each of these and report output:
-
-   a. Condition step test:
-      Create a temporary relay.yaml with a condition step that checks if
-      "SKIP" is in a prior step's output, run it via the WorkflowRunner
-      in TypeScript (programmatic, not CLI), verify the step is skipped.
-
-   b. Loop step test:
-      Create a temporary relay.yaml with a loop that runs max 3 iterations,
-      verify it runs exactly 3 times when until-condition is never met.
-
-   c. Input validation test:
-      Create a RelayYamlConfig with inputSchema requiring a "task" field,
-      call runner.execute() without "task" in vars, verify WorkflowValidationError
-      is thrown.
-
-   d. Flow shorthand test:
-      Parse the flow string "planner -> developer, reviewer -> lead" and verify
-      that developer.dependsOn = ["planner"], reviewer.dependsOn = ["planner"],
-      lead.dependsOn = ["developer", "reviewer"].
-
-   e. SqliteWorkflowDb test:
-      Create an in-memory SQLite DB, insert a run, update it, retrieve it,
-      verify round-trip fidelity of all fields.
-
-5. EXPORTS CHECK:
-   Verify that the following are exported from packages/sdk/src/workflows/index.ts:
-   - WorkflowBuilder, workflow
-   - WorkflowRunner, WorkflowRunnerOptions, WorkflowEvent, WorkflowEventListener
-   - WorkflowValidationError
-   - AutoWorkflowBuilder, autoWorkflow
-   - WorkflowRegistry
-   - SqliteWorkflowDb, PostgresWorkflowDb, RedisWorkflowDb
-   - WorkflowTracer
-   - All new types: AnyWorkflowStep, LoopStepGroup, RouterStepGroup,
-     ParallelStepGroup, HitlStep, SubWorkflowStep, SessionConfig
-
-Report full results. End with: INTEGRATION_VALIDATED
-    `,
-    dependsOn: ['p5-code-review', 'p5-lead-review'],
-    retries: 2,
-    verification: { type: 'output_contains', value: 'INTEGRATION_VALIDATED' },
-  })
-
-  .step('final-lead-review', {
-    agent: 'lead',
-    task: `
-FINAL LEAD REVIEW: Complete broker-sdk workflow superiority implementation.
-
-Integration validation results:
-{{steps.integration-validation.output}}
-
-This is the culmination of a five-phase implementation campaign. Your job:
-
-1. CAPABILITY AUDIT — verify we now have all of these (check integration results):
-   □ condition step type (CEL-based conditional execution)
-   □ loop step type (iterative with until-condition)
-   □ router step type (runtime branch selection)
-   □ parallel step group (explicit with any/majority barriers)
-   □ HITL step type (human-in-the-loop with file-based pause/resume)
-   □ sub-workflow step (workflow composition)
-   □ flow shorthand (string notation "A -> B, C")
-   □ session concept (multi-run state sharing)
-   □ input schema validation (JSON Schema via Ajv)
-   □ fallback agent switching
-   □ AutoWorkflowBuilder (LLM-generated workflows)
-   □ WorkflowRegistry (name-to-path resolution)
-   □ PostgresWorkflowDb, SqliteWorkflowDb, RedisWorkflowDb
-   □ HTTP serve command with SSE event streaming
-   □ OTel tracing (optional, dynamic import)
-   □ CLI: dry-run, inspect, replay, serve
-   □ 30+ WorkflowEvent types
-   □ All exports correct from index.ts
-
-2. COMPETITIVE POSITION — confirm we now surpass:
-   AGNO: We have everything Agno has (condition=Condition, loop=Loop,
-   router=Router, session, input validation, serve, OTel) PLUS barriers,
-   consensus, HITL, polyglot backends, YAML portability, sub-workflow composition.
-
-   SWARMS: We have equivalent patterns PLUS out-of-process PTY isolation,
-   YAML portability, true relay protocol, HITL, OTel, sub-workflow composition,
-   HTTP serve. Swarms has more built-in swarm types (15+ vs our 10) but we
-   cover all critical execution patterns with richer composition primitives.
-
-3. REMAINING GAPS (if any) — list anything that was not fully implemented
-   and should be tracked as future work.
-
-4. DOCUMENTATION — confirm README.md in the workflows directory is updated
-   with examples for all new features.
-
-Produce a final capability report with the checklist above filled in.
-End with: IMPLEMENTATION_COMPLETE
-    `,
-    dependsOn: ['integration-validation'],
-    retries: 1,
-    verification: { type: 'output_contains', value: 'IMPLEMENTATION_COMPLETE' },
-  })
-
-  .onError('retry', { maxRetries: 2, retryDelayMs: 10_000 })
-
-  .run({
-    onEvent,
-    vars: {
-      // Override these at runtime if needed:
-      // workflowRoot: 'packages/sdk/src/workflows',
-    },
-  });
-
-console.log('\n── Run complete ─────────────────────────────────────────────────');
-console.log(`status:      ${result.status}`);
-console.log(`runId:       ${result.id}`);
-console.log(`workflow:    ${result.workflowName}`);
-console.log(`pattern:     ${result.pattern}`);
-console.log(`started:     ${result.startedAt}`);
-console.log(`completed:   ${result.completedAt ?? '—'}`);
-if (result.error) {
-  console.error(`error:       ${result.error}`);
-}
diff --git a/packages/sdk/src/examples/workflows/README.md b/packages/sdk/src/examples/workflows/README.md
deleted file mode 100644
index 199ec8408..000000000
--- a/packages/sdk/src/examples/workflows/README.md
+++ /dev/null
@@ -1,156 +0,0 @@
-# Super-Powered Ralph Loops
-
-These workflows are the agent-relay take on the [Ralph Wiggum technique](https://github.com/mikeyobrien/ralph-orchestrator) — autonomous AI agents looping on a codebase until work is done. Where vanilla ralph runs one agent at a time, these workflows run **squads of specialists** with real quality gates, multi-model assignment, and observable coordination.
-
-## What makes these different
-
-| Vanilla Ralph                  | agent-relay Ralph                                                   |
-| ------------------------------ | ------------------------------------------------------------------- |
-| 1 agent per loop               | 2–10 agents per loop                                                |
-| Single model                   | Multi-model (opus plans, sonnet leads, codex builds, gemini audits) |
-| Agent checks its own work      | Independent reviewer with no confirmation bias                      |
-| Polling for completion signals | DAG-based wave scheduling with verification gates                   |
-| No parallelism                 | Workers implement features simultaneously                           |
-| One retry strategy             | Per-step `maxIterations` + global `errorHandling`                   |
-| No observability               | Trajectories, Relaycast channels, step output chaining              |
-
----
-
-## `ralph-tdd.yaml` — Test-Driven Loop
-
-**Best for:** Projects with an existing test framework where correctness is the priority.
-
-```
-architect writes failing tests
-         ↓
-builder implements to pass them (maxIterations: 3)
-         ↓
-npm test / pytest / go test  ←── deterministic gate
-         ↓
-arch-review ──┐
-              ├── both must PASS (consensus: unanimous)
-sec-review  ──┘
-         ↓
-address feedback (maxIterations: 2)
-         ↓
-commit + record learnings → next story
-```
-
-**Key agents:** 3 (architect/sonnet, builder/codex, reviewer/opus)
-**Key feature:** Tests are written BEFORE implementation. Reviewer is separate from architect — no confirmation bias.
-
-```bash
-PRD_PATH=my-prd.json QUALITY_CMD="npm test" \
-  node packages/sdk/dist/workflows/cli.js ralph-tdd.yaml
-```
-
----
-
-## `ralph-swarm.yaml` — Parallel Implementation Squad
-
-**Best for:** Large backlogs where work can be decomposed into independent tasks.
-
-```
-tech-lead decomposes PRD into 5 atomic tasks
-         ↓
-worker-1 ──┐
-worker-2   │
-worker-3   ├── all 5 implement in parallel
-worker-4   │
-worker-5 ──┘
-         ↓
-npm test / tsc / lint  ←── gate
-         ↓
-fix-failures (if gate red)
-         ↓
-review-correctness ──┐
-review-architecture  ├── all 3 must PASS
-review-security    ──┘
-         ↓
-consensus → address rework → commit → loop
-```
-
-**Key agents:** 10 (opus tech-lead, 5 codex workers, 2 claude reviewers, gemini security auditor)
-**Key feature:** 5x parallelism. Three independent reviewers. Gemini on security catches what Claude misses.
-
-```bash
-PRD_PATH=my-prd.json \
-  node packages/sdk/dist/workflows/cli.js ralph-swarm.yaml
-```
-
----
-
-## `ralph-overnight.yaml` — 24-Hour Autonomous Session
-
-**Best for:** Long sessions where you want to drop a repo before bed and wake up to PRs.
-
-```
-product-manager reads backlog, prioritizes, assigns to squads
-         ↓
-tech-lead plans architecture, creates feature branch
-         ↓
-squad-alpha (lead + 2 codex builders) ──┐
-                                         ├── parallel on different files
-squad-beta  (lead + 2 codex builders) ──┘
-         ↓
-full CI gate (lint + tsc + npm test)
-         ↓
-qa-engineer writes integration tests ──┐
-                                        ├── parallel
-security-auditor (gemini) audits     ──┘
-         ↓
-tech-lead reviews → fix if needed
-         ↓
-git push → gh pr create (draft)
-         ↓
-PM writes session-log.txt morning summary
-→ mark stories complete → next batch
-```
-
-**Key agents:** 10 (PM/opus, tech-lead/sonnet, 2 squad leads/sonnet, 4 codex builders, QA/sonnet, security/gemini-pro)
-**Key feature:** True hierarchical org. PM → Tech Lead → Squads. Morning report written to `session-log.txt`. Runs safely overnight with `errorHandling: continue` (one story failure doesn't kill the session).
-
-```bash
-BACKLOG_PATH=my-backlog.json SESSION_LOG=session-log.txt \
-  node packages/sdk/dist/workflows/cli.js ralph-overnight.yaml
-```
-
----
-
-## Running any of these
-
-```bash
-# Preview the execution plan without spending tokens
-DRY_RUN=1 node packages/sdk/dist/workflows/cli.js ralph-tdd.yaml
-
-# Run for real
-node packages/sdk/dist/workflows/cli.js ralph-tdd.yaml
-
-# Watch Relaycast for live agent communication
-# → open https://relaycast.dev and join the workflow's channel
-```
-
-## PRD / Backlog format
-
-These workflows expect a JSON file with your stories:
-
-```json
-{
-  "branchName": "feature/my-project",
-  "userStories": [
-    {
-      "id": "US-001",
-      "title": "User can log in with email",
-      "description": "Implement email/password authentication",
-      "acceptanceCriteria": [
-        "POST /auth/login returns 200 with JWT on valid credentials",
-        "Returns 401 on invalid credentials",
-        "Passwords are bcrypt hashed"
-      ],
-      "passes": false
-    }
-  ]
-}
-```
-
-For `ralph-overnight.yaml`, use `backlog.json` with `priority` and `effort` fields.
diff --git a/packages/sdk/src/examples/workflows/fix-dashboard-user-registration.yaml b/packages/sdk/src/examples/workflows/fix-dashboard-user-registration.yaml
deleted file mode 100644
index e79be11bd..000000000
--- a/packages/sdk/src/examples/workflows/fix-dashboard-user-registration.yaml
+++ /dev/null
@@ -1,182 +0,0 @@
-version: '1.0'
-name: fix-dashboard-user-registration
-description: >
-  Fixes the dashboard agent registration so the user registers as the current
-  system user (whoami / os.userInfo().username) instead of the cwd directory name.
-
-  Currently, both relaycast-provider.ts and proxy-server.ts in relay-dashboard
-  derive projectIdentity from path.basename(path.resolve(dataDir, '..')) — which
-  gives the working directory name. This workflow changes both to use
-  os.userInfo().username so the registered name reflects the actual user.
-
-swarm:
-  pattern: pipeline
-  channel: wf-fix-dashboard-user-reg
-  maxConcurrency: 3
-  timeoutMs: 1200000 # 20 min
-
-agents:
-  - name: implementer
-    cli: claude
-    preset: worker
-    role: 'Makes targeted edits to two dashboard-server files to use os.userInfo().username instead of path.basename(cwd).'
-    constraints:
-      model: sonnet
-
-  - name: reviewer
-    cli: claude
-    preset: reviewer
-    role: 'Reviews the diff to confirm correctness and no unintended side effects.'
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: default
-    onError: fail-fast
-
-    steps:
-      # ── Phase 1: Capture current code for context injection ──────────────────
-
-      - name: read-relaycast-provider
-        type: deterministic
-        command: >
-          sed -n '1,15p' ../relay-dashboard/packages/dashboard-server/src/relaycast-provider.ts &&
-          echo "---" &&
-          sed -n '80,100p' ../relay-dashboard/packages/dashboard-server/src/relaycast-provider.ts
-        captureOutput: true
-        failOnError: true
-
-      - name: read-proxy-server
-        type: deterministic
-        command: >
-          grep -n "^import" ../relay-dashboard/packages/dashboard-server/src/proxy-server.ts | head -20 &&
-          echo "---" &&
-          sed -n '205,220p' ../relay-dashboard/packages/dashboard-server/src/proxy-server.ts
-        captureOutput: true
-        failOnError: true
-
-      # ── Phase 2: Implement the fix ───────────────────────────────────────────
-
-      - name: implement
-        type: agent
-        agent: implementer
-        dependsOn: [read-relaycast-provider, read-proxy-server]
-        task: |
-          Fix two files in the relay-dashboard package so the dashboard user registers
-          with the system username instead of the cwd directory name.
-
-          ── File 1: ../relay-dashboard/packages/dashboard-server/src/relaycast-provider.ts ──
-
-          Current imports and loadRelaycastConfig function:
-          {{steps.read-relaycast-provider.output}}
-
-          Changes required:
-          1. Add `import os from 'node:os';` after the existing `import path from 'path';` line.
-          2. In the `loadRelaycastConfig` function, replace:
-               const projectDir = path.basename(path.resolve(dataDir, '..'));
-             with:
-               const projectIdentity = os.userInfo().username;
-          3. Remove the line `const projectIdentity = projectDir.trim();` (it's now set above).
-          4. The return statement `return { apiKey: envApiKey, baseUrl, projectIdentity };` stays the same.
-
-          ── File 2: ../relay-dashboard/packages/dashboard-server/src/proxy-server.ts ──
-
-          Current imports and resolveRelaycastConfig function:
-          {{steps.read-proxy-server.output}}
-
-          Changes required:
-          1. Add `import os from 'node:os';` near the top of the file with the other imports.
-          2. In the `resolveRelaycastConfig` function, replace:
-               const projectDir = path.basename(path.resolve(dataDir, '..'));
-             with:
-               const projectIdentity = os.userInfo().username;
-          3. Update the `applyCachedAgentIdentity` call: change `projectIdentity: projectDir`
-             to `projectIdentity: projectIdentity` (variable is already named correctly).
-
-          IMPORTANT:
-          - Write both files to disk using your file-writing tools.
-          - Use `import os from 'node:os'` (Node.js built-in with node: prefix).
-          - Do not change anything else in either file.
-          - Preserve all existing imports, logic, and formatting.
-        verification:
-          type: exit_code
-
-      # ── Phase 3: Verify the changes look correct ─────────────────────────────
-
-      - name: verify-changes
-        type: deterministic
-        dependsOn: [implement]
-        command: |
-          echo "=== relaycast-provider.ts: os import ==="
-          grep -n "import os\|node:os" ../relay-dashboard/packages/dashboard-server/src/relaycast-provider.ts || echo "MISSING: os import"
-
-          echo ""
-          echo "=== relaycast-provider.ts: loadRelaycastConfig ==="
-          sed -n '85,96p' ../relay-dashboard/packages/dashboard-server/src/relaycast-provider.ts
-
-          echo ""
-          echo "=== proxy-server.ts: os import ==="
-          grep -n "import os\|node:os" ../relay-dashboard/packages/dashboard-server/src/proxy-server.ts || echo "MISSING: os import"
-
-          echo ""
-          echo "=== proxy-server.ts: resolveRelaycastConfig ==="
-          grep -n -A8 "const resolveRelaycastConfig" ../relay-dashboard/packages/dashboard-server/src/proxy-server.ts | head -15
-
-          echo ""
-          echo "=== Confirm no remaining path.basename(.*dataDir) calls ==="
-          grep -n "path.basename.*dataDir\|basename.*resolve.*dataDir" \
-            ../relay-dashboard/packages/dashboard-server/src/relaycast-provider.ts \
-            ../relay-dashboard/packages/dashboard-server/src/proxy-server.ts && echo "WARN: stale cwd reference found" || echo "OK: no stale cwd references"
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 4: Capture diff for review ─────────────────────────────────────
-
-      - name: capture-diff
-        type: deterministic
-        dependsOn: [verify-changes]
-        command: >
-          cd ../relay-dashboard &&
-          git diff packages/dashboard-server/src/relaycast-provider.ts
-          packages/dashboard-server/src/proxy-server.ts
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 5: Code review ──────────────────────────────────────────────────
-
-      - name: review
-        type: agent
-        agent: reviewer
-        dependsOn: [capture-diff, verify-changes]
-        task: |
-          Review this change to the relay-dashboard dashboard-server package.
-
-          The goal: dashboard user now registers with os.userInfo().username (the system user
-          running the process) instead of path.basename(cwd) (the working directory name).
-
-          Verification output:
-          {{steps.verify-changes.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-
-          Review checklist:
-          1. Both files now import `os` from `'node:os'` — correct prefix?
-          2. `os.userInfo().username` is used in both `loadRelaycastConfig` and
-             `resolveRelaycastConfig` — no leftover `path.basename` / `projectDir` references?
-          3. The `projectIdentity` variable name is preserved in both call sites?
-          4. No unintended whitespace, import order, or formatting changes?
-          5. The `path` import in relaycast-provider.ts is still present if used elsewhere in the file?
-
-errorHandling:
-  strategy: fail-fast
-  maxRetries: 1
-  retryDelayMs: 5000
-
-state:
-  backend: memory
-  ttlMs: 3600000 # 1 hour
-
-trajectories:
-  enabled: true
-  autoDecisions: true
diff --git a/packages/sdk/src/examples/workflows/ralph-overnight.yaml b/packages/sdk/src/examples/workflows/ralph-overnight.yaml
deleted file mode 100644
index 2ed6124c1..000000000
--- a/packages/sdk/src/examples/workflows/ralph-overnight.yaml
+++ /dev/null
@@ -1,421 +0,0 @@
-version: '1.0'
-name: ralph-overnight
-description: >
-  Autonomous 24-hour dev session. A product manager reads the backlog, a tech
-  lead plans the architecture, parallel squads implement features, a CI runner
-  gates every batch, and the cycle repeats until the backlog is empty or
-  morning arrives. Drop it on a repo before bed, wake up to merged features.
-
-  What this showcases vs vanilla ralph:
-    - Hierarchical orchestration: PM → Tech Lead → Implementation Squads
-    - Mixed CLI team: claude thinks, codex builds, gemini audits
-    - Integrated CI: actual git branch, PR creation, CI status polling
-    - Progressive learning: each loop iteration reads prior session notes
-    - Human checkpoint: if stuck 3x on same story, posts a question to Slack
-      (or a file) and pauses for human input before continuing
-    - Session summary written at the end for morning review
-
-swarm:
-  pattern: hierarchical
-  maxConcurrency: 5
-  timeoutMs: 86400000 # 24 hours — true overnight session
-  channel: ralph-overnight
-  idleNudge:
-    nudgeAfterMs: 600000 # 10 min — these agents think deeply
-    escalateAfterMs: 600000
-    maxNudges: 3
-
-agents:
-  # ── Strategic layer ────────────────────────────────────────────────────────
-
-  - name: product-manager
-    cli: claude
-    channels: [ralph-overnight, strategy]
-    role: >
-      Reads the backlog, prioritizes stories by impact/effort, plans the
-      session's scope, and writes the morning summary report.
-    constraints:
-      model: opus
-
-  - name: tech-lead
-    cli: claude
-    channels: [ralph-overnight, engineering]
-    role: >
-      Translates PM priorities into technical tasks, resolves architectural
-      decisions, monitors squad progress, unblocks stuck agents, and gates PRs.
-    constraints:
-      model: sonnet
-
-  # ── Implementation squads ──────────────────────────────────────────────────
-
-  - name: squad-alpha-lead
-    cli: claude
-    channels: [squad-alpha, ralph-overnight]
-    role: 'Leads squad alpha. Coordinates two codex builders on #squad-alpha.'
-    constraints:
-      model: sonnet
-
-  - name: squad-alpha-builder-1
-    cli: codex
-    role: 'Implements BUILDER_1_SPEC from squad-alpha output via {{steps.squad-alpha.output}}.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: squad-alpha-builder-2
-    cli: codex
-    role: 'Implements BUILDER_2_SPEC from squad-alpha output via {{steps.squad-alpha.output}}.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex-spark
-
-  - name: squad-beta-lead
-    cli: claude
-    channels: [squad-beta, ralph-overnight]
-    role: 'Leads squad beta. Coordinates two codex builders on #squad-beta.'
-    constraints:
-      model: sonnet
-
-  - name: squad-beta-builder-1
-    cli: codex
-    role: 'Implements BUILDER_1_SPEC from squad-beta output via {{steps.squad-beta.output}}.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: squad-beta-builder-2
-    cli: codex
-    role: 'Implements BUILDER_2_SPEC from squad-beta output via {{steps.squad-beta.output}}.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex-spark
-
-  # ── Quality & audit ────────────────────────────────────────────────────────
-
-  - name: qa-engineer
-    cli: claude
-    channels: [ralph-overnight]
-    role: 'Writes integration tests for completed features. Runs the test suite.'
-    interactive: false
-    constraints:
-      model: sonnet
-
-  - name: security-auditor
-    cli: gemini
-    channels: [ralph-overnight]
-    role: 'Audits all changes for security issues before PR creation.'
-    interactive: false
-    constraints:
-      model: gemini-2.5-pro
-
-workflows:
-  - name: overnight-session
-    description: >
-      PM planning → tech architecture → parallel squads (alpha+beta) →
-      QA + security audit → CI gate → PR → advance backlog → loop.
-    onError: continue # don't abort entire session on one story failure
-    preflight:
-      - command: test -f "${BACKLOG_PATH:-backlog.json}"
-        description: 'Backlog file exists'
-      - command: git status --porcelain
-        failIf: non-empty
-        description: 'Clean working directory for overnight session'
-      - command: git rev-parse --abbrev-ref HEAD
-        description: 'Confirm current branch'
-        captureOutput: true
-
-    steps:
-      # ── Wave 1: PM reads backlog and plans the night's scope ─────────────
-
-      - name: pm-planning
-        type: agent
-        agent: product-manager
-        task: |
-          Read ${BACKLOG_PATH:-backlog.json} and ${SESSION_LOG:-session-log.txt}.
-
-          Select the highest-priority stories for a ~4-hour parallel session.
-          Assign to two squads working on DIFFERENT files (no conflicts):
-            Alpha squad: stories + file paths
-            Beta squad: stories + file paths
-          Include risk flags for any cross-squad dependencies.
-
-          Post SESSION_PLAN to #ralph-overnight, then output: PLANNING_COMPLETE
-        verification:
-          type: output_contains
-          value: PLANNING_COMPLETE
-        retries: 1
-
-      # ── Wave 2: Tech lead creates feature branches + architecture notes ───
-
-      - name: tech-architecture
-        type: agent
-        agent: tech-lead
-        dependsOn: [pm-planning]
-        task: |
-          PM plan: {{steps.pm-planning.output}}
-
-          1. Create feature branch: git checkout -b overnight/$(date +%Y%m%d)
-          2. For each story assigned to squads, write implementation notes:
-             - Which files to touch and why
-             - Any shared utilities to create first
-             - Test strategy (unit / integration / e2e)
-          3. Flag any cross-squad dependencies that need sequencing
-          4. Post architecture notes to #ralph-overnight
-
-          Output: ARCHITECTURE_READY
-        verification:
-          type: output_contains
-          value: ARCHITECTURE_READY
-
-      - name: create-branch
-        type: deterministic
-        dependsOn: [tech-architecture]
-        command: >
-          git checkout -b "overnight/$(date +%Y%m%d)" 2>/dev/null ||
-          git checkout "overnight/$(date +%Y%m%d)"
-        captureOutput: true
-
-      # ── Wave 3: Squad leads plan and produce builder specs ───────────────
-      # Leads run first, produce self-contained task specs for each builder.
-      # Builders run in wave 4 after the lead completes, reading specs via
-      # {{steps.squad-alpha.output}} — no channel needed for non-interactive agents.
-
-      - name: squad-alpha
-        type: agent
-        agent: squad-alpha-lead
-        dependsOn: [create-branch]
-        task: |
-          Lead squad alpha on #squad-alpha.
-          Architecture: {{steps.tech-architecture.output}}
-          PM plan (alpha): {{steps.pm-planning.output}}
-
-          Split alpha stories into two self-contained tasks. For each, write
-          a complete implementation spec including: files to change, exact
-          changes needed, and the shell command to verify it works.
-
-          Format your output as:
-          BUILDER_1_SPEC: <complete spec for builder 1>
-          BUILDER_2_SPEC: <complete spec for builder 2>
-          Output: ALPHA_SPECS_READY
-        verification:
-          type: output_contains
-          value: ALPHA_SPECS_READY
-
-      - name: squad-beta
-        type: agent
-        agent: squad-beta-lead
-        dependsOn: [create-branch]
-        task: |
-          Lead squad beta on #squad-beta.
-          Architecture: {{steps.tech-architecture.output}}
-          PM plan (beta): {{steps.pm-planning.output}}
-
-          Split beta stories into two self-contained tasks. Write complete
-          specs for each builder: files, changes, verification command.
-
-          Format:
-          BUILDER_1_SPEC: <complete spec for builder 1>
-          BUILDER_2_SPEC: <complete spec for builder 2>
-          Output: BETA_SPECS_READY
-        verification:
-          type: output_contains
-          value: BETA_SPECS_READY
-
-      # ── Wave 4: Builders implement from lead specs (non-interactive) ──────
-      # Each builder reads its spec from {{steps.squad-X.output}} — no channel
-      # needed. They run in parallel across both squads (same wave).
-
-      - name: squad-alpha-b1
-        type: agent
-        agent: squad-alpha-builder-1
-        dependsOn: [squad-alpha]
-        task: |
-          Implement BUILDER_1_SPEC from the squad alpha lead output:
-          {{steps.squad-alpha.output}}
-
-          Follow the spec exactly. Run the verification command to confirm.
-          Output: ALPHA_B1_DONE:<one-line summary>
-        verification:
-          type: output_contains
-          value: ALPHA_B1_DONE
-
-      - name: squad-alpha-b2
-        type: agent
-        agent: squad-alpha-builder-2
-        dependsOn: [squad-alpha]
-        task: |
-          Implement BUILDER_2_SPEC from the squad alpha lead output:
-          {{steps.squad-alpha.output}}
-
-          Follow the spec exactly. Run the verification command to confirm.
-          Output: ALPHA_B2_DONE:<one-line summary>
-        verification:
-          type: output_contains
-          value: ALPHA_B2_DONE
-
-      - name: squad-beta-b1
-        type: agent
-        agent: squad-beta-builder-1
-        dependsOn: [squad-beta]
-        task: |
-          Implement BUILDER_1_SPEC from the squad beta lead output:
-          {{steps.squad-beta.output}}
-
-          Follow the spec exactly. Run the verification command to confirm.
-          Output: BETA_B1_DONE:<one-line summary>
-        verification:
-          type: output_contains
-          value: BETA_B1_DONE
-
-      - name: squad-beta-b2
-        type: agent
-        agent: squad-beta-builder-2
-        dependsOn: [squad-beta]
-        task: |
-          Implement BUILDER_2_SPEC from the squad beta lead output:
-          {{steps.squad-beta.output}}
-
-          Follow the spec exactly. Run the verification command to confirm.
-          Output: BETA_B2_DONE:<one-line summary>
-        verification:
-          type: output_contains
-          value: BETA_B2_DONE
-
-      # ── Wave 4: Full test suite gate ─────────────────────────────────────
-
-      - name: ci-gate
-        type: deterministic
-        dependsOn: [squad-alpha-b1, squad-alpha-b2, squad-beta-b1, squad-beta-b2]
-        command: >
-          npm run lint 2>&1 | tail -5 &&
-          npx tsc --noEmit 2>&1 | tail -5 &&
-          npm test 2>&1 | tail -40 &&
-          echo "CI_GREEN" || echo "CI_RED"
-        captureOutput: true
-        failOnError: false
-
-      # ── Wave 5: QA writes integration tests + security audit (parallel) ──
-
-      - name: qa-tests
-        type: agent
-        agent: qa-engineer
-        dependsOn: [ci-gate]
-        task: |
-          CI results: {{steps.ci-gate.output}}
-          Alpha built: {{steps.squad-alpha.output}}
-          Beta built: {{steps.squad-beta.output}}
-
-          Write integration tests for the newly implemented features.
-          Focus on the happy path and the two most likely failure modes per feature.
-          Run the full test suite including your new tests.
-
-          Output: QA_DONE:<test count added> new tests, all green
-        verification:
-          type: output_contains
-          value: QA_DONE
-
-      - name: security-audit
-        type: agent
-        agent: security-auditor
-        dependsOn: [ci-gate]
-        task: |
-          Security audit of all changes in this overnight session.
-
-          Run: git diff main 2>/dev/null | head -1000
-
-          Check for:
-          - SQL/command injection vectors
-          - Authentication bypass risks
-          - Secrets or tokens in code
-          - Unvalidated user input reaching sensitive operations
-          - Insecure direct object references
-
-          Output: SECURITY:CLEAN or SECURITY:ISSUES:<list>
-        verification:
-          type: output_contains
-          value: 'SECURITY:'
-
-      # ── Wave 6: Tech lead reviews and gates the PR ────────────────────────
-
-      - name: tech-review
-        type: agent
-        agent: tech-lead
-        dependsOn: [qa-tests, security-audit]
-        task: |
-          QA: {{steps.qa-tests.output}}
-          Security: {{steps.security-audit.output}}
-          CI: {{steps.ci-gate.output}}
-          Alpha: {{steps.squad-alpha.output}}
-          Beta: {{steps.squad-beta.output}}
-
-          If security issues found: fix them first, then output TECH_REVIEW:PASS
-          If CI is red: identify root cause, apply fix, re-run test, output TECH_REVIEW:PASS
-          If all green: output TECH_REVIEW:PASS
-
-          Do NOT output TECH_REVIEW:PASS with outstanding security issues.
-        verification:
-          type: output_contains
-          value: TECH_REVIEW:PASS
-        maxIterations: 2
-
-      # ── Wave 7: Commit, push, create PR ───────────────────────────────────
-
-      - name: push-and-pr
-        type: deterministic
-        dependsOn: [tech-review]
-        command: >
-          git add -A &&
-          git commit -m "feat: overnight session $(date +%Y-%m-%d) — autonomous batch" &&
-          git push -u origin HEAD 2>&1 &&
-          gh pr create --title "Overnight session $(date +%Y-%m-%d)" \
-            --body "Autonomous dev session. See session-log.txt for details." \
-            --draft 2>&1 ||
-          echo "PR_CREATED_OR_UPDATED"
-        captureOutput: true
-        failOnError: false
-
-      # ── Wave 8: PM writes morning summary ────────────────────────────────
-
-      - name: morning-summary
-        type: agent
-        agent: product-manager
-        dependsOn: [push-and-pr]
-        task: |
-          Write the morning summary to ${SESSION_LOG:-session-log.txt}.
-
-          Results: alpha={{steps.squad-alpha.output}} | beta={{steps.squad-beta.output}}
-          CI={{steps.ci-gate.output}} | QA={{steps.qa-tests.output}}
-          Security={{steps.security-audit.output}} | PR={{steps.push-and-pr.output}}
-
-          Include: completed stories, CI/quality status, learnings, next priorities.
-          Mark completed stories done in ${BACKLOG_PATH:-backlog.json}.
-
-          Output: SESSION_COMPLETE
-        verification:
-          type: output_contains
-          value: SESSION_COMPLETE
-
-coordination:
-  barriers:
-    - name: squads-complete
-      waitFor: [squad-alpha-b1, squad-alpha-b2, squad-beta-b1, squad-beta-b2]
-      timeoutMs: 7200000
-    - name: quality-gates-complete
-      waitFor: [qa-tests, security-audit]
-      timeoutMs: 3600000
-
-state:
-  backend: memory
-  ttlMs: 86400000
-
-errorHandling:
-  strategy: continue # one story failing shouldn't abort the whole night
-  maxRetries: 1
-  retryDelayMs: 10000
-  notifyChannel: ralph-overnight
-
-trajectories:
-  enabled: true
-  reflectOnBarriers: true
-  reflectOnConverge: true
-  autoDecisions: true
diff --git a/packages/sdk/src/examples/workflows/ralph-swarm.yaml b/packages/sdk/src/examples/workflows/ralph-swarm.yaml
deleted file mode 100644
index 652744d67..000000000
--- a/packages/sdk/src/examples/workflows/ralph-swarm.yaml
+++ /dev/null
@@ -1,411 +0,0 @@
-version: '1.0'
-name: ralph-swarm
-description: >
-  Parallel Implementation Squad. A tech lead decomposes the PRD into atomic
-  tasks, five codex workers implement them simultaneously, three specialized
-  reviewers run in parallel, a consensus gate synthesizes their verdicts, and
-  the cycle repeats until the backlog is empty.
-
-  What this showcases vs vanilla ralph:
-    - Fan-out to N parallel workers (not one at a time)
-    - Multi-model squad: codex workers + claude reviewers + gemini security
-    - Real consensus: all 3 reviewers must pass before merge
-    - Tech lead stays active throughout — course-corrects workers in real-time
-    - Barriers coordinate the fan-in before the next wave starts
-    - The whole backlog processed in one autonomous overnight session
-
-swarm:
-  pattern: dag
-  maxConcurrency: 5
-  timeoutMs: 14400000 # 4 hours — big PRDs take time
-  channel: ralph-swarm
-  idleNudge:
-    nudgeAfterMs: 300000
-    escalateAfterMs: 300000
-    maxNudges: 2
-
-agents:
-  # ── Leadership ─────────────────────────────────────────────────────────────
-
-  - name: tech-lead
-    cli: claude
-    channels: [ralph-swarm, planning]
-    role: 'Decomposes PRD into atomic tasks, assigns to workers, reviews integration.'
-    constraints:
-      model: opus
-
-  - name: integration-lead
-    cli: claude
-    channels: [ralph-swarm]
-    role: 'Integrates parallel worker output, resolves conflicts, gates the PR.'
-    constraints:
-      model: sonnet
-
-  # ── Implementation workers ─────────────────────────────────────────────────
-  # Each gets one atomic task. interactive: false means one-shot, exits cleanly.
-
-  - name: worker-1
-    cli: codex
-    role: 'Implements assigned atomic task.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: worker-2
-    cli: codex
-    role: 'Implements assigned atomic task.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: worker-3
-    cli: codex
-    role: 'Implements assigned atomic task.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: worker-4
-    cli: codex
-    role: 'Implements assigned atomic task.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex-spark
-
-  - name: worker-5
-    cli: codex
-    role: 'Implements assigned atomic task.'
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex-spark
-
-  # ── Review squad ───────────────────────────────────────────────────────────
-
-  - name: reviewer-correctness
-    cli: claude
-    role: 'Reviews logic, tests, edge cases.'
-    interactive: false
-    constraints:
-      model: sonnet
-
-  - name: reviewer-architecture
-    cli: claude
-    role: 'Reviews coupling, abstractions, patterns.'
-    interactive: false
-    constraints:
-      model: opus
-
-  - name: reviewer-security
-    cli: gemini
-    role: 'Reviews attack surface, injection, secrets.'
-    interactive: false
-    constraints:
-      model: gemini-2.5-flash
-
-workflows:
-  - name: swarm-loop
-    description: >
-      Decompose → fan-out workers → deterministic test gate → parallel review
-      → consensus → integration → commit. Repeat until backlog empty.
-    onError: retry
-    preflight:
-      - command: test -f "${PRD_PATH:-prd.json}"
-        description: 'PRD file exists'
-      - command: git status --porcelain
-        failIf: non-empty
-        description: 'Clean working directory'
-
-    steps:
-      # ── Wave 1: Decompose PRD into atomic tasks ───────────────────────────
-
-      - name: decompose
-        type: agent
-        agent: tech-lead
-        task: |
-          Read ${PRD_PATH:-prd.json} (incomplete stories) and
-          ${PROGRESS_PATH:-progress.txt} (learnings from previous batches).
-
-          Decompose the next 5 stories into atomic, independent tasks.
-          Each task: one coding session, no shared files with other tasks,
-          a shell verify command to confirm it works.
-
-          Output a JSON block: {"batch":[{"id":"task-N","title":"...",
-          "files":["src/..."],"prompt":"full impl instruction","verify":"cmd"}]}
-
-          Post the decomposition to #ralph-swarm so all workers can read it.
-          Output: DECOMPOSED
-        verification:
-          type: output_contains
-          value: DECOMPOSED
-        retries: 1
-
-      # ── Wave 2: Five workers implement in parallel ────────────────────────
-      # Each worker gets the full decomposition and self-assigns task N.
-
-      - name: work-1
-        type: agent
-        agent: worker-1
-        dependsOn: [decompose]
-        task: |
-          Tech lead decomposition: {{steps.decompose.output}}
-
-          Implement task-1 from the decomposition above.
-          Follow all existing code conventions in this repo.
-          Run the verification command from the task spec to confirm it works.
-          Output: TASK_1_DONE:<brief summary of what you implemented>
-        verification:
-          type: output_contains
-          value: TASK_1_DONE
-
-      - name: work-2
-        type: agent
-        agent: worker-2
-        dependsOn: [decompose]
-        task: |
-          Tech lead decomposition: {{steps.decompose.output}}
-
-          Implement task-2 from the decomposition above.
-          Follow all existing code conventions in this repo.
-          Run the verification command from the task spec to confirm it works.
-          Output: TASK_2_DONE:<brief summary of what you implemented>
-        verification:
-          type: output_contains
-          value: TASK_2_DONE
-
-      - name: work-3
-        type: agent
-        agent: worker-3
-        dependsOn: [decompose]
-        task: |
-          Tech lead decomposition: {{steps.decompose.output}}
-
-          Implement task-3 from the decomposition above. If fewer than 3 tasks
-          exist in the batch, output: TASK_3_DONE:skipped
-          Follow all existing code conventions in this repo.
-          Output: TASK_3_DONE:<brief summary>
-        verification:
-          type: output_contains
-          value: TASK_3_DONE
-
-      - name: work-4
-        type: agent
-        agent: worker-4
-        dependsOn: [decompose]
-        task: |
-          Tech lead decomposition: {{steps.decompose.output}}
-
-          Implement task-4 from the decomposition above. If fewer than 4 tasks
-          exist in the batch, output: TASK_4_DONE:skipped
-          Output: TASK_4_DONE:<brief summary>
-        verification:
-          type: output_contains
-          value: TASK_4_DONE
-
-      - name: work-5
-        type: agent
-        agent: worker-5
-        dependsOn: [decompose]
-        task: |
-          Tech lead decomposition: {{steps.decompose.output}}
-
-          Implement task-5 from the decomposition above. If fewer than 5 tasks
-          exist in the batch, output: TASK_5_DONE:skipped
-          Output: TASK_5_DONE:<brief summary>
-        verification:
-          type: output_contains
-          value: TASK_5_DONE
-
-      # ── Wave 3: Quality gate — run the full test suite ───────────────────
-
-      - name: test-gate
-        type: deterministic
-        dependsOn: [work-1, work-2, work-3, work-4, work-5]
-        command: >
-          npm run lint 2>&1 | tail -10 &&
-          npx tsc --noEmit 2>&1 | tail -10 &&
-          npm test 2>&1 | tail -30 &&
-          echo "GATE_PASSED" || echo "GATE_FAILED"
-        captureOutput: true
-        failOnError: false
-
-      # ── Wave 4: Fix failures if gate failed ─────────────────────────────
-
-      - name: fix-failures
-        type: agent
-        agent: tech-lead
-        dependsOn: [test-gate]
-        task: |
-          Test gate results: {{steps.test-gate.output}}
-
-          Worker summaries:
-          - Task 1: {{steps.work-1.output}}
-          - Task 2: {{steps.work-2.output}}
-          - Task 3: {{steps.work-3.output}}
-          - Task 4: {{steps.work-4.output}}
-          - Task 5: {{steps.work-5.output}}
-
-          If GATE_PASSED: output FIX_DONE:none
-          If GATE_FAILED: identify which worker's change broke the gate,
-          apply the minimal fix, re-run the failing tests, output FIX_DONE:<what you fixed>
-        verification:
-          type: output_contains
-          value: FIX_DONE
-        maxIterations: 3
-        retries: 1
-
-      # ── Wave 5: Capture diff for all three reviewers ─────────────────────
-
-      - name: capture-diff
-        type: deterministic
-        dependsOn: [fix-failures]
-        command: git diff HEAD 2>/dev/null | head -500
-        captureOutput: true
-
-      # ── Wave 6: Three parallel reviewers ─────────────────────────────────
-
-      - name: review-correctness
-        type: agent
-        agent: reviewer-correctness
-        dependsOn: [capture-diff]
-        task: |
-          Review this diff for logic correctness, test coverage, and edge cases.
-
-          Worker summaries: {{steps.fix-failures.output}}
-          Diff: {{steps.capture-diff.output}}
-
-          Be specific. Reference file:line for any issues.
-          Output: CORRECTNESS:PASS or CORRECTNESS:FAIL:<numbered issues>
-        verification:
-          type: output_contains
-          value: 'CORRECTNESS:'
-
-      - name: review-architecture
-        type: agent
-        agent: reviewer-architecture
-        dependsOn: [capture-diff]
-        task: |
-          Review this diff for architecture quality, coupling, and long-term maintainability.
-
-          Worker summaries: {{steps.fix-failures.output}}
-          Diff: {{steps.capture-diff.output}}
-
-          Output: ARCHITECTURE:PASS or ARCHITECTURE:FAIL:<numbered issues>
-        verification:
-          type: output_contains
-          value: 'ARCHITECTURE:'
-
-      - name: review-security
-        type: agent
-        agent: reviewer-security
-        dependsOn: [capture-diff]
-        task: |
-          Security review: check for injection, secrets, auth bypass, input validation.
-
-          Diff: {{steps.capture-diff.output}}
-
-          Output: SECURITY:PASS or SECURITY:FAIL:<numbered issues>
-        verification:
-          type: output_contains
-          value: 'SECURITY:'
-
-      # ── Wave 7: Consensus — all three must pass ──────────────────────────
-
-      - name: consensus
-        type: agent
-        agent: integration-lead
-        dependsOn: [review-correctness, review-architecture, review-security]
-        task: |
-          Synthesize the three reviews and decide: merge or rework?
-
-          Correctness: {{steps.review-correctness.output}}
-          Architecture: {{steps.review-architecture.output}}
-          Security: {{steps.review-security.output}}
-
-          If ALL THREE are PASS: output CONSENSUS:MERGE
-          If ANY failed: output CONSENSUS:REWORK:<prioritized list of issues to fix>
-        verification:
-          type: output_contains
-          value: 'CONSENSUS:'
-
-      # ── Wave 8: Address rework if needed, then commit ────────────────────
-
-      - name: address-rework
-        type: agent
-        agent: tech-lead
-        dependsOn: [consensus]
-        task: |
-          Consensus verdict: {{steps.consensus.output}}
-
-          If CONSENSUS:MERGE — output REWORK_DONE:none
-          If CONSENSUS:REWORK — fix all issues listed in the verdict.
-          Run tests again to confirm green, then output REWORK_DONE:<what changed>
-        verification:
-          type: output_contains
-          value: REWORK_DONE
-        maxIterations: 2
-
-      - name: final-test
-        type: deterministic
-        dependsOn: [address-rework]
-        command: npm test 2>&1 | tail -20 && echo "FINAL_GREEN" || echo "FINAL_RED"
-        captureOutput: true
-        failOnError: false
-
-      - name: commit-batch
-        type: deterministic
-        dependsOn: [final-test]
-        command: >
-          git add -A &&
-          git commit -m "feat: parallel swarm batch — $(date +%Y%m%d-%H%M)" 2>/dev/null ||
-          echo "nothing to commit"
-
-      - name: record-and-advance
-        type: agent
-        agent: tech-lead
-        dependsOn: [commit-batch]
-        task: |
-          Final results:
-          - Test gate: {{steps.test-gate.output}}
-          - Consensus: {{steps.consensus.output}}
-          - Final: {{steps.final-test.output}}
-
-          1. Append to ${PROGRESS_PATH:-progress.txt}:
-             - Which tasks succeeded / failed this batch
-             - Patterns in the codebase worth remembering
-             - What caused rework (if any)
-
-          2. Mark completed stories as passed in ${PRD_PATH:-prd.json}
-
-          3. Check if any incomplete stories remain. If yes, output BATCH_DONE:more
-             If all done, output BATCH_DONE:complete
-
-          Output: BATCH_DONE:...
-        verification:
-          type: output_contains
-          value: 'BATCH_DONE:'
-
-coordination:
-  barriers:
-    - name: workers-complete
-      waitFor: [work-1, work-2, work-3, work-4, work-5]
-      timeoutMs: 3600000
-    - name: reviews-complete
-      waitFor: [review-correctness, review-architecture, review-security]
-      timeoutMs: 1800000
-  consensusStrategy: unanimous
-
-state:
-  backend: memory
-  ttlMs: 86400000
-
-errorHandling:
-  strategy: retry
-  maxRetries: 1
-  retryDelayMs: 10000
-  notifyChannel: ralph-swarm
-
-trajectories:
-  enabled: true
-  reflectOnBarriers: true
-  reflectOnConverge: true
-  autoDecisions: true
diff --git a/packages/sdk/src/examples/workflows/ralph-tdd.yaml b/packages/sdk/src/examples/workflows/ralph-tdd.yaml
deleted file mode 100644
index 5bb6ade64..000000000
--- a/packages/sdk/src/examples/workflows/ralph-tdd.yaml
+++ /dev/null
@@ -1,259 +0,0 @@
-version: '1.0'
-name: ralph-tdd
-description: >
-  Test-Driven Ralph Loop. An architect writes failing tests first, a builder
-  implements until they pass, a quality gate runs the real test suite, and
-  the loop repeats with review feedback until every story is green.
-
-  What this showcases vs vanilla ralph:
-    - Tests are written BEFORE implementation (true TDD)
-    - Deterministic quality gate: actual `npm test` / `tsc` output chains into next step
-    - Parallel arch + security reviewer — fresh eyes, no confirmation bias
-    - maxIterations loop prevents infinite spinning
-    - Learnings from each round feed back into the next as {{steps.X.output}}
-
-swarm:
-  pattern: review-loop
-  maxConcurrency: 4
-  timeoutMs: 7200000
-  channel: ralph-tdd
-  idleNudge:
-    nudgeAfterMs: 300000
-    escalateAfterMs: 300000
-    maxNudges: 2
-
-agents:
-  - name: architect
-    cli: claude
-    channels: [ralph-tdd]
-    role: "Writes failing tests, plans implementation, reviews the builder's output."
-    constraints:
-      model: sonnet
-
-  - name: builder
-    cli: codex
-    role: "Implements code to make the architect's failing tests pass."
-    interactive: false
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: reviewer
-    cli: claude
-    channels: [ralph-tdd]
-    role: 'Independent code quality + security review. No confirmation bias.'
-    interactive: false
-    constraints:
-      model: opus
-
-workflows:
-  - name: tdd-loop
-    description: >
-      For each story in the PRD: write tests → implement → test gate →
-      parallel review → address feedback → loop until green.
-    onError: retry
-    preflight:
-      - command: test -f "${PRD_PATH:-prd.json}"
-        description: 'PRD file exists'
-      - command: git status --porcelain
-        failIf: non-empty
-        description: 'Clean working directory before starting'
-
-    steps:
-      # ── Phase 1: Architect writes failing tests ──────────────────────────
-
-      - name: write-tests
-        type: agent
-        agent: architect
-        task: |
-          Read the next unpassed story from ${PRD_PATH:-prd.json}.
-          Read previous learnings from ${PROGRESS_PATH:-progress.txt} if it exists.
-
-          Write FAILING tests first (TDD). The tests must:
-          - Cover all acceptance criteria exactly
-          - Use the project's existing test framework (detect from package.json / pytest / go test)
-          - Fail when run right now (implementation doesn't exist yet)
-          - Have clear assertion messages so failures are informative
-
-          After writing tests, run them to confirm they fail:
-            npm test 2>&1 || pytest 2>&1 || go test ./... 2>&1
-
-          Post the test file paths and what each test verifies to #ralph-tdd.
-          Output: TESTS_WRITTEN
-        verification:
-          type: output_contains
-          value: TESTS_WRITTEN
-        retries: 1
-
-      # ── Phase 2: Capture failing test output for builder context ─────────
-
-      - name: capture-failures
-        type: deterministic
-        dependsOn: [write-tests]
-        command: npm test 2>&1 || pytest 2>&1 || go test ./... 2>&1 || echo "tests ran"
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 3: Builder implements to make tests pass ───────────────────
-
-      - name: implement
-        type: agent
-        agent: builder
-        dependsOn: [capture-failures]
-        task: |
-          The architect has written failing tests. Your job: make them pass.
-
-          Failing test output:
-          {{steps.capture-failures.output}}
-
-          Implementation plan from #ralph-tdd:
-          {{steps.write-tests.output}}
-
-          Rules:
-          - Do NOT modify the test files
-          - Implement only what's needed to pass the tests
-          - Follow existing code patterns and conventions in this repo
-          - Run the tests yourself to verify they pass before finishing
-
-          Output: IMPLEMENTATION_COMPLETE
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-        retries: 2
-        maxIterations: 3
-
-      # ── Phase 4: Quality gate — real test suite ──────────────────────────
-
-      - name: test-gate
-        type: deterministic
-        dependsOn: [implement]
-        command: >
-          npm run lint 2>&1 | tail -5;
-          npm run type-check 2>&1 | tail -5;
-          npm test 2>&1
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 5: Parallel review (arch + independent reviewer) ───────────
-
-      - name: arch-review
-        type: agent
-        agent: architect
-        dependsOn: [test-gate]
-        task: |
-          Review the implementation for correctness, completeness, and test coverage.
-
-          Test results:
-          {{steps.test-gate.output}}
-
-          Check:
-          1. All acceptance criteria met (read the story from prd.json)
-          2. No test was skipped or marked pending
-          3. Edge cases handled
-          4. No obvious performance issues
-
-          Output: ARCH_REVIEW:PASS if all good, ARCH_REVIEW:FAIL:<issues> if not.
-        verification:
-          type: output_contains
-          value: 'ARCH_REVIEW:'
-
-      - name: sec-review
-        type: agent
-        agent: reviewer
-        dependsOn: [test-gate]
-        task: |
-          Security and code quality review of the implementation.
-
-          Test results: {{steps.test-gate.output}}
-
-          Check git diff for:
-          - Input validation and sanitization
-          - No hardcoded secrets or credentials
-          - Error handling doesn't leak internals
-          - No obvious injection vectors
-
-          Output: SEC_REVIEW:PASS or SEC_REVIEW:FAIL:<issues>
-        verification:
-          type: output_contains
-          value: 'SEC_REVIEW:'
-
-      # ── Phase 6: Address feedback and finalize ───────────────────────────
-
-      - name: address-feedback
-        type: agent
-        agent: builder
-        dependsOn: [arch-review, sec-review]
-        task: |
-          Address all review feedback, then run the full test suite.
-
-          Architecture review: {{steps.arch-review.output}}
-          Security review: {{steps.sec-review.output}}
-
-          If both are PASS, output: ALL_REVIEWS_PASSED
-          Otherwise fix the issues, run tests again to confirm still green,
-          then output: FEEDBACK_ADDRESSED
-        verification:
-          type: output_contains
-          value: 'ALL_REVIEWS_PASSED|FEEDBACK_ADDRESSED'
-        maxIterations: 2
-
-      # ── Phase 7: Final test run + commit ─────────────────────────────────
-
-      - name: final-test
-        type: deterministic
-        dependsOn: [address-feedback]
-        command: npm test 2>&1 && echo "ALL_GREEN" || echo "STILL_FAILING"
-        captureOutput: true
-        failOnError: false
-
-      - name: commit
-        type: deterministic
-        dependsOn: [final-test]
-        command: >
-          git add -A &&
-          git commit -m "feat: implement story from prd (TDD)" 2>/dev/null ||
-          echo "nothing to commit"
-
-      - name: record-learnings
-        type: agent
-        agent: architect
-        dependsOn: [commit]
-        task: |
-          Record learnings for the next story iteration.
-
-          Final test result: {{steps.final-test.output}}
-          Reviews: {{steps.arch-review.output}} | {{steps.sec-review.output}}
-
-          Append to ${PROGRESS_PATH:-progress.txt}:
-          - What approach worked for this story
-          - Any patterns discovered in this codebase
-          - Gotchas or non-obvious things to remember
-
-          Then mark this story as passed in ${PRD_PATH:-prd.json}
-          by setting its "passes" field to true.
-
-          Output: DONE
-        verification:
-          type: output_contains
-          value: DONE
-
-coordination:
-  barriers:
-    - name: reviews-complete
-      waitFor: [arch-review, sec-review]
-      timeoutMs: 1800000
-  consensusStrategy: unanimous
-
-state:
-  backend: memory
-  ttlMs: 86400000
-
-errorHandling:
-  strategy: retry
-  maxRetries: 2
-  retryDelayMs: 5000
-  notifyChannel: ralph-tdd
-
-trajectories:
-  enabled: true
-  reflectOnBarriers: true
-  autoDecisions: true
diff --git a/packages/sdk/src/examples/workflows/runner-idle-refactor.yaml b/packages/sdk/src/examples/workflows/runner-idle-refactor.yaml
deleted file mode 100644
index ee3a65eaa..000000000
--- a/packages/sdk/src/examples/workflows/runner-idle-refactor.yaml
+++ /dev/null
@@ -1,306 +0,0 @@
-version: '1.0'
-name: runner-idle-refactor
-description: >
-  Refactors WorkflowRunner with two changes:
-    1. Remove agent pre-registration (preflightAgents) — agents spawn only when their step runs.
-    2. Idle = done — when no idleNudge config is set, race waitForExit vs waitForIdle;
-       if idle fires first the step completes immediately.
-
-  Workflow: read context → implement → update tests → type-check → run tests
-  → fix if broken → final test run → review.
-
-swarm:
-  pattern: pipeline
-  maxConcurrency: 3
-  timeoutMs: 1800000 # 30 min
-  channel: wf-runner-refactor
-
-# No idleNudge — each agent is spawned per step and exits when done.
-# Non-interactive preset for all agents (pure code changes, no relay tools needed).
-
-agents:
-  - name: implementer
-    cli: codex
-    preset: worker
-    role: 'Makes the two targeted edits to packages/sdk/src/workflows/runner.ts.'
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: test-writer
-    cli: codex
-    preset: worker
-    role: 'Adds new test cases to idle-nudge.test.ts covering the idle=done behavior.'
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: fixer
-    cli: codex
-    preset: worker
-    role: 'Fixes TypeScript errors or failing tests found in the test run.'
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: reviewer
-    cli: claude
-    preset: reviewer
-    role: 'Reviews the diff for correctness, edge cases, and backwards compatibility.'
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: default
-    onError: continue
-
-    steps:
-      # ── Phase 1: Capture context for agents ───────────────────────────────
-
-      - name: read-prespawn-block
-        type: deterministic
-        command: >
-          grep -n "Pre-register all interactive\|preflightAgents\|Agent pre-registration"
-          packages/sdk/src/workflows/runner.ts | head -10 &&
-          echo "---" &&
-          awk '/Pre-register all interactive agent steps/,/Agent pre-registration complete/{print NR": "$0}'
-          packages/sdk/src/workflows/runner.ts
-        captureOutput: true
-        failOnError: false
-
-      - name: read-spawn-comment
-        type: deterministic
-        command: >
-          grep -n "cache.*hit\|preflightAgents\|token cache"
-          packages/sdk/src/workflows/runner.ts | head -10
-        captureOutput: true
-        failOnError: false
-
-      - name: read-idle-method
-        type: deterministic
-        command: >
-          awk '/private async waitForExitWithIdleNudging/,/^  \}$/{print NR": "$0}'
-          packages/sdk/src/workflows/runner.ts | head -80
-        captureOutput: true
-        failOnError: false
-
-      - name: read-test-file
-        type: deterministic
-        dependsOn: [read-prespawn-block]
-        command: cat packages/sdk/src/__tests__/idle-nudge.test.ts
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 2: Implement runner.ts changes ──────────────────────────────
-
-      - name: implement
-        type: agent
-        agent: implementer
-        dependsOn: [read-prespawn-block, read-spawn-comment, read-idle-method]
-        task: |
-          Make exactly two changes to `packages/sdk/src/workflows/runner.ts`:
-
-          ── Change 1: Remove agent pre-registration block ──
-
-          Find the block that starts with this comment and delete it entirely:
-            // Pre-register all interactive agent steps with Relaycast before execution.
-
-          The block ends with:
-            this.log('Agent pre-registration complete');
-          followed by the closing `}` of the if statement.
-
-          Here is what the block looks like (with line numbers for reference):
-          {{steps.read-prespawn-block.output}}
-
-          Also find and update the stale comment inside `spawnAndWait` that says something
-          about "token cache" / "cache hits" / "preflightAgents" — those references are now
-          stale. Keep just: "Deterministic name: step name + first 8 chars of run ID."
-
-          Stale comment location:
-          {{steps.read-spawn-comment.output}}
-
-          ── Change 2: Idle = done in waitForExitWithIdleNudging ──
-
-          Find the `waitForExitWithIdleNudging` method. In the branch where `nudgeConfig` is
-          absent, replace the simple `return agent.waitForExit(timeoutMs)` with a race between
-          `waitForExit` and `waitForIdle`. If idle wins, release the agent and return 'released'.
-
-          Current method (with line numbers):
-          {{steps.read-idle-method.output}}
-
-          Replace the no-nudge-config branch with:
-          ```typescript
-          if (!nudgeConfig) {
-            // Idle = done: race exit against idle. Whichever fires first completes the step.
-            const result = await Promise.race([
-              agent.waitForExit(timeoutMs).then((r) => ({ kind: 'exit' as const, result: r })),
-              agent.waitForIdle(timeoutMs).then((r) => ({ kind: 'idle' as const, result: r })),
-            ]);
-            if (result.kind === 'idle' && result.result === 'idle') {
-              this.log(`[${step.name}] Agent "${agent.name}" went idle — treating as complete`);
-              this.postToChannel(`**[${step.name}]** Agent \`${agent.name}\` idle — treating as complete`);
-              await agent.release();
-              return 'released';
-            }
-            // Exit won the race, or idle returned 'exited'/'timeout' — pass through.
-            return result.result as 'exited' | 'timeout' | 'released';
-          }
-          ```
-
-          Only modify these two things. Do not change anything else.
-        verification:
-          type: exit_code
-
-      # ── Phase 3: Update tests ──────────────────────────────────────────────
-
-      - name: update-tests
-        type: agent
-        agent: test-writer
-        dependsOn: [implement, read-test-file]
-        task: |
-          Add new test cases to `packages/sdk/src/__tests__/idle-nudge.test.ts` for the
-          new idle=done behavior. Do NOT modify any existing tests — only append new ones.
-
-          Current test file:
-          {{steps.read-test-file.output}}
-
-          Background on the change:
-          - When `idleNudge` config is absent in the swarm config, `waitForExitWithIdleNudging`
-            now races `waitForExit` vs `waitForIdle`.
-          - If `waitForIdle` resolves with `'idle'` first → `agent.release()` is called and
-            the method returns `'released'`.
-          - If `waitForExit` resolves first → that result is returned as-is.
-          - If `waitForIdle` resolves with `'exited'` or `'timeout'` → exit result wins.
-
-          The mock infrastructure already has `waitForExitFn` and `waitForIdleFn` that you
-          can control. Add a new describe block: `'Idle = done (no idleNudge config)'` with:
-
-          Test 1 — idle fires first:
-            waitForIdleFn resolves 'idle' immediately
-            waitForExitFn never resolves (returns a never-settling promise or very long timeout)
-            → workflow run should complete (step succeeds, agent.release() is called)
-
-          Test 2 — exit fires first:
-            waitForExitFn resolves 'exited' immediately
-            waitForIdleFn resolves 'timeout' (or never fires before exit)
-            → workflow run should complete, agent.release() NOT called by idle logic
-
-          Test 3 — both timeout:
-            waitForExitFn resolves 'timeout'
-            waitForIdleFn resolves 'timeout'
-            → step should fail with a timeout error
-
-          Use the existing `makeConfig()` and `makeDb()` helpers. Use the existing
-          `WorkflowRunner` import pattern already in the file.
-        verification:
-          type: exit_code
-
-      # ── Phase 4: Type-check ────────────────────────────────────────────────
-
-      - name: type-check
-        type: deterministic
-        dependsOn: [implement, update-tests]
-        command: >
-          cd packages/sdk &&
-          npx tsc --noEmit 2>&1 | tail -30 &&
-          echo "TYPE_CHECK_PASSED" || echo "TYPE_CHECK_FAILED"
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 5: Run vitest ────────────────────────────────────────────────
-
-      - name: run-tests
-        type: deterministic
-        dependsOn: [type-check]
-        command: >-
-          cd packages/sdk && { npx vitest run 2>&1; echo "EXIT:$?"; } | tail -80
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 6: Fix failures ──────────────────────────────────────────────
-
-      - name: fix-if-broken
-        type: agent
-        agent: fixer
-        dependsOn: [run-tests, type-check]
-        task: |
-          Review the type-check and test results. Fix any failures.
-
-          Type-check:
-          {{steps.type-check.output}}
-
-          Test run:
-          {{steps.run-tests.output}}
-
-          If both show PASSED / ALL_TESTS_PASSED, output: FIX_DONE:none
-
-          Otherwise:
-          - For TypeScript errors: fix packages/sdk/src/workflows/runner.ts
-          - For failing tests: fix packages/sdk/src/__tests__/idle-nudge.test.ts
-          - Do NOT change the intended behavior — only fix syntax/type/mock issues
-
-        verification:
-          type: exit_code
-        maxIterations: 2
-
-      # ── Phase 7: Final test run ────────────────────────────────────────────
-
-      - name: final-tests
-        type: deterministic
-        dependsOn: [fix-if-broken]
-        command: >-
-          cd packages/sdk && { npx vitest run 2>&1; echo "EXIT:$?"; } | tail -60
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 8: Capture diff for review ──────────────────────────────────
-
-      - name: capture-diff
-        type: deterministic
-        dependsOn: [final-tests]
-        command: >
-          git diff packages/sdk/src/workflows/runner.ts
-          packages/sdk/src/__tests__/idle-nudge.test.ts
-        captureOutput: true
-        failOnError: false
-
-      # ── Phase 9: Code review ───────────────────────────────────────────────
-
-      - name: review
-        type: agent
-        agent: reviewer
-        dependsOn: [capture-diff, final-tests]
-        task: |
-          Review these changes to WorkflowRunner. Be precise and thorough.
-
-          Final test result:
-          {{steps.final-tests.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-
-          Review checklist:
-          1. Pre-registration block is fully gone — no leftover `preflightAgents` calls or
-             stale comments referencing "token cache" / "cache hits"
-          2. Race logic in `waitForExitWithIdleNudging`: both promises created before awaiting?
-             No floating promise leak if exit wins before idle settles?
-          3. Edge case: `waitForIdle` returns 'exited' (agent already gone) — does the cast
-             `result.result as 'exited' | 'timeout' | 'released'` hold? Check the union types.
-          4. Edge case: `waitForIdle` returns 'timeout' and exit won — correct fallthrough?
-          5. New tests: do they actually cover all three cases with proper mock wiring?
-          6. No unintended changes to the nudge path (idleNudge config present) — that code
-             should be unchanged.
-
-        verification:
-          type: exit_code
-
-errorHandling:
-  strategy: continue # best-effort — don't abort if an optional step fails
-  maxRetries: 1
-  retryDelayMs: 3000
-  notifyChannel: wf-runner-refactor
-
-state:
-  backend: memory
-  ttlMs: 7200000 # 2 hours
-
-trajectories:
-  enabled: true
-  autoDecisions: true
diff --git a/packages/sdk/src/index.ts b/packages/sdk/src/index.ts
index 3ac0bcaa0..829fb31eb 100644
--- a/packages/sdk/src/index.ts
+++ b/packages/sdk/src/index.ts
@@ -44,12 +44,11 @@ export * from './consensus.js';
 export * from './shadow.js';
 export * from './relay-adapter.js';
 export * from './harness.js';
-export * from './workflows/index.js';
 export * from './spawn-from-env.js';
 export * from './cli-registry.js';
 export * from './cli-resolver.js';
 export * from './personas.js';
 export * as github from './github.js';
-export { createGitHubStep, GitHubClient } from './github.js';
+export { GitHubClient } from '@agent-relay/github-primitive';
 export * as slack from './slack.js';
-export { createSlackStep, SlackClient } from './slack.js';
+export { SlackClient } from '@agent-relay/slack-primitive';
diff --git a/packages/sdk/src/provisioner/__tests__/audit.test.ts b/packages/sdk/src/provisioner/__tests__/audit.test.ts
deleted file mode 100644
index 7ca616158..000000000
--- a/packages/sdk/src/provisioner/__tests__/audit.test.ts
+++ /dev/null
@@ -1,62 +0,0 @@
-import assert from 'node:assert/strict';
-import { mkdtemp, mkdir, readFile, rm, writeFile } from 'node:fs/promises';
-import { tmpdir } from 'node:os';
-import path from 'node:path';
-import test from 'node:test';
-
-import { createLocalJwksKeyPair, provisionWorkflowAgents } from '../index.js';
-
-async function createWorkspace(): Promise<{ dir: string; cleanup: () => Promise<void> }> {
-  const dir = await mkdtemp(path.join(tmpdir(), 'relay-provisioner-audit-'));
-  await mkdir(path.join(dir, 'src'), { recursive: true });
-  await writeFile(path.join(dir, 'src', 'index.ts'), 'export const value = 1;\n');
-
-  return {
-    dir,
-    cleanup: () => rm(dir, { recursive: true, force: true }),
-  };
-}
-
-test('provisionWorkflowAgents writes a permission audit without token values', async () => {
-  const workspace = await createWorkspace();
-
-  try {
-    const result = await provisionWorkflowAgents({
-      tokenSigningKey: createLocalJwksKeyPair(),
-      workspace: 'audit-workspace',
-      projectDir: workspace.dir,
-      relayfileBaseUrl: 'http://127.0.0.1:8080',
-      agents: {
-        worker: {
-          access: 'readonly',
-        },
-      },
-      skipSeeding: true,
-      skipMount: true,
-    });
-
-    const auditPath = path.join(workspace.dir, '.agent-relay', 'permission-audit.json');
-    const auditRaw = await readFile(auditPath, 'utf8');
-    const auditJson = JSON.parse(auditRaw) as {
-      entries: Array<{
-        agentName: string;
-        action: string;
-        details: Record<string, unknown>;
-      }>;
-    };
-
-    assert.ok(auditJson.entries.length >= 3);
-    assert.deepEqual(
-      auditJson.entries.map((entry) => `${entry.agentName}:${entry.action}`),
-      ['worker:resolve', 'worker:mint', 'relay-admin:mint']
-    );
-    assert.equal(
-      auditJson.entries[1]?.details.jwtPath,
-      path.join(workspace.dir, '.relay', 'tokens', 'worker.jwt')
-    );
-    assert.ok(!auditRaw.includes(result.agents.worker.token));
-    assert.ok(!auditRaw.includes(result.adminToken));
-  } finally {
-    await workspace.cleanup();
-  }
-});
diff --git a/packages/sdk/src/provisioner/__tests__/seeder.test.ts b/packages/sdk/src/provisioner/__tests__/seeder.test.ts
deleted file mode 100644
index a651074ee..000000000
--- a/packages/sdk/src/provisioner/__tests__/seeder.test.ts
+++ /dev/null
@@ -1,284 +0,0 @@
-import assert from 'node:assert/strict';
-import { mkdtemp, mkdir, rm, writeFile } from 'node:fs/promises';
-import { tmpdir } from 'node:os';
-import path from 'node:path';
-import test, { afterEach, mock } from 'node:test';
-
-import { RelayFileClient } from '@relayfile/sdk';
-
-import { seedAclRules, seedWorkflowAcls, seedWorkspace } from '../seeder.js';
-
-interface FetchResponseShape {
-  ok: boolean;
-  status: number;
-  text(): Promise<string>;
-}
-
-const originalFetch = globalThis.fetch;
-
-async function createWorkspace(
-  files: Record<string, string | Buffer>
-): Promise<{ dir: string; cleanup: () => Promise<void> }> {
-  const dir = await mkdtemp(path.join(tmpdir(), 'relay-seeder-'));
-
-  for (const [relativePath, content] of Object.entries(files)) {
-    const filePath = path.join(dir, relativePath);
-    await mkdir(path.dirname(filePath), { recursive: true });
-    await writeFile(filePath, content);
-  }
-
-  return {
-    dir,
-    cleanup: () => rm(dir, { recursive: true, force: true }),
-  };
-}
-
-function createFetchResponse(body: string, status = 200): FetchResponseShape {
-  return {
-    ok: status >= 200 && status < 300,
-    status,
-    async text(): Promise<string> {
-      return body;
-    },
-  };
-}
-
-function parseFetchBody(fetchMock: ReturnType<typeof mock.method>): { files: unknown[] } {
-  assert.equal(fetchMock.mock.calls.length, 1);
-  const [, options] = fetchMock.mock.calls[0]!.arguments as [string, RequestInit];
-  assert.equal(typeof options.body, 'string');
-  return JSON.parse(options.body as string) as { files: unknown[] };
-}
-
-afterEach(() => {
-  mock.restoreAll();
-  globalThis.fetch = originalFetch;
-});
-
-test('seedWorkspace posts the expected HTTP payload after SDK fallback', async () => {
-  const workspace = await createWorkspace({
-    'alpha.txt': 'alpha payload',
-    'binary.bin': Buffer.from([0xff, 0x00, 0x61]),
-    '.relay/ignored.txt': 'skip',
-    '.git/config': 'skip',
-    'node_modules/pkg/index.js': 'skip',
-    'custom-skip/ignored.txt': 'skip',
-    '.relayfile-mount-state.json': '{"skip":true}',
-  });
-
-  try {
-    mock.method(RelayFileClient.prototype, 'bulkWrite', async () => {
-      throw new Error('fall back to HTTP');
-    });
-
-    const fetchMock = mock.method(globalThis, 'fetch', async () =>
-      createFetchResponse(JSON.stringify({ written: 2, errorCount: 0, errors: [] }))
-    );
-
-    const seededCount = await seedWorkspace(
-      'https://relay.example///',
-      'admin-token',
-      ' workspace-123 ',
-      workspace.dir,
-      ['custom-skip']
-    );
-
-    assert.equal(seededCount, 2);
-    assert.equal(fetchMock.mock.calls.length, 1);
-
-    const [url, options] = fetchMock.mock.calls[0]!.arguments as [string, RequestInit];
-    assert.equal(url, 'https://relay.example/v1/workspaces/workspace-123/fs/bulk');
-    assert.equal(options.method, 'POST');
-    assert.deepEqual(options.headers, {
-      Authorization: 'Bearer admin-token',
-      'Content-Type': 'application/json',
-      'X-Correlation-Id': options.headers && (options.headers as Record<string, string>)['X-Correlation-Id'],
-    });
-    assert.match(
-      (options.headers as Record<string, string>)['X-Correlation-Id'],
-      /^seed-workspace-workspace-123-\d+-0$/u
-    );
-
-    const body = parseFetchBody(fetchMock);
-    assert.deepEqual(body.files, [
-      {
-        path: '/alpha.txt',
-        content: 'alpha payload',
-        encoding: 'utf-8',
-      },
-      {
-        path: '/binary.bin',
-        content: Buffer.from([0xff, 0x00, 0x61]).toString('base64'),
-        encoding: 'base64',
-      },
-    ]);
-  } finally {
-    await workspace.cleanup();
-  }
-});
-
-test('seedAclRules formats ACL files for root and nested directories', async () => {
-  mock.method(RelayFileClient.prototype, 'bulkWrite', async () => {
-    throw new Error('fall back to HTTP');
-  });
-
-  const fetchMock = mock.method(globalThis, 'fetch', async () =>
-    createFetchResponse(JSON.stringify({ written: 2, errorCount: 0, errors: [] }))
-  );
-
-  await seedAclRules('https://relay.example/', 'acl-token', 'workspace-acl', {
-    '/': ['allow:agent:lead:read'],
-    '/docs/': ['allow:agent:writer:write', 'deny:agent:reader'],
-  });
-
-  const body = parseFetchBody(fetchMock);
-  assert.deepEqual(body.files, [
-    {
-      path: '/.relayfile.acl',
-      content: JSON.stringify({
-        semantics: { permissions: ['allow:agent:lead:read'] },
-      }),
-      encoding: 'utf-8',
-    },
-    {
-      path: '/docs/.relayfile.acl',
-      content: JSON.stringify({
-        semantics: {
-          permissions: ['allow:agent:writer:write', 'deny:agent:reader'],
-        },
-      }),
-      encoding: 'utf-8',
-    },
-  ]);
-});
-
-test('seedWorkflowAcls merges multiple agents onto shared directories', async () => {
-  mock.method(RelayFileClient.prototype, 'bulkWrite', async () => {
-    throw new Error('fall back to HTTP');
-  });
-
-  const fetchMock = mock.method(globalThis, 'fetch', async () =>
-    createFetchResponse(JSON.stringify({ written: 2, errorCount: 0, errors: [] }))
-  );
-
-  await seedWorkflowAcls({
-    relayfileUrl: 'https://relay.example',
-    adminToken: 'workflow-token',
-    workspace: 'workflow-merge',
-    agents: [
-      { name: 'qa-reviewer', acl: { src: ['read'] } },
-      { name: 'builder', acl: { 'src\\': ['write'], '/docs/': ['read'] } },
-      { name: 'analyst', acl: { docs: ['read'] } },
-    ],
-  });
-
-  const body = parseFetchBody(fetchMock);
-  assert.deepEqual(body.files, [
-    {
-      path: '/docs/.relayfile.acl',
-      content: JSON.stringify({
-        semantics: {
-          permissions: [
-            'allow:agent:analyst:read',
-            'allow:agent:builder:read',
-            'allow:agent:qa-reviewer:read',
-          ],
-        },
-      }),
-      encoding: 'utf-8',
-    },
-    {
-      path: '/src/.relayfile.acl',
-      content: JSON.stringify({
-        semantics: {
-          permissions: [
-            'allow:agent:builder:read',
-            'allow:agent:builder:write',
-            'allow:agent:qa-reviewer:read',
-            'deny:agent:analyst',
-          ],
-        },
-      }),
-      encoding: 'utf-8',
-    },
-  ]);
-});
-
-test('seedWorkflowAcls unions deny rules for agents missing directory access', async () => {
-  mock.method(RelayFileClient.prototype, 'bulkWrite', async () => {
-    throw new Error('fall back to HTTP');
-  });
-
-  const fetchMock = mock.method(globalThis, 'fetch', async () =>
-    createFetchResponse(JSON.stringify({ written: 2, errorCount: 0, errors: [] }))
-  );
-
-  await seedWorkflowAcls({
-    relayfileUrl: 'https://relay.example',
-    adminToken: 'workflow-token',
-    workspace: 'workflow-deny',
-    agents: [
-      { name: 'alpha', acl: { src: ['read'] } },
-      { name: 'beta', acl: { docs: ['write'] } },
-    ],
-  });
-
-  const body = parseFetchBody(fetchMock);
-  assert.deepEqual(body.files, [
-    {
-      path: '/docs/.relayfile.acl',
-      content: JSON.stringify({
-        semantics: {
-          permissions: ['allow:agent:beta:read', 'allow:agent:beta:write', 'deny:agent:alpha'],
-        },
-      }),
-      encoding: 'utf-8',
-    },
-    {
-      path: '/src/.relayfile.acl',
-      content: JSON.stringify({
-        semantics: {
-          permissions: ['allow:agent:alpha:read', 'deny:agent:beta'],
-        },
-      }),
-      encoding: 'utf-8',
-    },
-  ]);
-});
-
-test('seedWorkflowAcls is a no-op when there are no ACL directories to seed', async () => {
-  const bulkWriteMock = mock.method(RelayFileClient.prototype, 'bulkWrite', async () => {
-    throw new Error('bulkWrite should not be called');
-  });
-  const fetchMock = mock.method(globalThis, 'fetch', async () => {
-    throw new Error('fetch should not be called');
-  });
-
-  await seedWorkflowAcls({
-    relayfileUrl: 'https://relay.example',
-    adminToken: 'workflow-token',
-    workspace: 'workflow-empty',
-    agents: [
-      { name: 'builder', acl: {} },
-      { name: 'qa-reviewer', acl: {} },
-    ],
-  });
-
-  assert.equal(bulkWriteMock.mock.calls.length, 0);
-  assert.equal(fetchMock.mock.calls.length, 0);
-});
-
-test('seedAclRules surfaces HTTP failures from the fallback API', async () => {
-  mock.method(RelayFileClient.prototype, 'bulkWrite', async () => {
-    throw new Error('fall back to HTTP');
-  });
-
-  mock.method(globalThis, 'fetch', async () => createFetchResponse('relay unavailable', 503));
-
-  await assert.rejects(
-    seedAclRules('https://relay.example', 'acl-token', 'workspace-http', {
-      '/': ['allow:agent:builder:read'],
-    }),
-    new Error('failed to seed workspace workspace-http: HTTP 503 relay unavailable')
-  );
-});
diff --git a/packages/sdk/src/provisioner/__tests__/tar-seeder.test.ts b/packages/sdk/src/provisioner/__tests__/tar-seeder.test.ts
deleted file mode 100644
index bd44174d3..000000000
--- a/packages/sdk/src/provisioner/__tests__/tar-seeder.test.ts
+++ /dev/null
@@ -1,249 +0,0 @@
-import fs from 'node:fs';
-import { tmpdir } from 'node:os';
-import path from 'node:path';
-import * as tar from 'tar';
-import { afterEach, describe, expect, it, vi } from 'vitest';
-
-const bulkWriteMock = vi.hoisted(() => vi.fn());
-const relayFileClientMock = vi.hoisted(() => vi.fn());
-const execSyncMock = vi.hoisted(() => vi.fn());
-
-vi.mock('@relayfile/sdk', () => ({
-  RelayFileClient: relayFileClientMock.mockImplementation(() => ({
-    bulkWrite: bulkWriteMock,
-  })),
-}));
-
-vi.mock('node:child_process', () => ({
-  execSync: execSyncMock,
-}));
-
-import { seedWorkspaceTar } from '../seeder.js';
-
-const tempDirs: string[] = [];
-
-function makeTempDir(prefix: string): string {
-  const dir = fs.mkdtempSync(path.join(tmpdir(), prefix));
-  tempDirs.push(dir);
-  return dir;
-}
-
-function jsonResponse(payload: unknown, status = 200): Response {
-  return new Response(JSON.stringify(payload), {
-    status,
-    headers: { 'Content-Type': 'application/json' },
-  });
-}
-
-function listRelativeFiles(rootDir: string, currentDir = rootDir): string[] {
-  const files: string[] = [];
-  const entries = fs.readdirSync(currentDir, { withFileTypes: true });
-
-  for (const entry of entries) {
-    const absolutePath = path.join(currentDir, entry.name);
-    if (entry.isDirectory()) {
-      files.push(...listRelativeFiles(rootDir, absolutePath));
-      continue;
-    }
-    if (entry.isFile()) {
-      files.push(path.relative(rootDir, absolutePath).split(path.sep).join('/'));
-    }
-  }
-
-  return files.sort((left, right) => left.localeCompare(right));
-}
-
-async function extractTarballEntries(body: unknown): Promise<string[]> {
-  const archiveDir = makeTempDir('relay-tar-archive-');
-  const extractDir = makeTempDir('relay-tar-extract-');
-  const archivePath = path.join(archiveDir, 'seed.tar.gz');
-
-  fs.writeFileSync(archivePath, Buffer.from(body as Uint8Array));
-  await tar.extract({ file: archivePath, cwd: extractDir, gzip: true });
-
-  return listRelativeFiles(extractDir);
-}
-
-afterEach(() => {
-  bulkWriteMock.mockReset();
-  relayFileClientMock.mockClear();
-  execSyncMock.mockReset();
-  vi.restoreAllMocks();
-  vi.unstubAllGlobals();
-  for (const dir of tempDirs.splice(0)) {
-    fs.rmSync(dir, { recursive: true, force: true });
-  }
-});
-
-describe('seedWorkspaceTar', () => {
-  it('creates and uploads a tar.gz to the import endpoint and respects excludeDirs', async () => {
-    const projectDir = makeTempDir('relay-seed-project-');
-    fs.mkdirSync(path.join(projectDir, 'src'), { recursive: true });
-    fs.mkdirSync(path.join(projectDir, 'ignored'), { recursive: true });
-    fs.mkdirSync(path.join(projectDir, 'node_modules', 'left-pad'), { recursive: true });
-
-    fs.writeFileSync(path.join(projectDir, 'src', 'hello.txt'), 'hello world\n');
-    fs.writeFileSync(path.join(projectDir, 'src', 'data.bin'), Buffer.from([0xff, 0x00, 0xaa]));
-    fs.writeFileSync(path.join(projectDir, 'ignored', 'skip.txt'), 'skip me\n');
-    fs.writeFileSync(path.join(projectDir, 'node_modules', 'left-pad', 'index.js'), 'module.exports = 1;\n');
-    fs.writeFileSync(path.join(projectDir, '.relayfile-mount-state.json'), '{}\n');
-
-    execSyncMock.mockReturnValue(
-      [
-        'src/hello.txt',
-        'src/data.bin',
-        'ignored/skip.txt',
-        'node_modules/left-pad/index.js',
-        '.relayfile-mount-state.json',
-      ].join('\0')
-    );
-
-    const fetchMock = vi.fn().mockResolvedValue(jsonResponse({ imported: 2 }));
-    vi.stubGlobal('fetch', fetchMock);
-
-    const imported = await seedWorkspaceTar('https://relayfile.example/', 'token', 'rw_demo', projectDir, [
-      'ignored',
-    ]);
-
-    expect(imported).toBe(2);
-    expect(fetchMock).toHaveBeenCalledTimes(1);
-
-    const [url, init] = fetchMock.mock.calls[0];
-    expect(String(url)).toContain('/v1/workspaces/rw_demo/fs/import');
-    expect(init.method).toBe('POST');
-    expect(init.headers).toMatchObject({
-      Authorization: 'Bearer token',
-      'Content-Type': 'application/gzip',
-      'X-Correlation-Id': expect.stringMatching(/^seed-tar-rw_demo-/),
-    });
-    expect(init.body).toBeInstanceOf(Uint8Array);
-
-    const entries = await extractTarballEntries(init.body);
-    expect(entries).toEqual(expect.arrayContaining(['src/data.bin', 'src/hello.txt']));
-    expect(entries).not.toContain('ignored/skip.txt');
-    expect(entries).not.toContain('node_modules/left-pad/index.js');
-    expect(entries).not.toContain('.relayfile-mount-state.json');
-  });
-
-  it('falls back to seedWorkspace when the import endpoint returns 404', async () => {
-    const projectDir = makeTempDir('relay-seed-project-');
-    fs.mkdirSync(path.join(projectDir, 'src'), { recursive: true });
-    fs.writeFileSync(path.join(projectDir, 'src', 'hello.txt'), 'hello fallback\n');
-
-    execSyncMock.mockReturnValue('src/hello.txt\0');
-    bulkWriteMock.mockRejectedValue({ status: undefined });
-
-    const fetchMock = vi
-      .fn()
-      .mockResolvedValueOnce(new Response('missing', { status: 404 }))
-      .mockResolvedValueOnce(jsonResponse({ written: 1, errorCount: 0, errors: [] }));
-    vi.stubGlobal('fetch', fetchMock);
-
-    const imported = await seedWorkspaceTar('https://relayfile.example/', 'token', 'rw_demo', projectDir, []);
-
-    expect(imported).toBe(1);
-    expect(fetchMock).toHaveBeenCalledTimes(2);
-    expect(String(fetchMock.mock.calls[0]?.[0])).toContain('/v1/workspaces/rw_demo/fs/import');
-    expect(String(fetchMock.mock.calls[1]?.[0])).toContain('/v1/workspaces/rw_demo/fs/bulk');
-
-    const payload = JSON.parse(String(fetchMock.mock.calls[1]?.[1].body));
-    expect(payload.files).toEqual([
-      { path: '/src/hello.txt', content: 'hello fallback\n', encoding: 'utf-8' },
-    ]);
-  });
-
-  it('throws on non-404 HTTP errors', async () => {
-    const projectDir = makeTempDir('relay-seed-project-');
-    fs.mkdirSync(path.join(projectDir, 'src'), { recursive: true });
-    fs.writeFileSync(path.join(projectDir, 'src', 'hello.txt'), 'hello\n');
-
-    execSyncMock.mockReturnValue('src/hello.txt\0');
-
-    const fetchMock = vi.fn().mockResolvedValue(new Response('boom', { status: 500 }));
-    vi.stubGlobal('fetch', fetchMock);
-
-    await expect(
-      seedWorkspaceTar('https://relayfile.example/', 'token', 'rw_demo', projectDir, [])
-    ).rejects.toThrow('tar import failed for workspace rw_demo: HTTP 500 boom');
-  });
-
-  it('works for non-git directories via the directory-walk fallback path', async () => {
-    const projectDir = makeTempDir('relay-seed-project-');
-    fs.mkdirSync(path.join(projectDir, 'src'), { recursive: true });
-    fs.mkdirSync(path.join(projectDir, 'nested', 'docs'), { recursive: true });
-    fs.mkdirSync(path.join(projectDir, 'custom-ignore'), { recursive: true });
-    fs.mkdirSync(path.join(projectDir, 'node_modules', 'left-pad'), { recursive: true });
-
-    fs.writeFileSync(path.join(projectDir, 'src', 'app.ts'), 'export const app = true;\n');
-    fs.writeFileSync(path.join(projectDir, 'nested', 'docs', 'readme.md'), '# hello\n');
-    fs.writeFileSync(path.join(projectDir, 'custom-ignore', 'skip.txt'), 'skip\n');
-    fs.writeFileSync(path.join(projectDir, 'node_modules', 'left-pad', 'index.js'), 'module.exports = 1;\n');
-    fs.writeFileSync(path.join(projectDir, '.relayfile-mount-state.json'), '{}\n');
-
-    execSyncMock.mockImplementation(() => {
-      throw new Error('not a git repo');
-    });
-
-    const fetchMock = vi.fn().mockResolvedValue(jsonResponse({ imported: 2 }));
-    vi.stubGlobal('fetch', fetchMock);
-
-    const imported = await seedWorkspaceTar('https://relayfile.example/', 'token', 'rw_demo', projectDir, [
-      'custom-ignore',
-    ]);
-
-    expect(imported).toBe(2);
-    expect(fetchMock).toHaveBeenCalledTimes(1);
-
-    const [, init] = fetchMock.mock.calls[0];
-    const entries = await extractTarballEntries(init.body);
-    expect(entries).toEqual(expect.arrayContaining(['nested/docs/readme.md', 'src/app.ts']));
-    expect(entries).not.toContain('custom-ignore/skip.txt');
-    expect(entries).not.toContain('node_modules/left-pad/index.js');
-    expect(entries).not.toContain('.relayfile-mount-state.json');
-  });
-
-  it('includes untracked files returned by git ls-files and preserves gitignore filtering', async () => {
-    const projectDir = makeTempDir('relay-seed-project-');
-    fs.mkdirSync(path.join(projectDir, 'src'), { recursive: true });
-    fs.mkdirSync(path.join(projectDir, 'ignored-by-git'), { recursive: true });
-
-    fs.writeFileSync(path.join(projectDir, 'src', 'tracked.ts'), 'export const tracked = true;\n');
-    fs.writeFileSync(path.join(projectDir, 'src', 'draft.ts'), 'export const draft = true;\n');
-    fs.writeFileSync(path.join(projectDir, 'ignored-by-git', 'skip.txt'), 'skip\n');
-
-    execSyncMock.mockReturnValue(['src/tracked.ts', 'src/draft.ts'].join('\0'));
-
-    const fetchMock = vi.fn().mockResolvedValue(jsonResponse({ imported: 2 }));
-    vi.stubGlobal('fetch', fetchMock);
-
-    const imported = await seedWorkspaceTar('https://relayfile.example/', 'token', 'rw_demo', projectDir, []);
-
-    expect(imported).toBe(2);
-    expect(execSyncMock).toHaveBeenCalledWith(
-      'git ls-files -z --cached --others --exclude-standard',
-      expect.objectContaining({ cwd: path.resolve(projectDir), encoding: 'utf-8' })
-    );
-
-    const [, init] = fetchMock.mock.calls[0];
-    const entries = await extractTarballEntries(init.body);
-    expect(entries).toEqual(['src/draft.ts', 'src/tracked.ts']);
-    expect(entries).not.toContain('ignored-by-git/skip.txt');
-  });
-
-  it('does not fall back to a directory walk when git ls-files succeeds with no files', async () => {
-    const projectDir = makeTempDir('relay-seed-project-');
-    fs.mkdirSync(path.join(projectDir, 'ignored-by-git'), { recursive: true });
-    fs.writeFileSync(path.join(projectDir, 'ignored-by-git', 'skip.txt'), 'skip\n');
-
-    execSyncMock.mockReturnValue('');
-
-    const fetchMock = vi.fn().mockResolvedValue(jsonResponse({ imported: 0 }));
-    vi.stubGlobal('fetch', fetchMock);
-
-    const imported = await seedWorkspaceTar('https://relayfile.example/', 'token', 'rw_demo', projectDir, []);
-
-    expect(imported).toBe(0);
-
-    expect(fetchMock).not.toHaveBeenCalled();
-  });
-});
diff --git a/packages/sdk/src/provisioner/index.ts b/packages/sdk/src/provisioner/index.ts
deleted file mode 100644
index c6d8c88b2..000000000
--- a/packages/sdk/src/provisioner/index.ts
+++ /dev/null
@@ -1,335 +0,0 @@
-import { existsSync, readdirSync } from 'node:fs';
-import path from 'node:path';
-
-import { getDefaultPermissionAuditPath, PermissionAuditLog } from './audit.js';
-import { compileAgentScopes } from './compiler.js';
-import { ensureRelayfileMount } from './mount.js';
-import { createWorkspaceIfNeeded, seedWorkspace, seedWorkflowAcls } from './seeder.js';
-import { DEFAULT_ADMIN_AGENT_NAME, DEFAULT_ADMIN_SCOPES, mintAgentToken } from './token.js';
-import type {
-  AgentPermissions,
-  AgentProvisionMap,
-  AgentProvisionResult,
-  CompiledAgentPermissions,
-  ProvisionResult,
-  ProvisionSummary,
-  WorkflowProvisionConfig,
-} from './types.js';
-
-export * from './compiler.js';
-export * from './local-jwks.js';
-export * from './mount.js';
-export * from './seeder.js';
-export * from './token.js';
-export * from './types.js';
-export * from './audit.js';
-
-interface ProvisionableAgent {
-  name: string;
-  permissions: AgentPermissions;
-  resolutionSource: 'configured' | 'auto-discovered';
-}
-
-const DEFAULT_AGENT_NAME = 'default-agent';
-
-function discoverAgentNames(projectDir: string): string[] {
-  if (!existsSync(projectDir)) {
-    return [DEFAULT_AGENT_NAME];
-  }
-
-  const agentNames = new Set<string>();
-
-  for (const entry of readdirSync(projectDir)) {
-    const match = entry.match(/^\.(.+)\.(agentignore|agentreadonly)$/u);
-    if (match?.[1]) {
-      agentNames.add(match[1]);
-    }
-  }
-
-  const discovered = [...agentNames].sort((left, right) => left.localeCompare(right));
-  return discovered.length > 0 ? discovered : [DEFAULT_AGENT_NAME];
-}
-
-function resolveAgents(config: WorkflowProvisionConfig): ProvisionableAgent[] {
-  const configuredAgents = Object.entries(config.agents ?? {});
-  if (configuredAgents.length > 0) {
-    return configuredAgents.map(([name, permissions]) => ({
-      name,
-      permissions: permissions ?? {},
-      resolutionSource: 'configured',
-    }));
-  }
-
-  return discoverAgentNames(config.projectDir).map((name) => ({
-    name,
-    permissions: {},
-    resolutionSource: 'auto-discovered',
-  }));
-}
-
-function buildSummary(compilations: readonly CompiledAgentPermissions[]): ProvisionSummary {
-  return compilations.reduce<ProvisionSummary>(
-    (summary, compiled) => ({
-      readonly: summary.readonly + compiled.summary.readonly,
-      readwrite: summary.readwrite + compiled.summary.readwrite,
-      denied: summary.denied + compiled.summary.denied,
-      customScopes: summary.customScopes + compiled.summary.customScopes,
-    }),
-    {
-      readonly: 0,
-      readwrite: 0,
-      denied: 0,
-      customScopes: 0,
-    }
-  );
-}
-
-function buildAgentResult(
-  projectDir: string,
-  name: string,
-  token: string,
-  compiled: CompiledAgentPermissions,
-  mountPoint?: string
-): AgentProvisionResult {
-  return {
-    name,
-    tokenPath: path.resolve(projectDir, '.relay', 'tokens', `${name}.jwt`),
-    token,
-    scopes: [...compiled.scopes],
-    compiled,
-    mountPoint,
-  };
-}
-
-function sanitizePathComponent(value: string): string {
-  return value.replace(/[^a-zA-Z0-9._-]+/g, '-');
-}
-
-function countAclDirectories(compilations: readonly CompiledAgentPermissions[]): number {
-  const directories = new Set<string>();
-
-  for (const compilation of compilations) {
-    for (const directory of Object.keys(compilation.acl)) {
-      directories.add(directory);
-    }
-  }
-
-  return directories.size;
-}
-
-export async function provisionWorkflowAgents(config: WorkflowProvisionConfig): Promise<ProvisionResult> {
-  const audit = new PermissionAuditLog();
-  const auditPath = getDefaultPermissionAuditPath(config.projectDir);
-
-  try {
-    const agents = resolveAgents(config);
-    const tokens = new Map<string, string>();
-    const scopes = new Map<string, string[]>();
-    const mounts = new Map<string, Awaited<ReturnType<typeof ensureRelayfileMount>>>();
-    const agentResults: AgentProvisionMap = {};
-    const compilations: CompiledAgentPermissions[] = [];
-    const compiledByAgent = new Map<string, CompiledAgentPermissions>();
-
-    for (const agent of agents) {
-      audit.log({
-        agentName: agent.name,
-        action: 'resolve',
-        details: {
-          source: agent.resolutionSource,
-          workspace: config.workspace,
-          permissionKeys: Object.keys(agent.permissions).sort(),
-        },
-      });
-
-      const compiled = compileAgentScopes({
-        agentName: agent.name,
-        workspace: config.workspace,
-        projectDir: config.projectDir,
-        permissions: agent.permissions,
-      });
-      const token = mintAgentToken({
-        privateKey: config.tokenSigningKey.privateKey,
-        kid: config.tokenSigningKey.kid,
-        agentName: agent.name,
-        workspace: config.workspace,
-        scopes: compiled.scopes,
-        ttlSeconds: config.tokenTtlSeconds,
-      });
-
-      audit.log({
-        agentName: agent.name,
-        action: 'mint',
-        details: {
-          workspace: config.workspace,
-          jwtPath: path.resolve(config.projectDir, '.relay', 'tokens', `${agent.name}.jwt`),
-          scopeCount: compiled.scopes.length,
-          scopes: [...compiled.scopes],
-          ttlSeconds: config.tokenTtlSeconds ?? null,
-        },
-      });
-
-      tokens.set(agent.name, token);
-      scopes.set(agent.name, [...compiled.scopes]);
-      compilations.push(compiled);
-      compiledByAgent.set(agent.name, compiled);
-    }
-
-    const adminScopes = [...(config.adminScopes ?? DEFAULT_ADMIN_SCOPES)];
-    const adminToken = mintAgentToken({
-      privateKey: config.tokenSigningKey.privateKey,
-      kid: config.tokenSigningKey.kid,
-      agentName: DEFAULT_ADMIN_AGENT_NAME,
-      workspace: config.workspace,
-      scopes: adminScopes,
-      ttlSeconds: config.tokenTtlSeconds,
-    });
-
-    audit.log({
-      agentName: DEFAULT_ADMIN_AGENT_NAME,
-      action: 'mint',
-      details: {
-        workspace: config.workspace,
-        role: 'admin',
-        scopeCount: adminScopes.length,
-        scopes: adminScopes,
-        ttlSeconds: config.tokenTtlSeconds ?? null,
-      },
-    });
-
-    let seededAclCount = 0;
-    let seededFileCount = 0;
-
-    if (!config.skipSeeding) {
-      await createWorkspaceIfNeeded(config.relayfileBaseUrl, adminToken, config.workspace);
-      audit.log({
-        agentName: DEFAULT_ADMIN_AGENT_NAME,
-        action: 'seed',
-        details: {
-          workspace: config.workspace,
-          step: 'workspace',
-          relayfileBaseUrl: config.relayfileBaseUrl,
-        },
-      });
-
-      seededFileCount = await seedWorkspace(
-        config.relayfileBaseUrl,
-        adminToken,
-        config.workspace,
-        config.projectDir,
-        config.excludeDirs ?? []
-      );
-      audit.log({
-        agentName: DEFAULT_ADMIN_AGENT_NAME,
-        action: 'seed',
-        details: {
-          workspace: config.workspace,
-          step: 'files',
-          projectDir: config.projectDir,
-          excludeDirs: config.excludeDirs ?? [],
-          fileCount: seededFileCount,
-        },
-      });
-
-      await seedWorkflowAcls({
-        relayfileUrl: config.relayfileBaseUrl,
-        adminToken,
-        workspace: config.workspace,
-        agents: compilations.map((compilation) => ({
-          name: compilation.agentName,
-          acl: compilation.acl,
-        })),
-      });
-      seededAclCount = countAclDirectories(compilations);
-      audit.log({
-        agentName: DEFAULT_ADMIN_AGENT_NAME,
-        action: 'seed',
-        details: {
-          workspace: config.workspace,
-          step: 'acl',
-          directoryCount: seededAclCount,
-          agentCount: compilations.length,
-        },
-      });
-    }
-
-    if (!config.skipMount) {
-      const mountRoot = path.resolve(config.mountBaseDir ?? path.join(config.projectDir, '.relay'));
-      try {
-        for (const agent of agents) {
-          const token = tokens.get(agent.name);
-          const compiled = compiledByAgent.get(agent.name);
-          if (!token || !compiled) {
-            continue;
-          }
-
-          const mountHandle = await ensureRelayfileMount({
-            binaryPath: config.mountBinaryPath,
-            relayfileUrl: config.relayfileBaseUrl,
-            workspace: config.workspace,
-            token,
-            mountPoint: path.join(
-              mountRoot,
-              `workspace-${sanitizePathComponent(config.workspace)}-${sanitizePathComponent(agent.name)}`
-            ),
-          });
-
-          mounts.set(agent.name, mountHandle);
-          agentResults[agent.name] = buildAgentResult(
-            config.projectDir,
-            agent.name,
-            token,
-            compiled,
-            mountHandle.mountPoint
-          );
-        }
-      } catch (mountError) {
-        for (const [, mount] of mounts) {
-          try {
-            if (typeof mount.stop === 'function') {
-              await mount.stop();
-            }
-          } catch {
-            // Best-effort cleanup — ignore individual stop failures.
-          }
-        }
-        mounts.clear();
-        throw mountError;
-      }
-    } else {
-      for (const agent of agents) {
-        const token = tokens.get(agent.name);
-        const compiled = compiledByAgent.get(agent.name);
-        if (!token || !compiled) {
-          continue;
-        }
-
-        agentResults[agent.name] = buildAgentResult(config.projectDir, agent.name, token, compiled);
-      }
-    }
-
-    return {
-      agents: agentResults,
-      agentNames: agents.map((agent) => agent.name),
-      adminToken,
-      seededFileCount,
-      seededAclCount,
-      summary: buildSummary(compilations),
-      mounts,
-      tokens,
-      scopes,
-    };
-  } finally {
-    try {
-      await audit.writeTo(auditPath);
-    } catch (error) {
-      if (config.verbose) {
-        const message = error instanceof Error ? error.message : String(error);
-        console.warn(`Failed to write permission audit to ${auditPath}: ${message}`);
-      }
-    }
-
-    if (config.verbose) {
-      console.info(audit.summary());
-    }
-  }
-}
diff --git a/packages/sdk/src/provisioner/mount.ts b/packages/sdk/src/provisioner/mount.ts
deleted file mode 100644
index 049197299..000000000
--- a/packages/sdk/src/provisioner/mount.ts
+++ /dev/null
@@ -1,419 +0,0 @@
-import { execSync, spawn, type ChildProcess } from 'node:child_process';
-import { createHash } from 'node:crypto';
-import {
-  accessSync,
-  chmodSync,
-  constants,
-  createWriteStream,
-  existsSync,
-  mkdirSync,
-  readFileSync,
-  renameSync,
-  rmSync,
-  writeFileSync,
-} from 'node:fs';
-import { mkdtemp, rm } from 'node:fs/promises';
-import https from 'node:https';
-import os from 'node:os';
-import path from 'node:path';
-
-const RELAYFILE_VERSION = '0.1.6';
-const RELEASE_BASE_URL = 'https://github.com/AgentWorkforce/relayfile/releases/download';
-const CHECKSUMS_FILE = 'checksums.txt';
-const CACHE_DIR = path.join(os.homedir(), '.agent-relay', 'bin');
-const CACHE_PATH = path.join(CACHE_DIR, 'relayfile-mount');
-const VERSION_PATH = path.join(CACHE_DIR, 'relayfile-mount.version');
-const SUPPORTED_TARGETS = ['darwin-arm64', 'darwin-amd64', 'linux-arm64', 'linux-amd64'].join(', ');
-
-const PLATFORM_ARCH_MAP: Record<string, string> = {
-  'darwin:arm64': 'darwin-arm64',
-  'darwin:x64': 'darwin-amd64',
-  'linux:arm64': 'linux-arm64',
-  'linux:x64': 'linux-amd64',
-};
-
-export interface MountConfig {
-  binaryPath?: string;
-  relayfileUrl: string;
-  workspace: string;
-  token: string;
-  mountPoint?: string;
-}
-
-export interface MountHandle {
-  pid: number;
-  mountPoint: string;
-  stop(): Promise<void>;
-}
-
-function ensureCacheDir(): void {
-  mkdirSync(CACHE_DIR, { recursive: true });
-}
-
-function getRelayfileTarget(): string {
-  const target = PLATFORM_ARCH_MAP[`${os.platform()}:${os.arch()}`];
-  if (!target) {
-    throw new Error(
-      `Unsupported platform for relayfile-mount: ${os.platform()}-${os.arch()}. Supported targets: ${SUPPORTED_TARGETS}.`
-    );
-  }
-
-  return target;
-}
-
-function getReleaseAssetUrl(assetName: string): string {
-  return `${RELEASE_BASE_URL}/v${RELAYFILE_VERSION}/${assetName}`;
-}
-
-function readCachedVersion(): string | null {
-  try {
-    return readFileSync(VERSION_PATH, 'utf8').trim() || null;
-  } catch {
-    return null;
-  }
-}
-
-function isExecutable(filePath: string): boolean {
-  try {
-    accessSync(filePath, constants.X_OK);
-    return true;
-  } catch {
-    return false;
-  }
-}
-
-function downloadErrorMessage(url: string, status: number): string {
-  return `Download failed with status ${status} for ${url}`;
-}
-
-function downloadBinary(url: string, destPath: string, maxRedirects = 5): Promise<void> {
-  ensureCacheDir();
-
-  const attemptDownload = (
-    currentUrl: string,
-    redirectsRemaining: number,
-    resolve: () => void,
-    reject: (error: Error) => void
-  ) => {
-    const request = https.get(currentUrl, (res) => {
-      const status = res.statusCode ?? 0;
-      const location = res.headers.location;
-      const isRedirect = status >= 300 && status < 400 && location;
-
-      if (isRedirect) {
-        if (redirectsRemaining <= 0) {
-          res.resume();
-          reject(new Error('Too many redirects while downloading relayfile-mount'));
-          return;
-        }
-
-        const nextUrl = new URL(location, currentUrl).toString();
-        res.resume();
-        attemptDownload(nextUrl, redirectsRemaining - 1, resolve, reject);
-        return;
-      }
-
-      if (status !== 200) {
-        res.resume();
-        reject(new Error(downloadErrorMessage(currentUrl, status)));
-        return;
-      }
-
-      const fileStream = createWriteStream(destPath, { mode: 0o755 });
-      res.pipe(fileStream);
-      fileStream.on('finish', () => {
-        fileStream.close(() => resolve());
-      });
-      fileStream.on('error', (error) => reject(error instanceof Error ? error : new Error(String(error))));
-      res.on('error', (error) => reject(error instanceof Error ? error : new Error(String(error))));
-    });
-
-    request.on('error', (error) => reject(error instanceof Error ? error : new Error(String(error))));
-  };
-
-  return new Promise<void>((resolve, reject) => {
-    attemptDownload(url, maxRedirects, resolve, reject);
-  }).catch((error: unknown) => {
-    try {
-      rmSync(destPath, { force: true });
-    } catch {
-      // Ignore cleanup failures.
-    }
-
-    throw error;
-  });
-}
-
-function downloadText(url: string, maxRedirects = 5): Promise<string> {
-  const fetchWithRedirects = (
-    currentUrl: string,
-    redirectsRemaining: number,
-    resolve: (text: string) => void,
-    reject: (error: Error) => void
-  ) => {
-    const request = https.get(currentUrl, (res) => {
-      const status = res.statusCode ?? 0;
-      const location = res.headers.location;
-      const isRedirect = status >= 300 && status < 400 && location;
-
-      if (isRedirect) {
-        if (redirectsRemaining <= 0) {
-          res.resume();
-          reject(new Error('Too many redirects while downloading relayfile checksums'));
-          return;
-        }
-
-        const nextUrl = new URL(location, currentUrl).toString();
-        res.resume();
-        fetchWithRedirects(nextUrl, redirectsRemaining - 1, resolve, reject);
-        return;
-      }
-
-      if (status !== 200) {
-        res.resume();
-        reject(new Error(downloadErrorMessage(currentUrl, status)));
-        return;
-      }
-
-      const chunks: Buffer[] = [];
-      res.on('data', (chunk) => {
-        chunks.push(Buffer.isBuffer(chunk) ? chunk : Buffer.from(chunk));
-      });
-      res.on('end', () => resolve(Buffer.concat(chunks).toString('utf8')));
-      res.on('error', (error) => reject(error instanceof Error ? error : new Error(String(error))));
-    });
-
-    request.on('error', (error) => reject(error instanceof Error ? error : new Error(String(error))));
-  };
-
-  return new Promise((resolve, reject) => {
-    fetchWithRedirects(url, maxRedirects, resolve, reject);
-  });
-}
-
-function getExpectedChecksum(checksumContent: string, binaryName: string): string {
-  for (const line of checksumContent.split('\n')) {
-    const trimmed = line.trim();
-    if (!trimmed) {
-      continue;
-    }
-
-    const match = trimmed.match(/^([a-fA-F0-9]{64})\s+\*?(.+)$/);
-    if (!match) {
-      continue;
-    }
-
-    const entryName = path.basename(match[2].trim());
-    if (entryName === binaryName) {
-      return match[1].toLowerCase();
-    }
-  }
-
-  throw new Error(`No checksum entry found for ${binaryName}`);
-}
-
-async function verifyChecksum(filePath: string, binaryName: string): Promise<void> {
-  const checksumUrl = getReleaseAssetUrl(CHECKSUMS_FILE);
-  const checksumContent = await downloadText(checksumUrl);
-  const expectedHash = getExpectedChecksum(checksumContent, binaryName);
-  const actualHash = createHash('sha256').update(readFileSync(filePath)).digest('hex');
-
-  if (actualHash !== expectedHash) {
-    throw new Error(`Checksum mismatch for ${binaryName}: expected ${expectedHash}, got ${actualHash}`);
-  }
-}
-
-function resignBinaryForMacOS(binaryPath: string): void {
-  if (os.platform() !== 'darwin') {
-    return;
-  }
-
-  try {
-    execSync(`codesign --force --sign - "${binaryPath}"`, { stdio: 'pipe' });
-  } catch {
-    // Ignore best-effort re-sign failures.
-  }
-}
-
-async function ensureRelayfileMountBinary(binaryPath?: string): Promise<string> {
-  if (binaryPath) {
-    return binaryPath;
-  }
-
-  if (process.env.RELAYFILE_ROOT) {
-    return path.join(process.env.RELAYFILE_ROOT, 'bin', 'relayfile-mount');
-  }
-
-  const target = getRelayfileTarget();
-  const binaryName = `relayfile-mount-${target}`;
-  const downloadUrl = getReleaseAssetUrl(binaryName);
-
-  ensureCacheDir();
-
-  if (existsSync(CACHE_PATH) && readCachedVersion() === RELAYFILE_VERSION) {
-    if (!isExecutable(CACHE_PATH)) {
-      chmodSync(CACHE_PATH, 0o755);
-    }
-    return CACHE_PATH;
-  }
-
-  const tempPath = path.join(CACHE_DIR, `relayfile-mount.${process.pid}.${Date.now()}.download`);
-
-  try {
-    await downloadBinary(downloadUrl, tempPath);
-    await verifyChecksum(tempPath, binaryName);
-    chmodSync(tempPath, 0o755);
-    renameSync(tempPath, CACHE_PATH);
-    chmodSync(CACHE_PATH, 0o755);
-    resignBinaryForMacOS(CACHE_PATH);
-    writeFileSync(VERSION_PATH, `${RELAYFILE_VERSION}\n`, 'utf8');
-    return CACHE_PATH;
-  } catch (error) {
-    try {
-      rmSync(tempPath, { force: true });
-    } catch {
-      // Ignore cleanup failures.
-    }
-
-    const message = error instanceof Error ? error.message : String(error);
-    throw new Error(`Failed to install relayfile-mount from ${downloadUrl}: ${message}`);
-  }
-}
-
-async function runCommandCapture(command: string, args: string[], env: NodeJS.ProcessEnv): Promise<string> {
-  return await new Promise((resolve, reject) => {
-    const proc = spawn(command, args, { stdio: ['ignore', 'pipe', 'pipe'], env });
-    let output = '';
-
-    proc.stdout.setEncoding('utf8');
-    proc.stderr.setEncoding('utf8');
-
-    proc.stdout.on('data', (chunk: string) => {
-      output += chunk;
-    });
-    proc.stderr.on('data', (chunk: string) => {
-      output += chunk;
-    });
-
-    proc.on('error', (error) => {
-      reject(error);
-    });
-
-    proc.on('close', (code, signal) => {
-      if (code === 0) {
-        resolve(output);
-        return;
-      }
-
-      const reason = signal ? `signal ${signal}` : `exit code ${typeof code === 'number' ? code : 'unknown'}`;
-      const detail = output.trim();
-      reject(new Error(detail || `command failed with ${reason}`));
-    });
-  });
-}
-
-function ensureProcessRunning(processRef: ChildProcess): boolean {
-  return processRef.exitCode === null && !processRef.killed;
-}
-
-async function stopMountProcess(processRef: ChildProcess): Promise<void> {
-  if (processRef.exitCode !== null || !processRef.pid) {
-    return;
-  }
-
-  processRef.kill('SIGTERM');
-  await new Promise<void>((resolve) => {
-    const timeout = setTimeout(() => {
-      if (processRef.exitCode === null && processRef.pid) {
-        processRef.kill('SIGKILL');
-      }
-      resolve();
-    }, 1200);
-    processRef.once('exit', () => {
-      clearTimeout(timeout);
-      resolve();
-    });
-  });
-}
-
-export async function ensureRelayfileMount(config: MountConfig): Promise<MountHandle> {
-  const binaryPath = await ensureRelayfileMountBinary(config.binaryPath);
-  if (!existsSync(binaryPath)) {
-    throw new Error(`missing relayfile mount binary: ${binaryPath}`);
-  }
-
-  const mountPoint =
-    config.mountPoint ?? (await mkdtemp(path.join(os.tmpdir(), `relayfile-mount-${config.workspace}-`)));
-  mkdirSync(mountPoint, { recursive: true });
-
-  const mountBaseArgs = [
-    '--base-url',
-    config.relayfileUrl,
-    '--workspace',
-    config.workspace,
-    '--local-dir',
-    mountPoint,
-  ];
-  const onceArgs = [...mountBaseArgs, '--once'];
-  const mountEnv = {
-    ...process.env,
-    RELAYFILE_TOKEN: config.token,
-  };
-
-  let mountProc: ChildProcess | undefined;
-  let startupPhase = 'initial workspace sync';
-  try {
-    await runCommandCapture(binaryPath, onceArgs, mountEnv);
-
-    startupPhase = 'mount process startup';
-    const startedMountProc = spawn(binaryPath, mountBaseArgs, {
-      stdio: ['ignore', 'ignore', 'ignore'],
-      env: mountEnv,
-    });
-    mountProc = startedMountProc;
-
-    await new Promise<void>((resolve, reject) => {
-      const timer = setTimeout(() => resolve(), 600);
-      startedMountProc.on('error', (spawnError) => {
-        clearTimeout(timer);
-        reject(spawnError);
-      });
-      startedMountProc.on('spawn', () => {
-        clearTimeout(timer);
-        resolve();
-      });
-    });
-
-    if (!ensureProcessRunning(startedMountProc) || typeof startedMountProc.pid !== 'number') {
-      await stopMountProcess(startedMountProc).catch(() => undefined);
-      throw new Error(`mount process for workspace ${config.workspace} exited before continuing`);
-    }
-  } catch (error) {
-    if (mountProc) {
-      await stopMountProcess(mountProc).catch(() => undefined);
-    }
-    await rm(mountPoint, { recursive: true, force: true }).catch(() => undefined);
-    const message = error instanceof Error ? error.message : String(error);
-    throw new Error(`${startupPhase} failed for ${config.workspace}: ${message}`);
-  }
-
-  if (!mountProc || typeof mountProc.pid !== 'number') {
-    await rm(mountPoint, { recursive: true, force: true }).catch(() => undefined);
-    throw new Error(`mount process startup failed for ${config.workspace}: missing process id`);
-  }
-
-  let stopped = false;
-
-  return {
-    pid: mountProc.pid,
-    mountPoint,
-    async stop(): Promise<void> {
-      if (stopped) {
-        return;
-      }
-      stopped = true;
-      await stopMountProcess(mountProc).catch(() => undefined);
-      await rm(mountPoint, { recursive: true, force: true }).catch(() => undefined);
-    },
-  };
-}
diff --git a/packages/sdk/src/provisioner/seeder.ts b/packages/sdk/src/provisioner/seeder.ts
deleted file mode 100644
index 4b3c4e192..000000000
--- a/packages/sdk/src/provisioner/seeder.ts
+++ /dev/null
@@ -1,571 +0,0 @@
-import { RelayFileClient } from '@relayfile/sdk';
-import { execSync } from 'node:child_process';
-import fs from 'node:fs';
-import path from 'node:path';
-import * as tar from 'tar';
-
-interface BulkWriteResponseShape {
-  written?: number;
-  errorCount?: number;
-  errors?: unknown;
-}
-
-interface SeedFile {
-  path: string;
-  content: string;
-  encoding?: 'utf-8' | 'base64';
-}
-
-interface SeedFileResult {
-  written: number;
-  errorCount: number;
-  errors: unknown;
-}
-
-const DEFAULT_EXCLUDED_DIRS = ['.relay', '.git', 'node_modules'];
-const DEFAULT_EXCLUDED_FILES = new Set(['.relayfile-mount-state.json']);
-const BATCH_SIZE = 50;
-const utf8Decoder = new TextDecoder('utf-8', { fatal: true });
-
-interface WorkflowAclAgent {
-  name: string;
-  acl: Record<string, string[]>;
-}
-
-interface SeedWorkflowAclsOptions {
-  relayfileUrl: string;
-  adminToken: string;
-  workspace: string;
-  agents: WorkflowAclAgent[];
-}
-
-function normalizeBaseUrl(baseUrl: string): string {
-  const url = String(baseUrl ?? '').trim();
-  let end = url.length;
-  while (end > 0 && url.charCodeAt(end - 1) === 0x2f) {
-    end--;
-  }
-  return end === url.length ? url : url.slice(0, end);
-}
-
-function normalizeWorkspaceId(workspaceId: string): string {
-  const value = String(workspaceId ?? '').trim();
-  if (!value) {
-    throw new Error('workspaceId is required');
-  }
-  return value;
-}
-
-function normalizeExcludeDirs(excludeDirs: string[]): Set<string> {
-  const result = new Set<string>();
-  for (const dir of excludeDirs) {
-    const normalized = String(dir ?? '')
-      .trim()
-      .replace(/^[/\\]+|[/\\]+$/g, '');
-    if (!normalized) {
-      continue;
-    }
-    result.add(normalized);
-  }
-  return result;
-}
-
-function normalizeAclDirectory(dirPath: string): string {
-  const normalized = String(dirPath ?? '')
-    .trim()
-    .replace(/\\/gu, '/')
-    .replace(/\/+$/u, '');
-
-  if (!normalized || normalized === '/') {
-    return '/';
-  }
-
-  return normalized.startsWith('/') ? normalized : `/${normalized}`;
-}
-
-function isReviewerAgent(agentName: string): boolean {
-  return /reviewer/iu.test(String(agentName ?? '').trim());
-}
-
-function createClient(baseUrl: string, token: string): RelayFileClient {
-  return new RelayFileClient({
-    baseUrl: normalizeBaseUrl(baseUrl),
-    token,
-    retry: { maxRetries: 0 },
-  });
-}
-
-function isUtf8(raw: Buffer): boolean {
-  try {
-    utf8Decoder.decode(raw);
-    return true;
-  } catch {
-    return false;
-  }
-}
-
-function buildSeedFilePayload(filePath: string, rootDir: string): SeedFile {
-  const relative = path.relative(rootDir, filePath).split(path.sep).join('/');
-  const raw = fs.readFileSync(filePath);
-  if (isUtf8(raw)) {
-    return { path: `/${relative}`, content: raw.toString('utf8'), encoding: 'utf-8' };
-  }
-  return { path: `/${relative}`, content: raw.toString('base64'), encoding: 'base64' };
-}
-
-function collectSeedPaths(
-  rootDir: string,
-  currentRelative: string,
-  excludeDirs: Set<string>,
-  output: string[]
-): void {
-  const absoluteDir = path.join(rootDir, currentRelative);
-  const entries = fs.readdirSync(absoluteDir, { withFileTypes: true });
-
-  for (const entry of entries) {
-    if (excludeDirs.has(entry.name)) {
-      continue;
-    }
-    if (DEFAULT_EXCLUDED_FILES.has(entry.name)) {
-      continue;
-    }
-
-    const nextRelative = currentRelative ? `${currentRelative}/${entry.name}` : entry.name;
-    const absolutePath = path.join(rootDir, nextRelative);
-
-    if (excludeDirs.has(nextRelative)) {
-      continue;
-    }
-
-    if (entry.isDirectory()) {
-      collectSeedPaths(rootDir, nextRelative, excludeDirs, output);
-      continue;
-    }
-
-    if (entry.isFile()) {
-      output.push(absolutePath);
-      continue;
-    }
-
-    if (entry.isSymbolicLink()) {
-      try {
-        const resolved = fs.realpathSync(absolutePath);
-        if (!resolved.startsWith(rootDir + path.sep) && resolved !== rootDir) {
-          continue;
-        }
-        const stat = fs.statSync(resolved);
-        if (stat.isDirectory()) {
-          collectSeedPaths(rootDir, nextRelative, excludeDirs, output);
-          continue;
-        }
-        if (stat.isFile()) {
-          output.push(absolutePath);
-        }
-      } catch {
-        // Ignore symlinks that cannot be resolved.
-      }
-    }
-  }
-}
-
-function parseBulkWriteResponse(payload: unknown): SeedFileResult {
-  if (!payload || typeof payload !== 'object') {
-    return { written: 0, errorCount: 0, errors: [] };
-  }
-  const parsed = payload as BulkWriteResponseShape;
-  return {
-    written: typeof parsed.written === 'number' ? parsed.written : 0,
-    errorCount: typeof parsed.errorCount === 'number' ? parsed.errorCount : 0,
-    errors: parsed.errors ?? [],
-  };
-}
-
-async function postBulkWrite(
-  baseUrl: string,
-  token: string,
-  workspaceId: string,
-  files: SeedFile[],
-  correlationId: string
-): Promise<SeedFileResult> {
-  const response = await fetch(
-    `${normalizeBaseUrl(baseUrl)}/v1/workspaces/${encodeURIComponent(workspaceId)}/fs/bulk`,
-    {
-      method: 'POST',
-      headers: {
-        Authorization: `Bearer ${token}`,
-        'Content-Type': 'application/json',
-        'X-Correlation-Id': correlationId,
-      },
-      body: JSON.stringify({ files }),
-    }
-  );
-
-  const body = await response.text();
-  if (!response.ok) {
-    throw new Error(`failed to seed workspace ${workspaceId}: HTTP ${response.status} ${body}`.trim());
-  }
-
-  if (!body) {
-    return { written: files.length, errorCount: 0, errors: [] };
-  }
-  try {
-    return parseBulkWriteResponse(JSON.parse(body));
-  } catch {
-    return { written: files.length, errorCount: 0, errors: [] };
-  }
-}
-
-async function writeBulkWrite(
-  baseUrl: string,
-  token: string,
-  workspaceId: string,
-  files: SeedFile[],
-  correlationId: string
-): Promise<SeedFileResult> {
-  const client = createClient(baseUrl, token);
-  try {
-    const response = await client.bulkWrite({
-      workspaceId,
-      files,
-      correlationId,
-    });
-    return parseBulkWriteResponse(response);
-  } catch (error) {
-    if (typeof (error as { status?: number }).status === 'number') {
-      throw error;
-    }
-  }
-
-  return postBulkWrite(baseUrl, token, workspaceId, files, correlationId);
-}
-
-export async function createWorkspaceIfNeeded(
-  baseUrl: string,
-  token: string,
-  workspaceId: string
-): Promise<void> {
-  const workspace = normalizeWorkspaceId(workspaceId);
-  const client = createClient(baseUrl, token);
-
-  const maybeCreateWorkspace = client as unknown as {
-    createWorkspace?: (...input: unknown[]) => Promise<unknown>;
-  };
-  if (typeof maybeCreateWorkspace.createWorkspace === 'function') {
-    for (const arg of [workspace, { id: workspace }, { workspaceId: workspace }, { name: workspace }]) {
-      try {
-        await maybeCreateWorkspace.createWorkspace(arg);
-        return;
-      } catch {
-        // Continue to the next overload candidate, then fallback to HTTP.
-      }
-    }
-  }
-
-  const endpoint = `${normalizeBaseUrl(baseUrl)}/v1/workspaces`;
-  const bodyCandidates: Array<Record<string, string>> = [
-    { name: workspace },
-    { workspace: workspace },
-    { workspaceId: workspace },
-    { id: workspace },
-  ];
-  let lastFailure: string | null = null;
-
-  for (const body of bodyCandidates) {
-    try {
-      const response = await fetch(endpoint, {
-        method: 'POST',
-        headers: {
-          Authorization: `Bearer ${token}`,
-          'Content-Type': 'application/json',
-          'X-Correlation-Id': `create-workspace-${Date.now()}`,
-        },
-        body: JSON.stringify(body),
-      });
-
-      if (
-        response.status === 200 ||
-        response.status === 201 ||
-        response.status === 204 ||
-        response.status === 409
-      ) {
-        return;
-      }
-
-      const responseBody = await response.text().catch(() => '');
-      lastFailure = `HTTP ${response.status} ${responseBody}`.trim();
-      if (response.status < 500 && response.status !== 409) {
-        continue;
-      }
-    } catch (error) {
-      lastFailure = String(error);
-    }
-  }
-
-  if (lastFailure) {
-    throw new Error(`Failed to create workspace ${workspace}: ${lastFailure}`);
-  }
-}
-
-export async function seedAclRules(
-  baseUrl: string,
-  token: string,
-  workspaceId: string,
-  aclRules: Record<string, string[]>
-): Promise<void> {
-  const workspace = normalizeWorkspaceId(workspaceId);
-  const files = Object.entries(aclRules).map(([dirPath, rules]) => {
-    const normalizedDir = String(dirPath ?? '')
-      .trim()
-      .replace(/\/+$/, '');
-    const aclPath =
-      normalizedDir === '' || normalizedDir === '/' ? '/.relayfile.acl' : `${normalizedDir}/.relayfile.acl`;
-    return {
-      path: aclPath,
-      content: JSON.stringify({ semantics: { permissions: rules } }),
-      encoding: 'utf-8' as const,
-    };
-  });
-
-  if (files.length === 0) {
-    return;
-  }
-
-  const result = await writeBulkWrite(
-    baseUrl,
-    token,
-    workspace,
-    files,
-    `seed-acl-${workspace}-${Date.now()}`
-  );
-  if (result.errorCount > 0) {
-    const details = result.errors ? JSON.stringify(result.errors) : '[]';
-    throw new Error(`ACL seeding had ${result.errorCount} error(s) for workspace ${workspace}: ${details}`);
-  }
-}
-
-export async function seedWorkspace(
-  baseUrl: string,
-  token: string,
-  workspaceId: string,
-  projectDir: string,
-  excludeDirs: string[]
-): Promise<number> {
-  const workspace = normalizeWorkspaceId(workspaceId);
-  const rootDir = path.resolve(projectDir);
-  const excludes = normalizeExcludeDirs([...DEFAULT_EXCLUDED_DIRS, ...excludeDirs]);
-  const seedPaths: string[] = [];
-  collectSeedPaths(rootDir, '', excludes, seedPaths);
-  const allFiles = seedPaths
-    .sort((left, right) => left.localeCompare(right))
-    .map((filePath) => buildSeedFilePayload(filePath, rootDir));
-
-  let seededCount = 0;
-  for (let index = 0; index < allFiles.length; index += BATCH_SIZE) {
-    const batch = allFiles.slice(index, index + BATCH_SIZE);
-    const batchIndex = Math.floor(index / BATCH_SIZE);
-    const result = await writeBulkWrite(
-      baseUrl,
-      token,
-      workspace,
-      batch,
-      `seed-workspace-${workspace}-${Date.now()}-${batchIndex}`
-    );
-    seededCount += result.written;
-  }
-
-  return seededCount;
-}
-
-function buildWorkflowAclRules(agents: WorkflowAclAgent[]): Record<string, string[]> {
-  const directories = new Set<string>();
-  const normalizedAgents = agents.map((agent) => ({
-    name: String(agent.name ?? '').trim(),
-    acl: Object.fromEntries(
-      Object.entries(agent.acl ?? {}).map(([dirPath, rules]) => [
-        normalizeAclDirectory(dirPath),
-        Array.isArray(rules) ? rules : [],
-      ])
-    ),
-  }));
-  const reviewerNames = normalizedAgents
-    .map((agent) => agent.name)
-    .filter((name) => name !== '' && isReviewerAgent(name));
-
-  for (const agent of normalizedAgents) {
-    for (const dirPath of Object.keys(agent.acl)) {
-      directories.add(dirPath);
-    }
-  }
-
-  const merged = new Map<string, Set<string>>();
-
-  for (const dirPath of [...directories].sort((left, right) => left.localeCompare(right))) {
-    const rules = new Set<string>();
-
-    for (const reviewerName of reviewerNames) {
-      rules.add(`allow:agent:${reviewerName}:read`);
-    }
-
-    for (const agent of normalizedAgents) {
-      if (!agent.name) {
-        continue;
-      }
-
-      const agentRules = agent.acl[dirPath] ?? [];
-      const hasRead = agentRules.includes('read') || agentRules.includes('write');
-      const hasWrite = agentRules.includes('write');
-
-      if (hasRead) {
-        rules.add(`allow:agent:${agent.name}:read`);
-      } else if (!isReviewerAgent(agent.name)) {
-        rules.add(`deny:agent:${agent.name}`);
-      }
-
-      if (hasWrite) {
-        rules.add(`allow:agent:${agent.name}:write`);
-      }
-    }
-
-    if (rules.size > 0) {
-      merged.set(dirPath, rules);
-    }
-  }
-
-  return Object.fromEntries([...merged.entries()].map(([dirPath, rules]) => [dirPath, [...rules].sort()]));
-}
-
-export async function seedWorkflowAcls({
-  relayfileUrl,
-  adminToken,
-  workspace,
-  agents,
-}: SeedWorkflowAclsOptions): Promise<void> {
-  const aclRules = buildWorkflowAclRules(agents);
-
-  if (Object.keys(aclRules).length === 0) {
-    return;
-  }
-
-  await seedAclRules(relayfileUrl, adminToken, workspace, aclRules);
-}
-
-// ── Tar-based bulk upload ───────────────────────────────────────────────────
-
-interface ImportResponseShape {
-  imported?: number;
-}
-
-function getGitTrackedFiles(rootDir: string): string[] | null {
-  try {
-    const output = execSync('git ls-files -z --cached --others --exclude-standard', {
-      cwd: rootDir,
-      encoding: 'utf-8',
-      maxBuffer: 50 * 1024 * 1024,
-    });
-    const files = output.split('\0').filter(Boolean);
-    return files;
-  } catch {
-    return null;
-  }
-}
-
-function collectAllFiles(rootDir: string, excludeDirs: Set<string>): string[] {
-  const files: string[] = [];
-  const stack = [''];
-
-  while (stack.length > 0) {
-    const currentRelative = stack.pop()!;
-    const absoluteDir = path.join(rootDir, currentRelative);
-    let entries: fs.Dirent[];
-    try {
-      entries = fs.readdirSync(absoluteDir, { withFileTypes: true });
-    } catch {
-      continue;
-    }
-
-    for (const entry of entries) {
-      if (excludeDirs.has(entry.name)) continue;
-      if (DEFAULT_EXCLUDED_FILES.has(entry.name)) continue;
-      const nextRelative = currentRelative ? `${currentRelative}/${entry.name}` : entry.name;
-      if (excludeDirs.has(nextRelative)) continue;
-
-      if (entry.isDirectory()) {
-        stack.push(nextRelative);
-      } else if (entry.isFile()) {
-        files.push(nextRelative);
-      }
-    }
-  }
-
-  return files;
-}
-
-async function createTarBuffer(rootDir: string, files: string[]): Promise<Buffer> {
-  const tarStream = tar.create({ gzip: true, cwd: rootDir, portable: true, follow: true }, files);
-  const chunks: Buffer[] = [];
-  for await (const chunk of tarStream) {
-    chunks.push(Buffer.from(chunk as Uint8Array));
-  }
-  return Buffer.concat(chunks);
-}
-
-export async function seedWorkspaceTar(
-  baseUrl: string,
-  token: string,
-  workspaceId: string,
-  projectDir: string,
-  excludeDirs: string[]
-): Promise<number> {
-  const workspace = normalizeWorkspaceId(workspaceId);
-  const rootDir = path.resolve(projectDir);
-  const excludes = normalizeExcludeDirs([...DEFAULT_EXCLUDED_DIRS, ...excludeDirs]);
-
-  const gitFiles = getGitTrackedFiles(rootDir);
-  const rawFiles = gitFiles ?? collectAllFiles(rootDir, excludes);
-  const files = gitFiles
-    ? rawFiles.filter((f) => {
-        const segments = f.split('/');
-        if (DEFAULT_EXCLUDED_FILES.has(segments[segments.length - 1])) return false;
-        return !segments.some((seg) => excludes.has(seg));
-      })
-    : rawFiles;
-
-  if (files.length === 0) {
-    return 0;
-  }
-
-  const tarball = await createTarBuffer(rootDir, files);
-
-  const url = `${normalizeBaseUrl(baseUrl)}/v1/workspaces/${encodeURIComponent(workspace)}/fs/import`;
-  const response = await fetch(url, {
-    method: 'POST',
-    headers: {
-      Authorization: `Bearer ${token}`,
-      'Content-Type': 'application/gzip',
-      'X-Correlation-Id': `seed-tar-${workspace}-${Date.now()}`,
-    },
-    body: tarball.buffer.slice(tarball.byteOffset, tarball.byteOffset + tarball.byteLength) as ArrayBuffer,
-  });
-
-  if (response.status === 404) {
-    // Tar import not supported — fall back to batch upload
-    return seedWorkspace(baseUrl, token, workspaceId, projectDir, excludeDirs);
-  }
-
-  if (!response.ok) {
-    const body = await response.text().catch(() => '');
-    throw new Error(`tar import failed for workspace ${workspace}: HTTP ${response.status} ${body}`.trim());
-  }
-
-  const raw = await response.text();
-  if (!raw.trim()) {
-    return files.length;
-  }
-
-  try {
-    const parsed = JSON.parse(raw) as ImportResponseShape;
-    return typeof parsed.imported === 'number' ? parsed.imported : files.length;
-  } catch {
-    return files.length;
-  }
-}
diff --git a/packages/sdk/src/provisioner/types.ts b/packages/sdk/src/provisioner/types.ts
deleted file mode 100644
index 19fa282cb..000000000
--- a/packages/sdk/src/provisioner/types.ts
+++ /dev/null
@@ -1,189 +0,0 @@
-import type {
-  AccessPreset,
-  AgentPermissions,
-  CompiledAgentPermissions,
-  FilePermissions,
-  PermissionSource,
-} from '../workflows/types.js';
-import type { LocalJwksSigningKey } from './local-jwks.js';
-import type { MountHandle } from './mount.js';
-
-// ── Input Configuration ────────────────────────────────────────────────────
-
-/** Configuration for provisioning workflow agents. */
-export interface WorkflowProvisionConfig {
-  /** RS256 signing key used to mint JWT tokens. */
-  tokenSigningKey: LocalJwksSigningKey;
-
-  /** Workspace identifier (e.g. 'my-project'). */
-  workspace: string;
-
-  /** Absolute path to the project directory. */
-  projectDir: string;
-
-  /** Base URL of the relayfile server (e.g. 'http://127.0.0.1:4080'). */
-  relayfileBaseUrl: string;
-
-  /**
-   * Agents to provision, keyed by agent name.
-   * Each entry carries the AgentPermissions from relay.yaml.
-   * When empty/undefined, agents are auto-discovered from dotfiles.
-   */
-  agents?: Record<string, AgentPermissions>;
-
-  /** JWT token TTL in seconds. Default: 7200 (2 hours). */
-  tokenTtlSeconds?: number;
-
-  /**
-   * Directories to exclude from workspace seeding.
-   * Defaults: ['.relay', '.git', 'node_modules'].
-   */
-  excludeDirs?: string[];
-
-  /**
-   * When true, skip workspace creation and file seeding.
-   * Useful when only tokens/ACL are needed.
-   */
-  skipSeeding?: boolean;
-
-  /**
-   * Admin scopes for the workspace management token.
-   * Uses DEFAULT_ADMIN_SCOPES when omitted.
-   */
-  adminScopes?: string[];
-
-  /** Optional explicit relayfile-mount binary path. */
-  mountBinaryPath?: string;
-
-  /** Base directory for per-agent mount points. Defaults to <projectDir>/.relay. */
-  mountBaseDir?: string;
-
-  /** When true, skip starting relayfile mount processes. */
-  skipMount?: boolean;
-
-  /** When true, print a short audit summary to stdout after provisioning. */
-  verbose?: boolean;
-}
-
-// ── Output ─────────────────────────────────────────────────────────────────
-
-/** Aggregate counts for compiled permissions across provisioned agents. */
-export interface ProvisionSummary {
-  readonly: number;
-  readwrite: number;
-  denied: number;
-  customScopes: number;
-}
-
-/** Convenience shape for a single agent's compiled scopes. */
-export interface CompiledAgentScopes {
-  /** Agent name. */
-  agentName: string;
-
-  /** Workspace identifier. */
-  workspace: string;
-
-  /** Final token scopes after compilation. */
-  scopes: string[];
-
-  /** Directory ACL rules derived from the compiled permissions. */
-  acl: Record<string, string[]>;
-
-  /** Counts for the compiled access model. */
-  summary: ProvisionSummary;
-}
-
-/** Result of a single agent's provisioning. */
-export interface AgentProvisionResult {
-  /** Agent name. */
-  name: string;
-
-  /** Absolute path to the written JWT file (.relay/tokens/<name>.jwt). */
-  tokenPath: string;
-
-  /** The raw JWT string. */
-  token: string;
-
-  /** Scopes baked into the token. */
-  scopes: string[];
-
-  /** Full compiled permissions (for audit / dry-run output). */
-  compiled: CompiledAgentPermissions;
-
-  /** Absolute path to the mounted relayfile workspace for this agent, when active. */
-  mountPoint?: string;
-}
-
-/** Map of agent names to minted JWT strings. */
-export type AgentTokenMap = Record<string, string>;
-
-/** Map of agent names to their provisioning result. */
-export type AgentProvisionMap = Record<string, AgentProvisionResult>;
-
-/** Aggregate result of provisionWorkflowAgents(). */
-export interface ProvisionResult {
-  /** Per-agent results, keyed by agent name. */
-  agents: AgentProvisionMap;
-
-  /** Ordered list of agent names (matches iteration order). */
-  agentNames: string[];
-
-  /** Workspace-level admin token (used for seeding). */
-  adminToken: string;
-
-  /** Number of files seeded to the relayfile workspace. */
-  seededFileCount: number;
-
-  /** Number of ACL directory rules seeded. */
-  seededAclCount: number;
-
-  /** Aggregate summary across all agents. */
-  summary: ProvisionSummary;
-
-  /** Per-agent mounted workspace handles. */
-  mounts: Map<string, MountHandle>;
-
-  /** Per-agent minted JWT strings. */
-  tokens: Map<string, string>;
-
-  /** Per-agent compiled token scopes. */
-  scopes: Map<string, string[]>;
-}
-
-// ── Compiler Types ─────────────────────────────────────────────────────────
-
-/** Input to the permission compiler for a single agent. */
-export interface CompileInput {
-  agentName: string;
-  workspace: string;
-  projectDir: string;
-  permissions: AgentPermissions;
-}
-
-// ── Seeder Types ───────────────────────────────────────────────────────────
-
-/** Options for the ACL seeder. */
-export interface SeedAclOptions {
-  relayfileBaseUrl: string;
-  token: string;
-  workspace: string;
-  aclRules: Record<string, string[]>;
-}
-
-/** Options for workspace file seeding. */
-export interface SeedWorkspaceOptions {
-  relayfileBaseUrl: string;
-  token: string;
-  workspace: string;
-  projectDir: string;
-  excludeDirs: string[];
-}
-
-/** Minimal debug summary written alongside compiled ACL output. */
-export interface AgentAclSummary {
-  name: string;
-  summary: Pick<ProvisionSummary, 'readonly' | 'readwrite' | 'denied'>;
-}
-
-// Re-export upstream types for convenience.
-export type { AccessPreset, AgentPermissions, CompiledAgentPermissions, FilePermissions, PermissionSource };
diff --git a/packages/sdk/src/workflows/README.md b/packages/sdk/src/workflows/README.md
deleted file mode 100644
index 9d881c306..000000000
--- a/packages/sdk/src/workflows/README.md
+++ /dev/null
@@ -1,764 +0,0 @@
-# Agent Relay Workflows
-
-Orchestrate multi-agent workflows using YAML, TypeScript, or Python. Define agents, wire up dependencies, and let the runner handle execution, retries, and verification.
-
-## Quick Start
-
-### CLI
-
-```bash
-# Run a YAML workflow
-agent-relay run workflow.yaml
-
-# Run a TypeScript workflow
-agent-relay run workflow.ts
-
-# Run a Python workflow
-agent-relay run workflow.py
-
-# Run a specific named workflow from a file
-agent-relay run workflow.yaml --workflow deploy
-```
-
-### TypeScript
-
-```typescript
-import { workflow } from '@agent-relay/sdk/workflows';
-
-const result = await workflow('ship-feature')
-  .pattern('dag')
-  .agent('planner', { cli: 'claude', role: 'Plans implementation' })
-  .agent('developer', { cli: 'codex', role: 'Writes code' })
-  .agent('reviewer', { cli: 'claude', role: 'Reviews code' })
-  .step('plan', {
-    agent: 'planner',
-    task: 'Create implementation plan for user authentication',
-  })
-  .step('implement', {
-    agent: 'developer',
-    task: 'Implement the plan',
-    dependsOn: ['plan'],
-  })
-  .step('review', {
-    agent: 'reviewer',
-    task: 'Review the implementation',
-    dependsOn: ['implement'],
-  })
-  .run();
-
-console.log(result.status); // "completed" | "failed"
-```
-
-### Python
-
-```python
-from agent_relay import workflow
-
-result = (
-    workflow("ship-feature")
-    .pattern("dag")
-    .agent("planner", cli="claude", role="Plans implementation")
-    .agent("developer", cli="codex", role="Writes code")
-    .agent("reviewer", cli="claude", role="Reviews code")
-    .step("plan", agent="planner", task="Create implementation plan for user auth")
-    .step("implement", agent="developer", task="Implement the plan", depends_on=["plan"])
-    .step("review", agent="reviewer", task="Review the implementation", depends_on=["implement"])
-    .run()
-)
-```
-
-## Consumer-Facing Apps + AI SDK Communicate Flows
-
-A good production split is:
-
-1. **AI SDK app** handles the user conversation and streaming UI
-2. **Communicate / `onRelay()`** lets that point-person coordinate with specialists over Relay
-3. **Workflows / `runWorkflow()`** take over when a request needs multi-step execution, verification, or handoffs
-
-```typescript
-import { streamText, wrapLanguageModel } from 'ai';
-import { openai } from '@ai-sdk/openai';
-import { Relay } from '@agent-relay/sdk/communicate';
-import { onRelay } from '@agent-relay/sdk/communicate/adapters/ai-sdk';
-import { runWorkflow } from '@agent-relay/sdk/workflows';
-
-export async function POST(req: Request) {
-  const { prompt, escalate, repo } = await req.json();
-
-  const relay = new Relay('AppLead');
-  const relaySession = onRelay(
-    {
-      name: 'AppLead',
-      instructions:
-        'You are the customer-facing lead. Keep the user updated and delegate implementation via Relay when needed.',
-    },
-    relay
-  );
-
-  const model = wrapLanguageModel({
-    model: openai('gpt-4o-mini'),
-    middleware: relaySession.middleware,
-  });
-
-  if (escalate) {
-    const workflow = await runWorkflow('workflows/feature-dev.yaml', {
-      vars: { task: prompt, repo },
-    });
-
-    return Response.json({ status: workflow.status, runId: workflow.runId });
-  }
-
-  return streamText({
-    model,
-    tools: relaySession.tools,
-    system: 'Answer directly when possible; coordinate internally when the task needs specialists.',
-    prompt,
-  }).toUIMessageStreamResponse({
-    onFinish() {
-      relaySession.cleanup();
-      void relay.close();
-    },
-  });
-}
-```
-
-That pattern keeps the user experience snappy while still letting longer Relay workflows run with proper ownership, retries, and verification.
-
-A compact end-to-end example app for this pattern lives in `examples/ai-sdk-relay-helpdesk/`.
-
-## YAML Format
-
-Workflows are defined as `relay.yaml` files:
-
-```yaml
-version: '1.0'
-name: my-workflow
-description: 'Optional description'
-
-swarm:
-  pattern: dag # Execution pattern (see Patterns below)
-  maxConcurrency: 3 # Max agents running in parallel
-  timeoutMs: 3600000 # Global timeout (1 hour)
-  channel: my-channel # Relay channel for agent communication
-
-agents:
-  - name: backend
-    cli: claude # claude | codex | gemini | aider | goose | opencode | droid
-    role: 'Backend engineer'
-    constraints:
-      model: opus
-      timeoutMs: 600000
-      retries: 2
-
-  - name: tester
-    cli: codex
-    role: 'Test engineer'
-    interactive: false # Non-interactive: runs as subprocess, no PTY/messaging
-
-workflows:
-  - name: build-and-test
-    onError: retry # fail | skip | retry
-    steps:
-      - name: build-api
-        agent: backend
-        task: 'Build the REST API endpoints for user management'
-        verification:
-          type: file_exists
-          value: 'src/api/users.ts'
-        retries: 1
-
-      - name: write-tests
-        agent: tester
-        task: 'Write integration tests for: {{steps.build-api.output}}'
-        dependsOn: [build-api]
-
-      - name: run-tests
-        agent: tester
-        task: 'Run the test suite and report results'
-        dependsOn: [write-tests]
-        verification:
-          type: exit_code
-          value: '0'
-
-errorHandling:
-  strategy: retry
-  maxRetries: 2
-  retryDelayMs: 5000
-  repairAgent: tester
-  repairRetries: 2
-  notifyChannel: my-channel
-```
-
-### Template Variables
-
-Use `{{variable}}` for user-provided values and `{{steps.STEP_NAME.output}}` for previous step outputs:
-
-```yaml
-steps:
-  - name: plan
-    agent: planner
-    task: 'Plan implementation for: {{task}}' # User variable
-
-  - name: implement
-    agent: developer
-    dependsOn: [plan]
-    task: 'Implement: {{steps.plan.output}}' # Previous step output
-```
-
-User variables are passed via the CLI or programmatically:
-
-```typescript
-await runWorkflow('workflow.yaml', {
-  vars: { task: 'Add OAuth2 support' },
-});
-```
-
-### Verification Checks
-
-Each step can include a verification check. Verification is one input to the runner's **completion decision pipeline** — when verification passes, the step completes even without a sentinel marker.
-
-| Type              | Description                                                                |
-| ----------------- | -------------------------------------------------------------------------- |
-| `exit_code`       | Agent must exit with the specified code (preferred for code-editing steps) |
-| `file_exists`     | A file must exist at the specified path after the step                     |
-| `output_contains` | Step output must contain the specified string (optional accelerator)       |
-| `custom`          | No-op in the runner; handled by external callers                           |
-
-```yaml
-# Preferred — deterministic verification
-verification:
-  type: exit_code
-  value: "0"
-  description: "Process exited successfully"
-
-# Also valid — output_contains as an optional accelerator
-verification:
-  type: output_contains
-  value: "IMPLEMENTATION_COMPLETE"
-  description: "Agent confirms completion (optional fast-path)"
-```
-
-### Completion Decision Pipeline
-
-The runner uses a multi-signal pipeline to decide step completion:
-
-1. **Deterministic verification** — if a verification check passes, the step completes immediately (`completed_verified`)
-2. **Owner decision** — the step owner can issue `OWNER_DECISION: COMPLETE|INCOMPLETE_RETRY|INCOMPLETE_FAIL` (`completed_by_owner_decision`)
-3. **Evidence-based completion** — channel messages, file artifacts, and exit codes are collected as evidence (`completed_by_evidence`)
-4. **Marker fast-path** — `STEP_COMPLETE:<step-name>` still works as an accelerator but is never required
-
-| Completion State              | Meaning                                         |
-| ----------------------------- | ----------------------------------------------- |
-| `completed_verified`          | Deterministic verification passed               |
-| `completed_by_owner_decision` | Owner approved the step                         |
-| `completed_by_evidence`       | Evidence-based completion                       |
-| `retry_requested_by_owner`    | Owner requested retry                           |
-| `failed_verification`         | Verification explicitly failed                  |
-| `failed_owner_decision`       | Owner rejected the step                         |
-| `failed_no_evidence`          | No verification, no owner decision, no evidence |
-
-**Review parsing is tolerant:** The runner accepts semantically equivalent outputs like "Approved", "Complete", "LGTM" — not just exact `REVIEW_DECISION: APPROVE` strings.
-
-## Swarm Patterns
-
-The `swarm.pattern` field controls how agents are coordinated:
-
-### Core Patterns
-
-| Pattern        | Description                                                            |
-| -------------- | ---------------------------------------------------------------------- |
-| `dag`          | Directed acyclic graph — steps run based on dependency edges (default) |
-| `fan-out`      | All agents run in parallel                                             |
-| `pipeline`     | Sequential chaining of steps                                           |
-| `hub-spoke`    | Central hub coordinates spoke agents                                   |
-| `consensus`    | Agents vote on decisions                                               |
-| `mesh`         | Full communication graph between agents                                |
-| `handoff`      | Sequential handoff between agents                                      |
-| `cascade`      | Waterfall with phase gates                                             |
-| `debate`       | Agents propose and counter-argue                                       |
-| `hierarchical` | Multi-level reporting structure                                        |
-
-### Data Processing Patterns
-
-| Pattern          | Description                                                                         |
-| ---------------- | ----------------------------------------------------------------------------------- |
-| `map-reduce`     | Split work into chunks (mappers), process in parallel, aggregate results (reducers) |
-| `scatter-gather` | Fan out requests to workers, collect and synthesize responses                       |
-
-### Supervision & Quality Patterns
-
-| Pattern      | Description                                                               |
-| ------------ | ------------------------------------------------------------------------- |
-| `supervisor` | Monitor agent monitors workers, restarts on failure, manages health       |
-| `reflection` | Agent produces output, critic reviews and provides feedback for iteration |
-| `verifier`   | Producer agents submit work to verifier agents for validation             |
-
-### Adversarial & Validation Patterns
-
-| Pattern    | Description                                                      |
-| ---------- | ---------------------------------------------------------------- |
-| `red-team` | Attacker agents probe for weaknesses, defender agents respond    |
-| `auction`  | Auctioneer broadcasts tasks, agents bid based on capability/cost |
-
-### Resilience Patterns
-
-| Pattern           | Description                                                       |
-| ----------------- | ----------------------------------------------------------------- |
-| `escalation`      | Start with fast/cheap agents, escalate to more capable on failure |
-| `saga`            | Distributed transactions with compensating actions on failure     |
-| `circuit-breaker` | Primary agent with fallback chain, fail fast and recover          |
-
-### Collaborative Patterns
-
-| Pattern      | Description                                                          |
-| ------------ | -------------------------------------------------------------------- |
-| `blackboard` | Shared workspace where agents contribute incrementally to a solution |
-| `swarm`      | Emergent behavior from simple agent rules (neighbor communication)   |
-
-### Auto-Selection by Role
-
-When `swarm.pattern` is omitted, the coordinator auto-selects based on agent roles.
-Patterns are checked in priority order below (first match wins):
-
-| Priority | Pattern           | Required Roles/Config                                    |
-| -------- | ----------------- | -------------------------------------------------------- |
-| 1        | `dag`             | Steps with `dependsOn`                                   |
-| 2        | `consensus`       | Uses `coordination.consensusStrategy` config             |
-| 3        | `map-reduce`      | `mapper` + `reducer`                                     |
-| 4        | `red-team`        | (`attacker` OR `red-team`) + (`defender` OR `blue-team`) |
-| 5        | `reflection`      | `critic`                                                 |
-| 6        | `escalation`      | `tier-1`, `tier-2`, etc.                                 |
-| 7        | `auction`         | `auctioneer`                                             |
-| 8        | `saga`            | `saga-orchestrator` OR `compensate-handler`              |
-| 9        | `circuit-breaker` | `fallback`, `backup`, OR `primary`                       |
-| 10       | `blackboard`      | `blackboard` OR `shared-workspace`                       |
-| 11       | `swarm`           | `hive-mind` OR `swarm-agent`                             |
-| 12       | `verifier`        | `verifier`                                               |
-| 13       | `supervisor`      | `supervisor`                                             |
-| 14       | `hierarchical`    | `lead` (with 4+ agents)                                  |
-| 15       | `hub-spoke`       | `hub` OR `coordinator`                                   |
-| 16       | `pipeline`        | Unique agents per step, 3+ steps                         |
-| 17       | `fan-out`         | Default fallback                                         |
-
-## Error Handling
-
-### Step-Level
-
-```yaml
-steps:
-  - name: risky-step
-    agent: worker
-    task: 'Do something that might fail'
-    retries: 3 # Retry up to 3 times on failure
-    timeoutMs: 300000 # 5 minute timeout
-```
-
-### Workflow-Level
-
-The `onError` field on a workflow controls what happens when a step fails:
-
-| Value                | Behavior                                                                                                        |
-| -------------------- | --------------------------------------------------------------------------------------------------------------- |
-| `fail` / `fail-fast` | Stop immediately, skip downstream steps                                                                         |
-| `skip` / `continue`  | Skip downstream dependents, continue independent steps                                                          |
-| `retry`              | Retry the step; deterministic gates ask a workflow agent to repair before each retry when an agent is available |
-
-### Global
-
-```yaml
-errorHandling:
-  strategy: retry
-  maxRetries: 2
-  retryDelayMs: 5000
-  repairAgent: tester
-  repairRetries: 2
-  notifyChannel: alerts
-```
-
-Retry-mode workflows are repair-aware by default. Deterministic step failures, verification gate failures, and malformed agent artifacts are treated as repairable work before terminal failure. The runner chooses `errorHandling.repairAgent` when set, otherwise it uses the step's owning/upstream agent when possible, then falls back to the best available workflow agent. The selected agent gets the failed command or agent output, working directory, exit information, and captured evidence, then the failed gate or step is retried. Use `repairRetries: 0`, `strategy: fail-fast`, or `strategy: continue` when a workflow intentionally should not invoke repair agents.
-
-## Built-in Templates
-
-Six pre-built workflow templates are included:
-
-| Template         | Pattern      | Description                                                   |
-| ---------------- | ------------ | ------------------------------------------------------------- |
-| `feature-dev`    | hub-spoke    | Plan, implement, review, and finalize a feature               |
-| `bug-fix`        | hub-spoke    | Investigate, patch, validate, and document a bug fix          |
-| `code-review`    | fan-out      | Parallel multi-reviewer assessment with consolidated findings |
-| `security-audit` | pipeline     | Scan, triage, remediate, and verify security issues           |
-| `refactor`       | hierarchical | Analyze, plan, execute, and validate a refactor               |
-| `documentation`  | handoff      | Research, draft, review, and publish documentation            |
-
-### Using Templates
-
-```typescript
-import { TemplateRegistry } from '@agent-relay/sdk/workflows';
-
-const registry = new TemplateRegistry();
-
-// List available templates
-const templates = await registry.listTemplates();
-
-// Load and run a template
-const config = await registry.loadTemplate('feature-dev');
-const runner = new WorkflowRunner();
-const result = await runner.execute(config, undefined, {
-  task: 'Add WebSocket support to the API',
-});
-
-// Install a custom template from a URL
-await registry.installExternalTemplate('https://example.com/my-template.yaml', 'my-template');
-```
-
-## TypeScript Builder API
-
-The builder constructs a `RelayYamlConfig` object and can run it, export it as YAML, or return the raw config.
-
-```typescript
-import { workflow } from '@agent-relay/sdk/workflows';
-
-// Build and run
-const result = await workflow('my-workflow')
-  .pattern('dag')
-  .maxConcurrency(3)
-  .timeout(60 * 60 * 1000)
-  .channel('my-channel')
-  .agent('backend', {
-    cli: 'claude',
-    role: 'Backend engineer',
-    model: 'opus',
-    retries: 2,
-  })
-  .agent('frontend', {
-    cli: 'codex',
-    role: 'Frontend engineer',
-    interactive: false, // Non-interactive subprocess mode
-  })
-  .step('api', {
-    agent: 'backend',
-    task: 'Build REST API',
-    verification: { type: 'output_contains', value: 'API_READY' },
-  })
-  .step('ui', {
-    agent: 'frontend',
-    task: 'Build the UI',
-    dependsOn: ['api'],
-  })
-  .onError('retry', { maxRetries: 2, retryDelayMs: 5000 })
-  .run();
-
-// Or export to YAML
-const yaml = workflow('my-workflow')
-  .pattern('dag')
-  .agent('worker', { cli: 'claude' })
-  .step('task1', { agent: 'worker', task: 'Do something' })
-  .toYaml();
-
-// Or get the raw config object
-const config = workflow('my-workflow')
-  .pattern('dag')
-  .agent('worker', { cli: 'claude' })
-  .step('task1', { agent: 'worker', task: 'Do something' })
-  .toConfig();
-```
-
-## Python Builder API
-
-Install the Python SDK:
-
-```bash
-pip install agent-relay
-```
-
-```python
-from agent_relay import workflow, run_yaml
-
-# Build and run
-result = (
-    workflow("my-workflow")
-    .pattern("dag")
-    .max_concurrency(3)
-    .timeout(3600000)
-    .agent("backend", cli="claude", role="Backend engineer")
-    .agent("frontend", cli="codex", role="Frontend engineer")
-    .step("api", agent="backend", task="Build REST API")
-    .step("ui", agent="frontend", task="Build the UI", depends_on=["api"])
-    .on_error("retry", max_retries=2, retry_delay_ms=5000)
-    .run()
-)
-
-# Run an existing YAML file
-result = run_yaml("workflows/my-workflow.yaml")
-
-# Export to YAML string
-yaml_str = (
-    workflow("my-workflow")
-    .pattern("dag")
-    .agent("worker", cli="claude")
-    .step("task1", agent="worker", task="Do something")
-    .to_yaml()
-)
-
-# Get the raw config dict
-config = (
-    workflow("my-workflow")
-    .pattern("dag")
-    .agent("worker", cli="claude")
-    .step("task1", agent="worker", task="Do something")
-    .to_config()
-)
-```
-
-## Programmatic API
-
-For full control, use the `WorkflowRunner` directly:
-
-```typescript
-import { WorkflowRunner } from '@agent-relay/sdk/workflows';
-
-const runner = new WorkflowRunner({
-  cwd: '/path/to/project', // Working directory (default: process.cwd())
-  relay: { port: 3000 }, // AgentRelay options (optional)
-});
-
-// Listen to events (broker:event fires frequently — filter it out for cleaner output)
-runner.on((event) => {
-  if (event.type === 'broker:event') return;
-  console.log(event.type, event);
-});
-
-// Parse and execute
-const config = await runner.parseYamlFile('workflow.yaml');
-const run = await runner.execute(config, 'workflow-name', {
-  task: 'Build the feature',
-});
-
-// Pause / resume / abort
-runner.pause();
-runner.unpause();
-runner.abort();
-
-// Resume a failed run
-const resumed = await runner.resume(run.id);
-```
-
-### Zero-Config Convenience Function
-
-```typescript
-import { runWorkflow } from '@agent-relay/sdk/workflows';
-
-const result = await runWorkflow('workflow.yaml', {
-  workflow: 'deploy',
-  vars: { environment: 'staging' },
-  onEvent: (event) => {
-    if (event.type !== 'broker:event') console.log(event.type);
-  },
-});
-```
-
-## Coordination
-
-### Barriers
-
-Synchronization points that wait for specific steps to complete:
-
-```yaml
-coordination:
-  barriers:
-    - name: all-reviews-done
-      waitFor: [review-arch, review-security, review-correctness]
-      timeoutMs: 900000
-  consensusStrategy: majority # majority | unanimous | quorum
-```
-
-### Shared State
-
-Agents can share state during execution:
-
-```yaml
-state:
-  backend: memory # memory | redis | database
-  ttlMs: 86400000
-  namespace: my-workflow
-```
-
-## Supported Agent CLIs
-
-| CLI        | Description             |
-| ---------- | ----------------------- |
-| `claude`   | Claude Code (Anthropic) |
-| `codex`    | Codex CLI (OpenAI)      |
-| `gemini`   | Gemini CLI (Google)     |
-| `aider`    | Aider coding assistant  |
-| `goose`    | Goose AI assistant      |
-| `opencode` | OpenCode CLI            |
-| `droid`    | Droid CLI               |
-
-## Non-Interactive Agents
-
-By default, agents run in interactive PTY mode with full relay messaging. For workers that just need to execute a task and return output — common in fan-out, map-reduce, and pipeline patterns — set `interactive: false` to run them as lightweight subprocesses.
-
-### YAML
-
-```yaml
-agents:
-  - name: lead
-    cli: claude
-    role: 'Coordinates work'
-    # interactive: true (default) — full PTY, relay messaging, /exit detection
-
-  - name: worker
-    cli: codex
-    role: 'Executes tasks'
-    interactive: false # Runs "codex exec <task>", captures stdout
-```
-
-### TypeScript
-
-```typescript
-workflow('fan-out-analysis')
-  .pattern('fan-out')
-  .agent('lead', { cli: 'claude', role: 'Coordinator' })
-  .agent('worker-1', { cli: 'codex', interactive: false, role: 'Analyst' })
-  .agent('worker-2', { cli: 'codex', interactive: false, role: 'Analyst' })
-  .step('analyze-1', { agent: 'worker-1', task: 'Analyze module A' })
-  .step('analyze-2', { agent: 'worker-2', task: 'Analyze module B' })
-  .step('synthesize', {
-    agent: 'lead',
-    task: 'Combine: {{steps.analyze-1.output}} + {{steps.analyze-2.output}}',
-    dependsOn: ['analyze-1', 'analyze-2'],
-  })
-  .run();
-```
-
-### How It Works
-
-| Aspect           | Interactive (default)                     | Non-Interactive                                 |
-| ---------------- | ----------------------------------------- | ----------------------------------------------- |
-| Execution        | Full PTY with stdin/stdout                | `child_process.spawn()` with piped stdio        |
-| CLI invocation   | Standard interactive session              | One-shot mode (`claude -p`, `codex exec`, etc.) |
-| Relay messaging  | Can send/receive messages                 | No messaging — excluded from topology edges     |
-| Self-termination | Must output `/exit`                       | Process exits naturally when done               |
-| Output capture   | PTY output buffer                         | stdout capture                                  |
-| Overhead         | Higher (PTY, echo verification, SIGWINCH) | Lower (simple subprocess)                       |
-
-### Non-Interactive CLI Commands
-
-| CLI        | Command                                          | Notes                            |
-| ---------- | ------------------------------------------------ | -------------------------------- |
-| `claude`   | `claude -p "<task>"`                             | Print mode, exits after response |
-| `codex`    | `codex exec "<task>"`                            | One-shot execution               |
-| `gemini`   | `gemini -p "<task>"`                             | Prompt mode                      |
-| `opencode` | `opencode --prompt "<task>"`                     | One-shot prompt                  |
-| `droid`    | `droid exec "<task>"`                            | One-shot execution               |
-| `aider`    | `aider --message "<task>" --yes-always --no-git` | Auto-approve, skip git           |
-| `goose`    | `goose run --text "<task>" --no-session`         | Text mode, no session file       |
-
-### When to Use
-
-- Fan-out workers that process a task and return results
-- Map-reduce mappers that don't need mid-task communication
-- Pipeline stages that transform input to output
-- Any agent that doesn't need turn-by-turn relay messaging
-
-### When NOT to Use
-
-- Lead/coordinator agents that communicate with others
-- Agents in debate, consensus, or reflection patterns
-- Agents that need to receive messages during execution
-
-## Agent Slash Commands
-
-Agents running inside a workflow can output slash commands to signal the broker. These are detected in the agent's PTY output at the broker level — the agent simply prints the command on its own line.
-
-### `/exit`
-
-Signals that the agent has completed its current step and is ready to be released.
-
-```
-/exit
-```
-
-The workflow runner waits for each agent to `/exit` after delivering a step task. When the broker detects `/exit` in the agent's output (exact line match after ANSI stripping), it:
-
-1. Emits an `agent_exit` frame with `reason: "agent_requested"`
-2. Triggers graceful PTY shutdown
-
-If an agent does not `/exit` within the step's `timeoutMs`, the runner treats the step as timed out. As a safety net, steps with `file_exists` verification will still pass if the expected file is present despite the timeout.
-
-**Best practice:** Instruct agents to output `/exit` when done in your step task descriptions:
-
-```yaml
-steps:
-  - name: build-api
-    agent: backend
-    task: |
-      Build the REST API endpoints for user management.
-      When finished, output /exit.
-```
-
-## Idle Agent Detection and Nudging
-
-Interactive agents sometimes finish their task but forget to `/exit`, sitting idle and blocking downstream steps. The runner can detect idle agents and take action automatically.
-
-### Configuration
-
-Add `idleNudge` to your swarm config:
-
-```yaml
-swarm:
-  pattern: hub-spoke
-  idleNudge:
-    nudgeAfterMs: 120000 # 2 min before first nudge (default)
-    escalateAfterMs: 120000 # 2 min after nudge before force-release (default)
-    maxNudges: 1 # Nudges before escalation (default)
-```
-
-All built-in templates include idle nudging with these defaults.
-
-### How It Works
-
-1. **Detection**: The broker tracks agent output timestamps and emits `agent_idle` events when an agent goes silent for the configured threshold
-2. **Nudge**: For hub patterns (hub-spoke, fan-out, hierarchical, etc.), the runner tells the hub agent to check on the idle agent. For non-hub patterns, a system message is injected directly into the agent's PTY
-3. **Escalation**: If the agent remains idle after `maxNudges` attempts, the runner force-releases it and captures whatever output was produced
-4. **No config**: When `idleNudge` is omitted, the runner uses simple `waitForExit` (backward compatible)
-
-### Events
-
-The runner emits two new events for idle nudging:
-
-| Event                 | Description                                                   |
-| --------------------- | ------------------------------------------------------------- |
-| `step:nudged`         | Fired when a nudge message is sent to an idle agent           |
-| `step:force-released` | Fired when an agent is force-released after exhausting nudges |
-
-## Automatic Step Owner and Review
-
-For interactive agent steps, the runner uses a point-person-led completion model:
-
-1. **Elects a step owner** (prefers lead/coordinator-style agents, falls back to the step agent)
-2. **Runs a completion decision pipeline** — checks deterministic verification first, then owner judgment, then evidence
-3. **Owner can issue structured decisions** via `OWNER_DECISION: COMPLETE|INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION` with optional `REASON: <text>`
-4. **Review parsing is tolerant** — accepts "Approved", "Complete", "LGTM", not just exact `REVIEW_DECISION: APPROVE`
-5. **Markers are optional accelerators** — `STEP_COMPLETE:<step-name>` still works as a fast-path but is never required
-6. Stores primary output plus review output in the step artifact
-
-**Evidence-based completion:** The runner collects channel messages, file artifacts, process exit codes, and coordination signals (e.g., WORKER_DONE posted in channel) as completion evidence. When sufficient evidence exists, the step completes without requiring any sentinel marker.
-
-Deterministic and worktree steps are unchanged and do not require owner/review delegation.
-
-## Schema Validation
-
-A JSON Schema is available at `packages/sdk/src/workflows/schema.json` for editor autocompletion and validation of `relay.yaml` files.
-
-## Requirements
-
-- Node.js 22+
-- `agent-relay` CLI installed (`npm install -g agent-relay`)
-- For Python: Python 3.10+ with `pip install agent-relay`
-- For TypeScript workflow files: `tsx` or `ts-node` installed
-
-## License
-
-Apache-2.0 -- Copyright 2025 Agent Workforce Incorporated
diff --git a/packages/sdk/src/workflows/__tests__/budget-enforcement.test.ts b/packages/sdk/src/workflows/__tests__/budget-enforcement.test.ts
deleted file mode 100644
index 7b7fd9a7b..000000000
--- a/packages/sdk/src/workflows/__tests__/budget-enforcement.test.ts
+++ /dev/null
@@ -1,533 +0,0 @@
-import { EventEmitter } from 'node:events';
-import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
-import { mkdtempSync, mkdirSync, rmSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import type { BudgetTracker } from '../budget-tracker.js';
-import type { CliSessionQuery, CliSessionReport } from '../cli-session-collector.js';
-import type { WorkflowDb } from '../runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../types.js';
-
-const tempDirs: string[] = [];
-
-type QueuedSubprocessResult = {
-  stdout?: string;
-  stderr?: string;
-  code?: number | null;
-  signal?: string | null;
-  delayMs?: number;
-  error?: Error;
-  onSpawn?: () => void;
-};
-
-type CollectorResult =
-  | CliSessionReport
-  | null
-  | ((query: CliSessionQuery) => CliSessionReport | null | Promise<CliSessionReport | null>);
-
-let queuedSubprocessResults: QueuedSubprocessResult[] = [];
-let queuedCollectorResults: CollectorResult[] = [];
-let collectorResultsByCwd = new Map<string, CollectorResult>();
-let activeRunner: InstanceType<typeof WorkflowRunner> | undefined;
-
-const mockCollectCliSession = vi.fn(async (query: CliSessionQuery): Promise<CliSessionReport | null> => {
-  const next =
-    queuedCollectorResults.length > 0 ? queuedCollectorResults.shift() : collectorResultsByCwd.get(query.cwd);
-
-  if (typeof next === 'function') {
-    return next(query);
-  }
-
-  return next ?? null;
-});
-
-vi.mock('../cli-session-collector.js', () => ({
-  collectCliSession: mockCollectCliSession,
-}));
-
-const mockSubprocessSpawn = vi.fn().mockImplementation((_cmd, _args, _options) => {
-  const result = queuedSubprocessResults.shift() ?? {
-    stdout: 'completed\n',
-    code: 0,
-  };
-
-  const child = new EventEmitter() as EventEmitter & {
-    stdout: EventEmitter;
-    stderr: EventEmitter;
-    pid: number;
-    kill: ReturnType<typeof vi.fn>;
-  };
-
-  child.stdout = new EventEmitter();
-  child.stderr = new EventEmitter();
-  child.pid = 4321;
-  child.kill = vi.fn();
-
-  result.onSpawn?.();
-
-  const emitResult = () => {
-    if (result.error) {
-      child.emit('error', result.error);
-      return;
-    }
-    if (result.stdout) {
-      child.stdout.emit('data', Buffer.from(result.stdout));
-    }
-    if (result.stderr) {
-      child.stderr.emit('data', Buffer.from(result.stderr));
-    }
-    child.emit('close', result.code ?? 0, result.signal ?? null);
-  };
-
-  if (result.delayMs && result.delayMs > 0) {
-    setTimeout(emitResult, result.delayMs);
-  } else {
-    queueMicrotask(emitResult);
-  }
-
-  return child;
-});
-
-vi.mock('node:child_process', async () => {
-  const actual = await vi.importActual<typeof import('node:child_process')>('node:child_process');
-  return {
-    ...actual,
-    spawn: mockSubprocessSpawn,
-  };
-});
-
-const mockRelayInstance = {
-  spawnPty: vi.fn(),
-  human: vi.fn().mockReturnValue({ sendMessage: vi.fn().mockResolvedValue(undefined) }),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-  listAgents: vi.fn().mockResolvedValue([]),
-  addListener: vi.fn(() => () => {}),
-};
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn(),
-  RelayError: class RelayError extends Error {},
-}));
-
-vi.mock('../../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-const { WorkflowRunner } = await import('../runner.js');
-
-interface DbHarness {
-  db: WorkflowDb;
-  getRun(id: string): WorkflowRunRow | null;
-  getSteps(runId: string): WorkflowStepRow[];
-}
-
-function makeDbHarness(): DbHarness {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    db: {
-      insertRun: vi.fn(async (run: WorkflowRunRow) => {
-        runs.set(run.id, { ...run });
-      }),
-      updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-        const existing = runs.get(id);
-        if (existing) {
-          runs.set(id, { ...existing, ...patch });
-        }
-      }),
-      getRun: vi.fn(async (id: string) => {
-        const run = runs.get(id);
-        return run ? { ...run } : null;
-      }),
-      insertStep: vi.fn(async (step: WorkflowStepRow) => {
-        steps.set(step.id, { ...step });
-      }),
-      updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-        const existing = steps.get(id);
-        if (existing) {
-          steps.set(id, { ...existing, ...patch });
-        }
-      }),
-      getStepsByRunId: vi.fn(async (runId: string) => {
-        return [...steps.values()].filter((step) => step.runId === runId).map((step) => ({ ...step }));
-      }),
-    },
-    getRun(id: string) {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    },
-    getSteps(runId: string) {
-      return [...steps.values()].filter((step) => step.runId === runId).map((step) => ({ ...step }));
-    },
-  };
-}
-
-function createWorkspace(subdirs: string[] = []): string {
-  const dir = mkdtempSync(path.join(os.tmpdir(), 'relay-budget-enforcement-'));
-  tempDirs.push(dir);
-
-  for (const subdir of subdirs) {
-    mkdirSync(path.join(dir, subdir), { recursive: true });
-  }
-
-  return dir;
-}
-
-function makeRunner(cwd: string, db: WorkflowDb): InstanceType<typeof WorkflowRunner> {
-  return new WorkflowRunner({
-    cwd,
-    db,
-    workspaceId: 'ws-test',
-    relay: {
-      env: {
-        AGENT_RELAY_WORKFLOW_DISABLE_RELAYCAST: '1',
-      },
-    },
-  });
-}
-
-function makeAgent(
-  name: string,
-  overrides: Partial<RelayYamlConfig['agents'][number]> = {}
-): RelayYamlConfig['agents'][number] {
-  return {
-    name,
-    cli: 'claude',
-    interactive: false,
-    ...overrides,
-  };
-}
-
-function makeStep(
-  name: string,
-  agent: string,
-  overrides: Partial<NonNullable<RelayYamlConfig['workflows']>[number]['steps'][number]> = {}
-): NonNullable<RelayYamlConfig['workflows']>[number]['steps'][number] {
-  return {
-    name,
-    agent,
-    task: `Complete ${name}`,
-    ...overrides,
-  };
-}
-
-function makeConfig(input: {
-  agents: RelayYamlConfig['agents'];
-  steps: NonNullable<RelayYamlConfig['workflows']>[number]['steps'];
-  swarm?: Partial<RelayYamlConfig['swarm']>;
-}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'budget-enforcement',
-    swarm: {
-      pattern: 'dag',
-      ...input.swarm,
-    },
-    agents: input.agents,
-    workflows: [
-      {
-        name: 'default',
-        steps: input.steps,
-      },
-    ],
-    trajectories: false,
-  };
-}
-
-function makeReport(
-  tokens: Partial<NonNullable<CliSessionReport['tokens']>>,
-  overrides: Partial<CliSessionReport> = {}
-): CliSessionReport {
-  return {
-    cli: 'claude',
-    sessionId: 'session-1',
-    model: 'claude-sonnet-4',
-    provider: 'anthropic',
-    durationMs: 1_000,
-    cost: null,
-    tokens: {
-      input: tokens.input ?? 0,
-      output: tokens.output ?? 0,
-      cacheRead: tokens.cacheRead ?? 0,
-    },
-    turns: 1,
-    toolCalls: [],
-    errors: [],
-    finalStatus: 'completed',
-    summary: 'done',
-    ...overrides,
-  };
-}
-
-function getBudgetTracker(runner: InstanceType<typeof WorkflowRunner>): BudgetTracker | undefined {
-  return (runner as any).budgetTracker as BudgetTracker | undefined;
-}
-
-beforeEach(() => {
-  vi.clearAllMocks();
-  queuedSubprocessResults = [];
-  queuedCollectorResults = [];
-  collectorResultsByCwd = new Map();
-  activeRunner = undefined;
-  mockRelayInstance.shutdown.mockResolvedValue(undefined);
-  mockRelayInstance.onBrokerStderr.mockReturnValue(() => {});
-  mockRelayInstance.listAgents.mockResolvedValue([]);
-});
-
-afterEach(() => {
-  activeRunner = undefined;
-  while (tempDirs.length > 0) {
-    rmSync(tempDirs.pop()!, { recursive: true, force: true });
-  }
-});
-
-describe('WorkflowRunner budget enforcement integration', () => {
-  it('workflow with no budget config runs normally', async () => {
-    const workspace = createWorkspace(['step-1', 'step-2']);
-    const dbHarness = makeDbHarness();
-    const runner = makeRunner(workspace, dbHarness.db);
-    activeRunner = runner;
-
-    queuedSubprocessResults = [
-      { stdout: 'step 1 complete\n', code: 0 },
-      { stdout: 'step 2 complete\n', code: 0 },
-    ];
-    queuedCollectorResults = [null, null];
-
-    const run = await runner.execute(
-      makeConfig({
-        agents: [makeAgent('worker-1', { cwd: 'step-1' }), makeAgent('worker-2', { cwd: 'step-2' })],
-        steps: [makeStep('step-1', 'worker-1'), makeStep('step-2', 'worker-2', { dependsOn: ['step-1'] })],
-      }),
-      'default'
-    );
-
-    expect(run.status).toBe('completed');
-    expect(getBudgetTracker(runner)).toBeUndefined();
-    expect(dbHarness.getSteps(run.id).map((step) => step.status)).toEqual(['completed', 'completed']);
-    expect(mockSubprocessSpawn).toHaveBeenCalledTimes(2);
-  });
-
-  it('per-agent maxTokens recorded in budget tracker', async () => {
-    const workspace = createWorkspace(['writer']);
-    const dbHarness = makeDbHarness();
-    const runner = makeRunner(workspace, dbHarness.db);
-    activeRunner = runner;
-
-    queuedSubprocessResults = [{ stdout: 'draft complete\n', code: 0 }];
-    collectorResultsByCwd.set(path.join(workspace, 'writer'), makeReport({ input: 800, output: 150 }));
-
-    const run = await runner.execute(
-      makeConfig({
-        agents: [
-          makeAgent('writer', {
-            cwd: 'writer',
-            constraints: { maxTokens: 1_000 },
-          }),
-        ],
-        steps: [makeStep('draft', 'writer')],
-      }),
-      'default'
-    );
-
-    const tracker = getBudgetTracker(runner);
-
-    expect(run.status).toBe('completed');
-    expect(tracker).toBeDefined();
-    expect(tracker?.getStepUsage('draft')).toEqual({
-      input: 800,
-      output: 150,
-      cacheRead: 0,
-      total: 950,
-    });
-    expect(tracker?.getStepBudgetStatus('draft')).toEqual({
-      used: 950,
-      limit: 1_000,
-      over: false,
-    });
-  });
-
-  it('per-workflow tokenBudget prevents spawning when exhausted', async () => {
-    const workspace = createWorkspace(['planner', 'writer']);
-    const dbHarness = makeDbHarness();
-    const runner = makeRunner(workspace, dbHarness.db);
-    activeRunner = runner;
-
-    queuedSubprocessResults = [{ stdout: 'plan complete\n', code: 0 }];
-    collectorResultsByCwd.set(path.join(workspace, 'planner'), makeReport({ input: 1_500, output: 300 }));
-
-    const run = await runner.execute(
-      makeConfig({
-        agents: [makeAgent('planner', { cwd: 'planner' }), makeAgent('writer', { cwd: 'writer' })],
-        steps: [makeStep('step-1', 'planner'), makeStep('step-2', 'writer', { dependsOn: ['step-1'] })],
-        swarm: {
-          tokenBudget: 2_000,
-        },
-      }),
-      'default'
-    );
-
-    const tracker = getBudgetTracker(runner);
-    const failedStep = dbHarness.getSteps(run.id).find((step) => step.stepName === 'step-2');
-
-    expect(run.status).toBe('failed');
-    expect(mockSubprocessSpawn).toHaveBeenCalledTimes(1);
-    expect(tracker?.getTotalUsage().total).toBe(1_800);
-    expect(failedStep?.status).toBe('failed');
-    expect(failedStep?.error).toContain('workflow budget exhausted');
-    expect(failedStep?.error).toContain('1800/2000');
-  });
-
-  it('pre-spawn check allows step when budget has headroom', async () => {
-    const workspace = createWorkspace(['first', 'second']);
-    const dbHarness = makeDbHarness();
-    const runner = makeRunner(workspace, dbHarness.db);
-    activeRunner = runner;
-
-    let checkCanSpawnAllowed: boolean | undefined;
-
-    queuedSubprocessResults = [
-      { stdout: 'first complete\n', code: 0 },
-      {
-        stdout: 'second complete\n',
-        code: 0,
-        onSpawn: () => {
-          checkCanSpawnAllowed = getBudgetTracker(runner)?.checkCanSpawn('step-2').allowed;
-        },
-      },
-    ];
-    collectorResultsByCwd.set(path.join(workspace, 'first'), makeReport({ input: 900, output: 100 }));
-    collectorResultsByCwd.set(path.join(workspace, 'second'), makeReport({ input: 150, output: 50 }));
-
-    const run = await runner.execute(
-      makeConfig({
-        agents: [makeAgent('first-agent', { cwd: 'first' }), makeAgent('second-agent', { cwd: 'second' })],
-        steps: [
-          makeStep('step-1', 'first-agent'),
-          makeStep('step-2', 'second-agent', { dependsOn: ['step-1'] }),
-        ],
-        swarm: {
-          tokenBudget: 5_000,
-        },
-      }),
-      'default'
-    );
-
-    expect(run.status).toBe('completed');
-    expect(checkCanSpawnAllowed).toBe(true);
-    expect(mockSubprocessSpawn).toHaveBeenCalledTimes(2);
-  });
-
-  it('retry attempts consume from same budget', async () => {
-    const workspace = createWorkspace(['retry-agent']);
-    const dbHarness = makeDbHarness();
-    const runner = makeRunner(workspace, dbHarness.db);
-    activeRunner = runner;
-
-    let usageBeforeRetry: number | undefined;
-
-    queuedSubprocessResults = [
-      { stdout: 'first attempt failed\n', code: 1 },
-      {
-        stdout: 'retry succeeded\n',
-        code: 0,
-        onSpawn: () => {
-          usageBeforeRetry = getBudgetTracker(runner)?.getStepUsage('retry-step').total;
-        },
-      },
-    ];
-    queuedCollectorResults = [
-      makeReport({ input: 500, output: 100 }, { finalStatus: 'failed' }),
-      makeReport({ input: 250, output: 100 }),
-    ];
-
-    const run = await runner.execute(
-      makeConfig({
-        agents: [
-          makeAgent('retry-agent', {
-            cwd: 'retry-agent',
-            constraints: { maxTokens: 1_000 },
-          }),
-        ],
-        steps: [makeStep('retry-step', 'retry-agent', { retries: 1 })],
-      }),
-      'default'
-    );
-
-    const tracker = getBudgetTracker(runner);
-
-    expect(run.status).toBe('completed');
-    expect(usageBeforeRetry).toBe(600);
-    expect(tracker?.getStepUsage('retry-step')).toEqual({
-      input: 750,
-      output: 200,
-      cacheRead: 0,
-      total: 950,
-    });
-    expect(tracker?.getStepBudgetStatus('retry-step')).toEqual({
-      used: 950,
-      limit: 1_000,
-      over: false,
-    });
-    expect(mockCollectCliSession).toHaveBeenCalledTimes(2);
-  });
-
-  it('parallel steps track budget correctly', async () => {
-    const workspace = createWorkspace(['parallel-a', 'parallel-b']);
-    const dbHarness = makeDbHarness();
-    const runner = makeRunner(workspace, dbHarness.db);
-    activeRunner = runner;
-
-    queuedSubprocessResults = [
-      { stdout: 'parallel a\n', code: 0, delayMs: 10 },
-      { stdout: 'parallel b\n', code: 0, delayMs: 1 },
-    ];
-    collectorResultsByCwd.set(path.join(workspace, 'parallel-a'), makeReport({ input: 500, output: 200 }));
-    collectorResultsByCwd.set(path.join(workspace, 'parallel-b'), makeReport({ input: 700, output: 200 }));
-
-    const run = await runner.execute(
-      makeConfig({
-        agents: [
-          makeAgent('parallel-a', { cwd: 'parallel-a' }),
-          makeAgent('parallel-b', { cwd: 'parallel-b' }),
-        ],
-        steps: [makeStep('parallel-a', 'parallel-a'), makeStep('parallel-b', 'parallel-b')],
-        swarm: {
-          tokenBudget: 5_000,
-        },
-      }),
-      'default'
-    );
-
-    const tracker = getBudgetTracker(runner);
-
-    expect(run.status).toBe('completed');
-    expect(tracker?.getStepUsage('parallel-a')).toEqual({
-      input: 500,
-      output: 200,
-      cacheRead: 0,
-      total: 700,
-    });
-    expect(tracker?.getStepUsage('parallel-b')).toEqual({
-      input: 700,
-      output: 200,
-      cacheRead: 0,
-      total: 900,
-    });
-    expect(tracker?.getTotalUsage()).toEqual({
-      input: 1_200,
-      output: 400,
-      cacheRead: 0,
-      total: 1_600,
-    });
-    expect(tracker?.getRunSummaryBudgetData()?.workflow).toEqual({
-      used: 1_600,
-      limit: 5_000,
-      exhausted: false,
-    });
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/budget-tracker.test.ts b/packages/sdk/src/workflows/__tests__/budget-tracker.test.ts
deleted file mode 100644
index 42e07cb53..000000000
--- a/packages/sdk/src/workflows/__tests__/budget-tracker.test.ts
+++ /dev/null
@@ -1,120 +0,0 @@
-import { describe, expect, it } from 'vitest';
-
-import { BudgetExceededError, BudgetTracker, type TokenUsage } from '../budget-tracker.js';
-
-function expectUsage(actual: TokenUsage, expected: TokenUsage): void {
-  expect(actual).toEqual(expected);
-}
-
-describe('BudgetTracker', () => {
-  it('tracks usage across multiple steps', () => {
-    const tracker = new BudgetTracker({ perAgent: 100, perWorkflow: 500 });
-
-    tracker.recordUsage('planner', { input: 10, output: 5, cacheRead: 3 });
-    tracker.recordUsage('writer', { input: 20, output: 4 });
-    tracker.recordUsage('planner', { input: 1, output: 1, cacheRead: 2 });
-
-    expectUsage(tracker.getStepUsage('planner'), {
-      input: 11,
-      output: 6,
-      cacheRead: 5,
-      total: 17,
-    });
-    expectUsage(tracker.getStepUsage('writer'), {
-      input: 20,
-      output: 4,
-      cacheRead: 0,
-      total: 24,
-    });
-    expectUsage(tracker.getTotalUsage(), {
-      input: 31,
-      output: 10,
-      cacheRead: 5,
-      total: 41,
-    });
-    // total = input + output (cacheRead excluded from budget)
-    expect(tracker.getRemainingBudget()).toEqual({
-      agent: 59,
-      workflow: 459,
-    });
-  });
-
-  it('detects when a step exceeds the per-agent budget', () => {
-    const tracker = new BudgetTracker({ perAgent: 25, perWorkflow: 100 });
-
-    tracker.recordUsage('specialist', { input: 18, output: 9 });
-
-    expect(tracker.isOverBudget('specialist')).toEqual({
-      over: true,
-      reason: 'Step "specialist" exceeded per-agent budget (27/25)',
-    });
-  });
-
-  it('detects when total usage exceeds the per-workflow budget', () => {
-    const tracker = new BudgetTracker({ perAgent: 100, perWorkflow: 40 });
-
-    tracker.recordUsage('step-a', { input: 10, output: 10 });
-    tracker.recordUsage('step-b', { input: 15, output: 10 });
-
-    expect(tracker.isOverBudget('step-b')).toEqual({
-      over: true,
-      reason: 'Workflow exceeded total budget (45/40)',
-    });
-    expect(tracker.checkCanSpawn('step-c')).toEqual({
-      allowed: false,
-      reason: 'Cannot spawn step-c: workflow budget exceeded (45/40)',
-    });
-  });
-
-  it('refuses to spawn when the remaining workflow budget is nearly exhausted', () => {
-    const tracker = new BudgetTracker({ perAgent: 100, perWorkflow: 250 });
-
-    tracker.recordUsage('lead', { input: 120, output: 121 });
-
-    expect(tracker.checkCanSpawn('reviewer')).toEqual({
-      allowed: false,
-      reason: 'Cannot spawn reviewer: remaining workflow budget 9 is below step budget 100',
-    });
-  });
-
-  it('maintains correct totals when parallel steps record usage concurrently', async () => {
-    const tracker = new BudgetTracker({ perAgent: 1_000, perWorkflow: 10_000 });
-
-    await Promise.all(
-      Array.from({ length: 40 }, async (_, index) => {
-        await new Promise((resolve) => setTimeout(resolve, index % 5));
-        tracker.recordUsage(`step-${index % 4}`, {
-          input: 2,
-          output: 3,
-          cacheRead: 1,
-        });
-      })
-    );
-
-    expectUsage(tracker.getTotalUsage(), {
-      input: 80,
-      output: 120,
-      cacheRead: 40,
-      total: 200,
-    });
-
-    for (const stepName of ['step-0', 'step-1', 'step-2', 'step-3']) {
-      expectUsage(tracker.getStepUsage(stepName), {
-        input: 20,
-        output: 30,
-        cacheRead: 10,
-        total: 50,
-      });
-    }
-  });
-
-  it('exposes budget metadata on BudgetExceededError', () => {
-    const error = new BudgetExceededError('planner', 'workflow', 100, 125);
-
-    expect(error.name).toBe('BudgetExceededError');
-    expect(error.stepName).toBe('planner');
-    expect(error.budgetType).toBe('workflow');
-    expect(error.limit).toBe(100);
-    expect(error.actual).toBe(125);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/builder-paths.test.ts b/packages/sdk/src/workflows/__tests__/builder-paths.test.ts
deleted file mode 100644
index 3d0f0ff17..000000000
--- a/packages/sdk/src/workflows/__tests__/builder-paths.test.ts
+++ /dev/null
@@ -1,76 +0,0 @@
-import { describe, it, expect } from 'vitest';
-
-import { WorkflowBuilder } from '../builder.js';
-
-describe('WorkflowBuilder.paths()', () => {
-  it('records the declared paths on toConfig() output', () => {
-    const config = new WorkflowBuilder('multi-repo')
-      .paths([
-        { name: 'alpha', path: 'alpha', description: 'Demo repo A' },
-        { name: 'beta', path: 'beta', description: 'Demo repo B' },
-      ])
-      .agent('worker', { cli: 'codex' })
-      .step('noop', { type: 'deterministic', command: 'true' })
-      .toConfig();
-
-    expect(config.paths).toEqual([
-      { name: 'alpha', path: 'alpha', description: 'Demo repo A' },
-      { name: 'beta', path: 'beta', description: 'Demo repo B' },
-    ]);
-  });
-
-  it('omits the paths field entirely when none are declared', () => {
-    const config = new WorkflowBuilder('single-repo')
-      .agent('worker', { cli: 'codex' })
-      .step('noop', { type: 'deterministic', command: 'true' })
-      .toConfig();
-
-    expect(config.paths).toBeUndefined();
-  });
-
-  it('does not allow downstream callers to mutate the recorded paths via the input array', () => {
-    const original = [{ name: 'alpha', path: 'alpha' }];
-    const builder = new WorkflowBuilder('mutation-guard')
-      .paths(original)
-      .agent('w', { cli: 'codex' })
-      .step('s', { type: 'deterministic', command: 'true' });
-
-    // Mutating the original array AFTER passing it in should not change
-    // the config the builder emits.
-    original.push({ name: 'beta', path: 'beta' });
-    original[0].name = 'mutated';
-
-    const config = builder.toConfig();
-    expect(config.paths).toEqual([{ name: 'alpha', path: 'alpha' }]);
-  });
-
-  it('rejects non-array inputs', () => {
-    const builder = new WorkflowBuilder('bad-input');
-    // @ts-expect-error — runtime guard, not a type-level test
-    expect(() => builder.paths('not-an-array')).toThrow(/expects an array/);
-  });
-
-  it('rejects entries missing name or path', () => {
-    const builder = new WorkflowBuilder('bad-entry');
-    // @ts-expect-error — runtime guard
-    expect(() => builder.paths([{ name: 'alpha' }])).toThrow(/string `name` and `path`/);
-    // @ts-expect-error — runtime guard
-    expect(() => builder.paths([{ path: 'beta' }])).toThrow(/string `name` and `path`/);
-  });
-
-  it('rejects duplicate path names', () => {
-    const builder = new WorkflowBuilder('dup');
-    expect(() =>
-      builder.paths([
-        { name: 'alpha', path: 'alpha' },
-        { name: 'alpha', path: 'alpha-also' },
-      ])
-    ).toThrow(/duplicate entry name "alpha"/);
-  });
-
-  it('returns the builder so the call chains', () => {
-    const builder = new WorkflowBuilder('chain');
-    const returned = builder.paths([{ name: 'alpha', path: 'alpha' }]);
-    expect(returned).toBe(builder);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/channel-messenger.test.ts b/packages/sdk/src/workflows/__tests__/channel-messenger.test.ts
deleted file mode 100644
index 1e9867e4d..000000000
--- a/packages/sdk/src/workflows/__tests__/channel-messenger.test.ts
+++ /dev/null
@@ -1,145 +0,0 @@
-import { describe, expect, it, vi } from 'vitest';
-
-// Import from the module that will be extracted from runner.ts
-import {
-  ChannelMessenger,
-  formatError,
-  formatStepOutput,
-  sendToChannel,
-  truncateMessage,
-} from '../channel-messenger.js';
-
-describe('channel messenger helpers', () => {
-  it('sendToChannel forwards messages to the relay client', async () => {
-    const relay = { send: vi.fn().mockResolvedValue(undefined) };
-    await sendToChannel(relay, 'workflow-room', 'hello');
-    expect(relay.send).toHaveBeenCalledWith('workflow-room', 'hello');
-  });
-
-  it('truncateMessage keeps the most recent tail within the limit', () => {
-    expect(truncateMessage('abcdefghij', 4)).toBe('ghij');
-    expect(truncateMessage('abc', 10)).toBe('abc');
-  });
-
-  it('formatStepOutput returns a completion note when scrubbed output is empty', () => {
-    expect(formatStepOutput('plan', '▗▖\n')).toBe('**[plan]** Step completed — output written to disk');
-  });
-
-  it('formatStepOutput scrubs noise and formats a fenced block', () => {
-    const output = 'Thinking…\nuseful line\n';
-    expect(formatStepOutput('plan', output)).toBe('**[plan] Output:**\n```\nuseful line\n```');
-  });
-
-  it('formatStepOutput strips malformed PTY frames through the shared scrubber', () => {
-    const output = ['real result', 'qW0 | q0 / ql0 _ qqm ~ lqq = qW0 | q0 / ql0 _ qqm', 'done'].join('\n');
-    expect(formatStepOutput('plan', output)).toBe('**[plan] Output:**\n```\nreal result\ndone\n```');
-  });
-
-  it('formatStepOutput redacts secrets through the shared scrubber', () => {
-    const output = 'deploy succeeded\naccess_token=ghp_abcdefghijklmnopqrstuvwxyzABCDEFGHIJ\n';
-    const formatted = formatStepOutput('deploy', output);
-    expect(formatted).toContain('[REDACTED]');
-    expect(formatted).not.toContain('ghp_abcdefghijklmnopqrstuvwxyzABCDEFGHIJ');
-  });
-
-  it('formatError normalizes unknown errors', () => {
-    expect(formatError('build', new Error('Boom'))).toBe('**[build]** Failed: Boom');
-    expect(formatError('build', 'bad input')).toBe('**[build]** Failed: bad input');
-  });
-});
-
-describe('ChannelMessenger', () => {
-  describe('buildNonInteractiveAwareness', () => {
-    it('returns undefined when no non-interactive agents exist', () => {
-      const messenger = new ChannelMessenger();
-      const agents = new Map([['worker', { name: 'worker', cli: 'claude', interactive: true }]]);
-      const result = messenger.buildNonInteractiveAwareness(agents as any, new Map());
-      expect(result).toBeUndefined();
-    });
-
-    it('lists non-interactive agents with step references', () => {
-      const messenger = new ChannelMessenger();
-      const agents = new Map([['bg-worker', { name: 'bg-worker', cli: 'claude', interactive: false }]]);
-      const stepStates = new Map([['analyze', { row: { agentName: 'bg-worker', status: 'running' } }]]);
-      const result = messenger.buildNonInteractiveAwareness(agents as any, stepStates as any);
-      expect(result).toContain('bg-worker');
-      expect(result).toContain('{{steps.analyze.output}}');
-      expect(result).toContain('cannot receive messages');
-    });
-  });
-
-  describe('buildDelegationGuidance', () => {
-    it('includes timeout note when timeout is provided', () => {
-      const messenger = new ChannelMessenger();
-      const result = messenger.buildDelegationGuidance('claude', 300_000);
-      expect(result).toContain('5 minutes');
-      expect(result).toContain('AUTONOMOUS DELEGATION');
-    });
-
-    it('includes sub-agent option only for claude CLI', () => {
-      const messenger = new ChannelMessenger();
-      const claudeResult = messenger.buildDelegationGuidance('claude');
-      const codexResult = messenger.buildDelegationGuidance('codex');
-      expect(claudeResult).toContain('Task tool');
-      expect(codexResult).not.toContain('Task tool');
-    });
-
-    it('omits timeout note when no timeout given', () => {
-      const messenger = new ChannelMessenger();
-      const result = messenger.buildDelegationGuidance('claude');
-      expect(result).not.toContain('minutes before this step');
-    });
-  });
-
-  describe('buildRelayRegistrationNote', () => {
-    it('returns empty string for claude CLI', () => {
-      const messenger = new ChannelMessenger();
-      expect(messenger.buildRelayRegistrationNote('claude', 'worker-1')).toBe('');
-    });
-
-    it('returns registration instructions for non-claude CLIs', () => {
-      const messenger = new ChannelMessenger();
-      const result = messenger.buildRelayRegistrationNote('codex', 'helper-1');
-      expect(result).toContain('register_agent(name="helper-1")');
-      expect(result).toContain('RELAY SETUP');
-    });
-  });
-
-  describe('postCompletionReport', () => {
-    it('formats a completion report with step results', () => {
-      const postSpy = vi.fn();
-      const messenger = new ChannelMessenger({ postFn: postSpy });
-      const outcomes = [
-        { name: 'plan', agent: 'lead', status: 'completed', attempts: 1, verificationPassed: true },
-        { name: 'code', agent: 'worker', status: 'completed', attempts: 2 },
-        { name: 'optional', agent: 'worker', status: 'skipped', attempts: 0 },
-      ];
-      messenger.postCompletionReport('my-workflow', outcomes as any, 'All done', 0.95);
-      expect(postSpy).toHaveBeenCalledTimes(1);
-      const text = postSpy.mock.calls[0][0];
-      expect(text).toContain('my-workflow');
-      expect(text).toContain('Complete');
-      expect(text).toContain('95%');
-      expect(text).toContain('verified');
-      expect(text).toContain('2 attempts');
-      expect(text).toContain('skipped');
-    });
-  });
-
-  describe('postFailureReport', () => {
-    it('formats a failure report with error details', () => {
-      const postSpy = vi.fn();
-      const messenger = new ChannelMessenger({ postFn: postSpy });
-      const outcomes = [
-        { name: 'plan', agent: 'lead', status: 'completed', attempts: 1 },
-        { name: 'code', agent: 'worker', status: 'failed', attempts: 3, error: 'Timeout exceeded' },
-      ];
-      messenger.postFailureReport('my-workflow', outcomes as any, 'Step failed');
-      expect(postSpy).toHaveBeenCalledTimes(1);
-      const text = postSpy.mock.calls[0][0];
-      expect(text).toContain('Failed');
-      expect(text).toContain('1/2 steps passed');
-      expect(text).toContain('Timeout exceeded');
-    });
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/cli-session-collector.test.ts b/packages/sdk/src/workflows/__tests__/cli-session-collector.test.ts
deleted file mode 100644
index 808276419..000000000
--- a/packages/sdk/src/workflows/__tests__/cli-session-collector.test.ts
+++ /dev/null
@@ -1,64 +0,0 @@
-import { afterEach, describe, expect, it, vi } from 'vitest';
-import { mkdtempSync, rmSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import { collectCliSession } from '../cli-session-collector.js';
-
-const tempDirs: string[] = [];
-const originalHome = process.env.HOME;
-
-function makeTempDir(prefix: string): string {
-  const dir = mkdtempSync(path.join(os.tmpdir(), prefix));
-  tempDirs.push(dir);
-  return dir;
-}
-
-async function importCollectorsWithHome(homeDir: string) {
-  process.env.HOME = homeDir;
-  vi.resetModules();
-  const [claudeModule, opencodeModule] = await Promise.all([
-    import('../collectors/claude.js'),
-    import('../collectors/opencode.js'),
-  ]);
-  return {
-    ClaudeCodeCollector: claudeModule.ClaudeCodeCollector,
-    OpenCodeCollector: opencodeModule.OpenCodeCollector,
-  };
-}
-
-afterEach(() => {
-  vi.resetModules();
-  process.env.HOME = originalHome;
-  while (tempDirs.length > 0) {
-    rmSync(tempDirs.pop()!, { recursive: true, force: true });
-  }
-});
-
-describe('cli-session-collector', () => {
-  it('returns null for an unknown CLI', async () => {
-    const report = await collectCliSession({
-      cli: 'gemini',
-      cwd: '/tmp/project',
-      startedAt: 1000,
-      completedAt: 2000,
-    });
-
-    expect(report).toBeNull();
-  });
-
-  it('reports canCollect=false when configured data stores do not exist', async () => {
-    const homeDir = makeTempDir('cli-session-collector-empty-home-');
-    const { ClaudeCodeCollector, OpenCodeCollector } = await importCollectorsWithHome(homeDir);
-    const { CodexCollector } = await import('../collectors/codex.js');
-
-    expect(new ClaudeCodeCollector().canCollect()).toBe(false);
-    expect(new OpenCodeCollector().canCollect()).toBe(false);
-    expect(
-      new CodexCollector({
-        historyPath: path.join(homeDir, 'missing-history.jsonl'),
-        statePath: path.join(homeDir, 'missing-state.sqlite'),
-      }).canCollect()
-    ).toBe(false);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/collectors/claude.test.ts b/packages/sdk/src/workflows/__tests__/collectors/claude.test.ts
deleted file mode 100644
index 2da888ab2..000000000
--- a/packages/sdk/src/workflows/__tests__/collectors/claude.test.ts
+++ /dev/null
@@ -1,108 +0,0 @@
-import { afterEach, describe, expect, it, vi } from 'vitest';
-import { mkdirSync, mkdtempSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-const tempDirs: string[] = [];
-const originalHome = process.env.HOME;
-
-function makeTempDir(prefix: string): string {
-  const dir = mkdtempSync(path.join(os.tmpdir(), prefix));
-  tempDirs.push(dir);
-  return dir;
-}
-
-function encodeProjectPath(projectPath: string): string {
-  return projectPath.replace(/\//g, '--').replace(/^-+/, '');
-}
-
-function createClaudeFixture(homeDir: string, cwd: string, timestamp: number): string {
-  const claudeHome = path.join(homeDir, '.claude');
-  const projectsRoot = path.join(claudeHome, 'projects', encodeProjectPath(cwd));
-  mkdirSync(projectsRoot, { recursive: true });
-
-  const sessionId = 'session-claude-1';
-  writeFileSync(
-    path.join(claudeHome, 'history.jsonl'),
-    [
-      JSON.stringify({
-        timestamp: timestamp - 1000,
-        project: '/other/project',
-        sessionId: 'ignored-session',
-      }),
-      JSON.stringify({ timestamp, project: cwd, sessionId }),
-    ].join('\n')
-  );
-
-  writeFileSync(
-    path.join(projectsRoot, `${sessionId}.jsonl`),
-    [
-      JSON.stringify({ type: 'user', text: 'Investigate the failing command' }),
-      JSON.stringify({ type: 'tool_use', name: 'bash' }),
-      JSON.stringify({
-        type: 'assistant',
-        message: {
-          model: 'claude-sonnet-4',
-          provider: 'anthropic',
-          usage: {
-            input_tokens: 42,
-            output_tokens: 24,
-            cache_read_input_tokens: 7,
-          },
-          content: [{ text: 'Final concise summary' }],
-        },
-      }),
-    ].join('\n')
-  );
-
-  return sessionId;
-}
-
-async function importCollectorWithHome(homeDir: string) {
-  process.env.HOME = homeDir;
-  vi.resetModules();
-  const module = await import('../../collectors/claude.js');
-  return module.ClaudeCodeCollector;
-}
-
-afterEach(() => {
-  vi.resetModules();
-  process.env.HOME = originalHome;
-  while (tempDirs.length > 0) {
-    rmSync(tempDirs.pop()!, { recursive: true, force: true });
-  }
-});
-
-describe('ClaudeCodeCollector', () => {
-  it('matches by project path and timestamp and reads the session jsonl', async () => {
-    const homeDir = makeTempDir('claude-home-');
-    const cwd = '/repo/project';
-    const timestamp = 50_000;
-    const sessionId = createClaudeFixture(homeDir, cwd, timestamp);
-    const ClaudeCodeCollector = await importCollectorWithHome(homeDir);
-
-    const report = await new ClaudeCodeCollector().collect({
-      cli: 'claude',
-      cwd,
-      startedAt: timestamp - 100,
-      completedAt: timestamp + 2_000,
-    });
-
-    expect(report).not.toBeNull();
-    expect(report?.sessionId).toBe(sessionId);
-    expect(report?.model).toBe('claude-sonnet-4');
-    expect(report?.provider).toBe('anthropic');
-    expect(report?.tokens).toEqual({ input: 42, output: 24, cacheRead: 7 });
-    expect(report?.turns).toBe(1);
-    expect(report?.toolCalls).toEqual([{ name: 'bash', count: 1 }]);
-    expect(report?.summary).toBe('Final concise summary');
-    expect(report?.finalStatus).toBe('completed');
-  });
-
-  it('returns false from canCollect when history and project files are missing', async () => {
-    const homeDir = makeTempDir('claude-empty-home-');
-    const ClaudeCodeCollector = await importCollectorWithHome(homeDir);
-
-    expect(new ClaudeCodeCollector().canCollect()).toBe(false);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/collectors/codex.test.ts b/packages/sdk/src/workflows/__tests__/collectors/codex.test.ts
deleted file mode 100644
index 4ecbbfe48..000000000
--- a/packages/sdk/src/workflows/__tests__/collectors/codex.test.ts
+++ /dev/null
@@ -1,89 +0,0 @@
-import { afterEach, describe, expect, it } from 'vitest';
-import { mkdtempSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import { DatabaseSync } from 'node:sqlite';
-
-import { CodexCollector } from '../../collectors/codex.js';
-
-const tempDirs: string[] = [];
-
-function makeTempDir(prefix: string): string {
-  const dir = mkdtempSync(path.join(os.tmpdir(), prefix));
-  tempDirs.push(dir);
-  return dir;
-}
-
-function createCodexFixture(tempDir: string, cwd: string, createdAtSeconds: number) {
-  const statePath = path.join(tempDir, 'state_5.sqlite');
-  const historyPath = path.join(tempDir, 'history.jsonl');
-  const db = new DatabaseSync(statePath);
-
-  db.exec(`
-    CREATE TABLE threads (
-      id TEXT PRIMARY KEY,
-      cwd TEXT,
-      model_provider TEXT,
-      tokens_used INTEGER,
-      created_at INTEGER,
-      updated_at INTEGER
-    );
-    CREATE TABLE logs (
-      thread_id TEXT,
-      ts INTEGER,
-      level TEXT,
-      message TEXT,
-      line INTEGER
-    );
-  `);
-
-  db.prepare(
-    'INSERT INTO threads (id, cwd, model_provider, tokens_used, created_at, updated_at) VALUES (?, ?, ?, ?, ?, ?)'
-  ).run('thread-1', cwd, 'openai/gpt-5', 321, createdAtSeconds, createdAtSeconds + 3);
-  db.prepare('INSERT INTO logs (thread_id, ts, level, message, line) VALUES (?, ?, ?, ?, ?)').run(
-    'thread-1',
-    createdAtSeconds + 1,
-    'error',
-    'Command failed: bad exit code',
-    12
-  );
-  db.close();
-
-  writeFileSync(
-    historyPath,
-    `${JSON.stringify({ session_id: 'thread-1', ts: createdAtSeconds, text: 'history' })}\n`
-  );
-
-  return { statePath, historyPath };
-}
-
-afterEach(() => {
-  while (tempDirs.length > 0) {
-    rmSync(tempDirs.pop()!, { recursive: true, force: true });
-  }
-});
-
-describe('CodexCollector', () => {
-  it('matches by cwd and time window and extracts errors from logs', async () => {
-    const tempDir = makeTempDir('codex-fixture-');
-    const cwd = '/repo/codex-project';
-    const createdAtSeconds = 100;
-    const { statePath, historyPath } = createCodexFixture(tempDir, cwd, createdAtSeconds);
-    const collector = new CodexCollector({ statePath, historyPath });
-
-    const report = await collector.collect({
-      cli: 'codex',
-      cwd,
-      startedAt: 100_000,
-      completedAt: 105_000,
-    });
-
-    expect(report).not.toBeNull();
-    expect(report?.sessionId).toBe('thread-1');
-    expect(report?.provider).toBe('openai');
-    expect(report?.model).toBe('gpt-5');
-    expect(report?.tokens).toEqual({ input: 321, output: 0, cacheRead: 0 });
-    expect(report?.errors).toEqual([{ turn: 1, text: 'Command failed: bad exit code' }]);
-    expect(report?.finalStatus).toBe('failed');
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/collectors/opencode.test.ts b/packages/sdk/src/workflows/__tests__/collectors/opencode.test.ts
deleted file mode 100644
index 89e3ebd88..000000000
--- a/packages/sdk/src/workflows/__tests__/collectors/opencode.test.ts
+++ /dev/null
@@ -1,182 +0,0 @@
-import { afterEach, describe, expect, it, vi } from 'vitest';
-import { mkdirSync, mkdtempSync, rmSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import { DatabaseSync } from 'node:sqlite';
-
-const tempDirs: string[] = [];
-const originalHome = process.env.HOME;
-
-function makeTempDir(prefix: string): string {
-  const dir = mkdtempSync(path.join(os.tmpdir(), prefix));
-  tempDirs.push(dir);
-  return dir;
-}
-
-function createOpenCodeFixture(homeDir: string, cwd: string, sessionCreatedAt: number): string {
-  const dbDir = path.join(homeDir, '.local', 'share', 'opencode');
-  mkdirSync(dbDir, { recursive: true });
-  const dbPath = path.join(dbDir, 'opencode.db');
-  const db = new DatabaseSync(dbPath);
-
-  db.exec(`
-    CREATE TABLE session (id TEXT PRIMARY KEY, directory TEXT, time_created INTEGER);
-    CREATE TABLE message (id TEXT PRIMARY KEY, session_id TEXT, time_created INTEGER, data TEXT);
-    CREATE TABLE part (id TEXT PRIMARY KEY, message_id TEXT, session_id TEXT, time_created INTEGER, data TEXT);
-  `);
-
-  const insertSession = db.prepare('INSERT INTO session (id, directory, time_created) VALUES (?, ?, ?)');
-  const insertMessage = db.prepare(
-    'INSERT INTO message (id, session_id, time_created, data) VALUES (?, ?, ?, ?)'
-  );
-  const insertPart = db.prepare(
-    'INSERT INTO part (id, message_id, session_id, time_created, data) VALUES (?, ?, ?, ?, ?)'
-  );
-
-  insertSession.run('session-1', cwd, sessionCreatedAt);
-  insertSession.run('session-2', '/other/project', sessionCreatedAt + 1000);
-
-  insertMessage.run(
-    'msg-1',
-    'session-1',
-    sessionCreatedAt + 10,
-    JSON.stringify({ role: 'user', tokens: { input: 10, output: 0, cache: { read: 1 } } })
-  );
-  insertMessage.run(
-    'msg-2',
-    'session-1',
-    sessionCreatedAt + 20,
-    JSON.stringify({
-      role: 'assistant',
-      modelID: 'gpt-5',
-      providerID: 'openai',
-      finish: 'error',
-      cost: 1.25,
-      tokens: { input: 15, output: 20, cache: { read: 4 } },
-    })
-  );
-  insertMessage.run(
-    'msg-other',
-    'session-2',
-    sessionCreatedAt + 30,
-    JSON.stringify({ role: 'assistant', modelID: 'ignore-me', providerID: 'other', finish: 'completed' })
-  );
-
-  insertPart.run(
-    'part-1',
-    'msg-1',
-    'session-1',
-    sessionCreatedAt + 11,
-    JSON.stringify({ type: 'text', text: 'Planning work' })
-  );
-  insertPart.run(
-    'part-2',
-    'msg-2',
-    'session-1',
-    sessionCreatedAt + 21,
-    JSON.stringify({ type: 'tool_call', name: 'write_file' })
-  );
-  insertPart.run(
-    'part-3',
-    'msg-2',
-    'session-1',
-    sessionCreatedAt + 22,
-    JSON.stringify({ type: 'text', text: 'Error: database locked\nCleanup afterwards' })
-  );
-  insertPart.run(
-    'part-4',
-    'msg-2',
-    'session-1',
-    sessionCreatedAt + 23,
-    JSON.stringify({ type: 'text', text: 'Completed summary output' })
-  );
-
-  db.close();
-  return dbPath;
-}
-
-async function importCollectorWithHome(homeDir: string) {
-  process.env.HOME = homeDir;
-  vi.resetModules();
-  vi.doMock('node:module', () => ({
-    createRequire: () => (id: string) => {
-      if (id !== 'better-sqlite3') {
-        throw new Error(`Unexpected module request: ${id}`);
-      }
-
-      return class BetterSqliteCompat {
-        private readonly db: DatabaseSync;
-
-        constructor(filename: string) {
-          this.db = new DatabaseSync(filename, { open: true, readOnly: true });
-        }
-
-        prepare(sql: string) {
-          const statement = this.db.prepare(sql);
-          return {
-            get<T>(params?: unknown): T | undefined {
-              return statement.get(params as never) as T | undefined;
-            },
-            all<T>(params?: unknown): T[] {
-              return statement.all(params as never) as T[];
-            },
-          };
-        }
-
-        pragma(_source: string) {
-          return undefined;
-        }
-
-        close() {
-          this.db.close();
-        }
-      };
-    },
-  }));
-  const module = await import('../../collectors/opencode.js');
-  return module.OpenCodeCollector;
-}
-
-afterEach(() => {
-  vi.resetModules();
-  process.env.HOME = originalHome;
-  while (tempDirs.length > 0) {
-    rmSync(tempDirs.pop()!, { recursive: true, force: true });
-  }
-});
-
-describe('OpenCodeCollector', () => {
-  it('matches by directory and time window, aggregates tokens, and extracts errors', async () => {
-    const homeDir = makeTempDir('opencode-home-');
-    const cwd = path.join(homeDir, 'workspace');
-    const sessionCreatedAt = 10_000;
-    createOpenCodeFixture(homeDir, cwd, sessionCreatedAt);
-    const OpenCodeCollector = await importCollectorWithHome(homeDir);
-
-    const collector = new OpenCodeCollector();
-    const report = await collector.collect({
-      cli: 'opencode',
-      cwd,
-      startedAt: sessionCreatedAt + 100,
-      completedAt: sessionCreatedAt + 500,
-    });
-
-    expect(report).not.toBeNull();
-    expect(report?.sessionId).toBe('session-1');
-    expect(report?.model).toBe('gpt-5');
-    expect(report?.provider).toBe('openai');
-    expect(report?.tokens).toEqual({ input: 25, output: 20, cacheRead: 5 });
-    expect(report?.cost).toBe(1.25);
-    expect(report?.toolCalls).toEqual([{ name: 'write_file', count: 1 }]);
-    expect(report?.errors).toEqual([{ turn: 3, text: 'Error: database locked' }]);
-    expect(report?.finalStatus).toBe('failed');
-    expect(report?.summary).toBe('Completed summary output');
-  });
-
-  it('returns false from canCollect when the database is missing', async () => {
-    const homeDir = makeTempDir('opencode-missing-home-');
-    const OpenCodeCollector = await importCollectorWithHome(homeDir);
-
-    expect(new OpenCodeCollector().canCollect()).toBe(false);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/e2big-and-verify.test.ts b/packages/sdk/src/workflows/__tests__/e2big-and-verify.test.ts
deleted file mode 100644
index 0747e2b54..000000000
--- a/packages/sdk/src/workflows/__tests__/e2big-and-verify.test.ts
+++ /dev/null
@@ -1,112 +0,0 @@
-import { describe, expect, it, vi } from 'vitest';
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn(),
-  RelayError: class RelayError extends Error {},
-}));
-
-vi.mock('../../relay.js', () => ({
-  AgentRelay: vi.fn(),
-}));
-
-const { WorkflowRunner } = await import('../runner.js');
-
-describe('runVerification output_contains (token double-count fix)', () => {
-  function createRunner(): InstanceType<typeof WorkflowRunner> {
-    return new WorkflowRunner({ cwd: '/tmp/test' });
-  }
-
-  function runVerification(
-    runner: InstanceType<typeof WorkflowRunner>,
-    check: { type: 'output_contains'; value: string },
-    output: string,
-    stepName: string,
-    injectedTaskText?: string
-  ) {
-    return (runner as any).runVerification(check, output, stepName, injectedTaskText, {
-      allowFailure: true,
-    });
-  }
-
-  it('passes when token is in output and not in task injection', () => {
-    const runner = createRunner();
-    const result = runVerification(
-      runner,
-      { type: 'output_contains', value: 'DONE' },
-      'Task completed. DONE',
-      'step1'
-    );
-    expect(result.passed).toBe(true);
-  });
-
-  it('fails when token is missing from output entirely', () => {
-    const runner = createRunner();
-    const result = runVerification(
-      runner,
-      { type: 'output_contains', value: 'DONE' },
-      'Task completed without the marker',
-      'step1'
-    );
-    expect(result.passed).toBe(false);
-    expect(result.error).toContain('does not contain "DONE"');
-  });
-
-  it('passes when token is in both task injection and agent output', () => {
-    const runner = createRunner();
-    const result = runVerification(
-      runner,
-      { type: 'output_contains', value: 'REFLECTION_COMPLETE' },
-      'Your task: output REFLECTION_COMPLETE when done\n\nI have finished. REFLECTION_COMPLETE',
-      'step1',
-      'Your task: output REFLECTION_COMPLETE when done'
-    );
-    expect(result.passed).toBe(true);
-  });
-
-  it('fails when token appears only in task injection (not produced by agent)', () => {
-    const runner = createRunner();
-    const result = runVerification(
-      runner,
-      { type: 'output_contains', value: 'REFLECTION_COMPLETE' },
-      'Your task: output REFLECTION_COMPLETE when done\n\nI worked on it but forgot the marker.',
-      'step1',
-      'Your task: output REFLECTION_COMPLETE when done'
-    );
-    expect(result.passed).toBe(false);
-    expect(result.error).toContain('does not contain "REFLECTION_COMPLETE"');
-  });
-
-  it('handles token appearing multiple times in task injection', () => {
-    const runner = createRunner();
-    const taskText = 'Output DONE when done. Remember: DONE is required.';
-    const output = taskText + '\n\nAll work complete. DONE';
-    const result = runVerification(
-      runner,
-      { type: 'output_contains', value: 'DONE' },
-      output,
-      'step1',
-      taskText
-    );
-    expect(result.passed).toBe(true);
-  });
-
-  it('fails when token appears same number of times as in task injection', () => {
-    const runner = createRunner();
-    const taskText = 'Output DONE when done. Remember: DONE is required.';
-    const output = taskText + '\n\nAll work complete but no marker here.';
-    const result = runVerification(
-      runner,
-      { type: 'output_contains', value: 'DONE' },
-      output,
-      'step1',
-      taskText
-    );
-    expect(result.passed).toBe(false);
-  });
-
-  it('handles empty token gracefully', () => {
-    const runner = createRunner();
-    const result = runVerification(runner, { type: 'output_contains', value: '' }, 'some output', 'step1');
-    expect(result.passed).toBe(false);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/e2e-permissions.test.ts b/packages/sdk/src/workflows/__tests__/e2e-permissions.test.ts
deleted file mode 100644
index 257a802fe..000000000
--- a/packages/sdk/src/workflows/__tests__/e2e-permissions.test.ts
+++ /dev/null
@@ -1,413 +0,0 @@
-import { beforeEach, afterEach, describe, expect, it, vi } from 'vitest';
-import { mkdtempSync, mkdirSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import { fileURLToPath } from 'node:url';
-
-import type { WorkflowDb } from '../runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../types.js';
-import type { ProvisionResult, WorkflowProvisionConfig } from '../../provisioner/types.js';
-
-const fixturePath = fileURLToPath(new URL('./fixtures/permission-test.yaml', import.meta.url));
-
-const permissionProfiles = {
-  reader: {
-    access: 'readonly',
-    scopes: ['relayfile:fs:read:/**'],
-    summary: { readonly: 4, readwrite: 0, denied: 0, customScopes: 0 },
-  },
-  writer: {
-    access: 'readwrite',
-    scopes: ['relayfile:fs:read:/src/tests/**', 'relayfile:fs:write:/src/tests/**'],
-    summary: { readonly: 0, readwrite: 1, denied: 2, customScopes: 0 },
-  },
-  'admin-lead': {
-    access: 'full',
-    scopes: ['relayfile:fs:read:/**', 'relayfile:fs:write:/**'],
-    summary: { readonly: 0, readwrite: 6, denied: 0, customScopes: 0 },
-  },
-} as const;
-
-type PermissionProfile = (typeof permissionProfiles)[keyof typeof permissionProfiles];
-
-function buildCompiledPermissions(agentName: string, workspace: string, profile: PermissionProfile) {
-  return {
-    agentName,
-    workspace,
-    effectiveAccess: profile.access,
-    inherited: profile.access !== 'full',
-    sources: [{ type: 'yaml' as const, label: 'permissions', ruleCount: profile.scopes.length }],
-    readonlyPatterns: profile.access === 'readonly' ? ['**'] : [],
-    readwritePatterns:
-      profile.access === 'full'
-        ? ['**']
-        : profile.scopes
-            .filter((scope) => scope.startsWith('relayfile:fs:write:'))
-            .map((scope) => scope.split(':').slice(3).join(':')),
-    deniedPatterns: agentName === 'writer' ? ['.env', 'secrets/**'] : [],
-    readonlyPaths: Array.from({ length: profile.summary.readonly }, (_, index) => `readonly-${index}.txt`),
-    readwritePaths: Array.from({ length: profile.summary.readwrite }, (_, index) => `write-${index}.txt`),
-    deniedPaths: Array.from({ length: profile.summary.denied }, (_, index) => `denied-${index}.txt`),
-    scopes: [...profile.scopes],
-    network: undefined,
-    exec: undefined,
-    acl: {},
-    summary: { ...profile.summary },
-  };
-}
-
-let lastProvisionCall: WorkflowProvisionConfig | null = null;
-let lastProvisionResult: ProvisionResult | null = null;
-
-const mockProvisionWorkflowAgents = vi.fn(
-  async (input: WorkflowProvisionConfig): Promise<ProvisionResult> => {
-    lastProvisionCall = input;
-
-    const agentNames = Object.keys(input.agents ?? {});
-    const tokens = new Map<string, string>();
-    const scopes = new Map<string, string[]>();
-    const agents = Object.fromEntries(
-      agentNames.map((agentName) => {
-        const profile = permissionProfiles[agentName as keyof typeof permissionProfiles];
-        const token = `jwt-${agentName}`;
-        const compiled = buildCompiledPermissions(agentName, input.workspace, profile);
-
-        tokens.set(agentName, token);
-        scopes.set(agentName, [...profile.scopes]);
-
-        return [
-          agentName,
-          {
-            name: agentName,
-            tokenPath: path.join(input.projectDir, '.relay', 'tokens', `${agentName}.jwt`),
-            token,
-            scopes: [...profile.scopes],
-            compiled,
-          },
-        ];
-      })
-    );
-
-    const result: ProvisionResult = {
-      agents,
-      agentNames,
-      adminToken: 'jwt-admin',
-      seededFileCount: 0,
-      seededAclCount: 0,
-      summary: agentNames.reduce(
-        (acc, agentName) => {
-          const profile = permissionProfiles[agentName as keyof typeof permissionProfiles];
-          acc.readonly += profile.summary.readonly;
-          acc.readwrite += profile.summary.readwrite;
-          acc.denied += profile.summary.denied;
-          acc.customScopes += profile.summary.customScopes;
-          return acc;
-        },
-        { readonly: 0, readwrite: 0, denied: 0, customScopes: 0 }
-      ),
-      mounts: new Map(),
-      tokens,
-      scopes,
-    };
-
-    lastProvisionResult = result;
-    return result;
-  }
-);
-
-const mockResolveAgentPermissions = vi.fn(
-  (agentName: string, _permissions: unknown, _projectDir: string, workspace: string) =>
-    buildCompiledPermissions(
-      agentName,
-      workspace,
-      permissionProfiles[agentName as keyof typeof permissionProfiles]
-    )
-);
-
-vi.mock('../../provisioner/index.js', async (importOriginal) => {
-  const actual = await importOriginal<typeof import('../../provisioner/index.js')>();
-  return {
-    ...actual,
-    provisionWorkflowAgents: mockProvisionWorkflowAgents,
-    resolveAgentPermissions: mockResolveAgentPermissions,
-  };
-});
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_live_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: {
-    register: vi.fn().mockResolvedValue({ token: 'token-1' }),
-  },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-class MockRelayError extends Error {
-  code: string;
-
-  constructor(code: string, message: string, status = 400) {
-    super(message);
-    this.code = code;
-    this.name = 'RelayError';
-    (this as any).status = status;
-  }
-}
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: MockRelayError,
-}));
-
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-let waitForIdleFn: (ms?: number) => Promise<'idle' | 'timeout' | 'exited'>;
-let mockSpawnOutputs: string[] = [];
-
-const mockAgent = {
-  name: 'test-agent-abc',
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return waitForIdleFn;
-  },
-  release: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockListeners = new Map<string, Set<(...args: any[]) => void>>();
-function emitMockEvent(event: string, ...args: any[]): void {
-  const set = mockListeners.get(event);
-  if (set) for (const cb of set) cb(...args);
-}
-
-const defaultSpawnPtyImplementation = async ({ name, task }: { name: string; task?: string }) => {
-  const queued = mockSpawnOutputs.shift();
-  const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-  const output = queued ?? (stepComplete ? `STEP_COMPLETE:${stepComplete}\n` : 'STEP_COMPLETE:unknown\n');
-
-  queueMicrotask(() => {
-    emitMockEvent('workerOutput', { name, chunk: output });
-  });
-
-  return { ...mockAgent, name };
-};
-
-const mockRelayInstance = {
-  spawnPty: vi.fn().mockImplementation(defaultSpawnPtyImplementation),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  addListener: vi.fn((event: string, cb: (...args: any[]) => void) => {
-    let set = mockListeners.get(event);
-    if (!set) {
-      set = new Set();
-      mockListeners.set(event, set);
-    }
-    set.add(cb);
-    return () => set!.delete(cb);
-  }),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-};
-
-vi.mock('../../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-const { WorkflowRunner } = await import('../runner.js');
-const { formatDryRunReport } = await import('../dry-run-format.js');
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((step) => step.runId === runId);
-    }),
-  };
-}
-
-function never<T>(): Promise<T> {
-  return new Promise(() => {});
-}
-
-function createWorkspace(): string {
-  const dir = mkdtempSync(path.join(os.tmpdir(), 'relay-workflow-permissions-'));
-  mkdirSync(path.join(dir, 'src', 'tests'), { recursive: true });
-  mkdirSync(path.join(dir, 'src'), { recursive: true });
-  mkdirSync(path.join(dir, 'secrets'), { recursive: true });
-  writeFileSync(path.join(dir, 'README.md'), '# workspace\n');
-  writeFileSync(path.join(dir, 'src', 'index.ts'), 'export const value = 1;\n');
-  writeFileSync(path.join(dir, 'src', 'tests', 'fixture.txt'), 'fixture\n');
-  writeFileSync(path.join(dir, '.env'), 'TOKEN=secret\n');
-  writeFileSync(path.join(dir, 'secrets', 'prod.txt'), 'top-secret\n');
-  return dir;
-}
-
-async function loadPermissionFixture(
-  runner: InstanceType<typeof WorkflowRunner>,
-  options: { includeLeadStep?: boolean } = {}
-): Promise<RelayYamlConfig> {
-  const config = await runner.parseYamlFile(fixturePath);
-  config.trajectories = false;
-
-  if (options.includeLeadStep) {
-    const workflow = config.workflows?.find((entry) => entry.name === 'test');
-    workflow?.steps.push({
-      name: 'lead-step',
-      agent: 'admin-lead',
-      dependsOn: ['read-step', 'write-step'],
-      task: 'Verify admin lead permissions are available and conclude the workflow.',
-    });
-  }
-
-  return config;
-}
-
-describe('WorkflowRunner permissions integration', () => {
-  let db: WorkflowDb;
-  let runner: InstanceType<typeof WorkflowRunner>;
-  let workspaceDir: string;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    waitForExitFn = vi.fn().mockResolvedValue('exited');
-    waitForIdleFn = vi.fn().mockImplementation(() => never());
-    mockSpawnOutputs = [];
-    mockAgent.release.mockResolvedValue(undefined);
-    mockRelayInstance.spawnPty.mockImplementation(defaultSpawnPtyImplementation);
-    mockListeners.clear();
-    lastProvisionCall = null;
-    lastProvisionResult = null;
-    workspaceDir = createWorkspace();
-    db = makeDb();
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test', cwd: workspaceDir });
-  });
-
-  afterEach(() => {
-    vi.restoreAllMocks();
-    rmSync(workspaceDir, { recursive: true, force: true });
-  });
-
-  it('provisions permissions, propagates agent tokens, and clears workflow tokens after completion', async () => {
-    const config = await loadPermissionFixture(runner, { includeLeadStep: true });
-    const provisionSpy = vi.spyOn(runner as any, 'provisionAgents');
-    const nonInteractiveCommandSpy = vi
-      .spyOn(WorkflowRunner, 'buildNonInteractiveCommand')
-      .mockImplementation(() => ({
-        cmd: 'sh',
-        args: ['-c', 'printf "RELAY_AGENT_TOKEN=%s" "$RELAY_AGENT_TOKEN"'],
-      }));
-
-    const run = await runner.execute(config, 'test');
-    const steps = await db.getStepsByRunId(run.id);
-    const stepByName = new Map(steps.map((step) => [step.stepName, step]));
-    const provisionedScopes = lastProvisionResult?.scopes;
-    const spawnCalls = (mockRelayInstance.spawnPty as any).mock.calls.map(
-      ([input]: [{ agentToken?: string; name: string }]) => input
-    );
-
-    expect(run.status).toBe('completed');
-    expect(provisionSpy).toHaveBeenCalledTimes(1);
-    expect(mockProvisionWorkflowAgents).toHaveBeenCalledTimes(1);
-    expect(lastProvisionCall?.workspace).toBe('ws-test');
-    expect(lastProvisionCall?.projectDir).toBe(workspaceDir);
-    expect(Object.keys(lastProvisionCall?.agents ?? {})).toEqual(['reader', 'writer', 'admin-lead']);
-
-    expect(provisionedScopes?.get('reader')).toEqual(['relayfile:fs:read:/**']);
-    expect(provisionedScopes?.get('reader')?.some((scope) => scope.includes(':write:'))).toBe(false);
-    expect(provisionedScopes?.get('writer')).toEqual([
-      'relayfile:fs:read:/src/tests/**',
-      'relayfile:fs:write:/src/tests/**',
-    ]);
-    expect(provisionedScopes?.get('writer')?.filter((scope) => scope.includes(':write:'))).toEqual([
-      'relayfile:fs:write:/src/tests/**',
-    ]);
-    expect(provisionedScopes?.get('admin-lead')).toEqual(['relayfile:fs:read:/**', 'relayfile:fs:write:/**']);
-
-    expect(nonInteractiveCommandSpy).toHaveBeenCalledTimes(2);
-    expect(stepByName.get('read-step')?.output).toBe('RELAY_AGENT_TOKEN=jwt-reader');
-    expect(stepByName.get('write-step')?.output).toBe('RELAY_AGENT_TOKEN=jwt-writer');
-
-    expect(spawnCalls.length).toBeGreaterThan(0);
-    expect(
-      spawnCalls.every(
-        (call: { agentToken: string }) => typeof call.agentToken === 'string' && call.agentToken.length > 0
-      )
-    ).toBe(true);
-    expect(spawnCalls[0]?.agentToken).toBe('jwt-admin-lead');
-
-    expect((runner as any).agentTokens.size).toBe(0);
-    expect((runner as any).agentMounts.size).toBe(0);
-  }, 20_000);
-
-  it('shows a permissions summary in dry-run mode', async () => {
-    const config = await loadPermissionFixture(runner);
-    const report = runner.dryRun(config, 'test');
-    const formatted = formatDryRunReport(report);
-
-    expect(report.permissions).toEqual(
-      expect.arrayContaining([
-        expect.objectContaining({
-          agent: 'reader',
-          access: 'readonly',
-          writePaths: 0,
-        }),
-        expect.objectContaining({
-          agent: 'writer',
-          access: 'readwrite',
-          writePaths: 1,
-        }),
-        expect.objectContaining({
-          agent: 'admin-lead',
-          access: 'full',
-        }),
-      ])
-    );
-
-    expect(formatted).toContain('Permissions');
-    expect(formatted).toContain('reader');
-    expect(formatted).toContain('writer');
-    expect(formatted).toContain('admin-lead');
-    expect(formatted).toContain('readonly');
-    expect(formatted).toContain('readwrite');
-    expect(formatted).toContain('full');
-  }, 20_000);
-});
diff --git a/packages/sdk/src/workflows/__tests__/fixtures/.agentignore b/packages/sdk/src/workflows/__tests__/fixtures/.agentignore
deleted file mode 100644
index 8c8d008f1..000000000
--- a/packages/sdk/src/workflows/__tests__/fixtures/.agentignore
+++ /dev/null
@@ -1,2 +0,0 @@
-.env
-secrets/**
diff --git a/packages/sdk/src/workflows/__tests__/fixtures/.reader.agentreadonly b/packages/sdk/src/workflows/__tests__/fixtures/.reader.agentreadonly
deleted file mode 100644
index 2d348c17c..000000000
--- a/packages/sdk/src/workflows/__tests__/fixtures/.reader.agentreadonly
+++ /dev/null
@@ -1,2 +0,0 @@
-docs/**
-README.md
diff --git a/packages/sdk/src/workflows/__tests__/fixtures/permission-test.yaml b/packages/sdk/src/workflows/__tests__/fixtures/permission-test.yaml
deleted file mode 100644
index a82ef6214..000000000
--- a/packages/sdk/src/workflows/__tests__/fixtures/permission-test.yaml
+++ /dev/null
@@ -1,42 +0,0 @@
-version: '1.0'
-name: permission-e2e-test
-swarm:
-  pattern: dag
-  channel: wf-perm-e2e
-agents:
-  - name: reader
-    cli: claude
-    preset: reviewer
-    permissions:
-      access: readonly
-  - name: writer
-    cli: codex
-    preset: worker
-    permissions:
-      access: readwrite
-      files:
-        write: ['src/tests/**']
-        deny: ['.env', 'secrets/**']
-  - name: admin-lead
-    cli: claude
-    preset: lead
-    permissions:
-      access: full
-workflows:
-  - name: test
-    steps:
-      - name: check-env
-        type: deterministic
-        command: 'echo "checking env"'
-      - name: read-step
-        agent: reader
-        dependsOn: [check-env]
-        task: 'Verify you have read access. Check RELAY_AGENT_TOKEN is set.'
-        verification:
-          type: exit_code
-      - name: write-step
-        agent: writer
-        dependsOn: [check-env]
-        task: 'Verify you can write to src/tests/. Check RELAY_AGENT_TOKEN is set.'
-        verification:
-          type: exit_code
diff --git a/packages/sdk/src/workflows/__tests__/permission-types.test.ts b/packages/sdk/src/workflows/__tests__/permission-types.test.ts
deleted file mode 100644
index 779ea2f5a..000000000
--- a/packages/sdk/src/workflows/__tests__/permission-types.test.ts
+++ /dev/null
@@ -1,154 +0,0 @@
-import { mkdir, mkdtemp, rm, writeFile } from 'node:fs/promises';
-import { tmpdir } from 'node:os';
-import path from 'node:path';
-
-import { afterEach, describe, expect, it } from 'vitest';
-
-import { compileAgentScopes, resolveAgentPermissions } from '../../provisioner/compiler.js';
-import type {
-  AccessPreset,
-  AgentDefinition,
-  AgentWorkflowStep,
-  DeterministicWorkflowStep,
-} from '../types.js';
-import { isAgentStep, isDeterministicStep, isRestrictedAgent } from '../types.js';
-
-const tempDirs: string[] = [];
-
-async function createWorkspace(files: Record<string, string>) {
-  const dir = await mkdtemp(path.join(tmpdir(), 'relay-workflow-permission-types-'));
-  tempDirs.push(dir);
-
-  for (const [relativePath, content] of Object.entries(files)) {
-    const filePath = path.join(dir, relativePath);
-    await mkdir(path.dirname(filePath), { recursive: true });
-    await writeFile(filePath, content);
-  }
-
-  return dir;
-}
-
-afterEach(async () => {
-  while (tempDirs.length > 0) {
-    await rm(tempDirs.pop()!, { recursive: true, force: true });
-  }
-});
-
-describe('workflow permission types', () => {
-  it('allows agents to omit permissions without becoming restricted', () => {
-    const agent: AgentDefinition = {
-      name: 'worker',
-      cli: 'codex',
-      task: 'Write tests',
-    };
-
-    expect(agent.permissions).toBeUndefined();
-    expect(isRestrictedAgent(agent)).toBe(false);
-  });
-
-  it.each(['readonly', 'readwrite', 'restricted', 'full'] as const satisfies readonly AccessPreset[])(
-    'accepts the %s access preset',
-    async (access) => {
-      const workspace = await createWorkspace({
-        'src/index.ts': 'export const value = 1;\n',
-      });
-
-      const compiled = compileAgentScopes({
-        agentName: `${access}-agent`,
-        workspace: 'relay-test',
-        projectDir: workspace,
-        permissions: {
-          access,
-          inherit: false,
-        },
-      });
-
-      expect(compiled.effectiveAccess).toBe(access);
-      expect(isRestrictedAgent({ name: 'agent', cli: 'codex', permissions: { access } })).toBe(
-        access === 'readonly' || access === 'restricted'
-      );
-    }
-  );
-
-  it('compiles full permissions with read/write access for all files', async () => {
-    const workspace = await createWorkspace({
-      '.agentignore': 'secret.txt\n',
-      '.agentreadonly': 'locked.txt\n',
-      'locked.txt': 'lock me\n',
-      'secret.txt': 'classified\n',
-      'src/index.ts': 'export const value = 1;\n',
-    });
-
-    const compiled = compileAgentScopes({
-      agentName: 'lead',
-      workspace: 'relay-test',
-      projectDir: workspace,
-      permissions: {
-        access: 'full',
-        network: false,
-        exec: ['npm test'],
-        scopes: ['custom:relay:debug'],
-      },
-    });
-
-    expect(compiled.effectiveAccess).toBe('full');
-    expect(compiled.inherited).toBe(false);
-    expect(compiled.readonlyPaths).toEqual([]);
-    expect(compiled.deniedPaths).toEqual([]);
-    expect(compiled.readwritePaths).toEqual([
-      '.agentignore',
-      '.agentreadonly',
-      'locked.txt',
-      'secret.txt',
-      'src/index.ts',
-    ]);
-    expect(compiled.scopes).toContain('relayfile:fs:read:/secret.txt');
-    expect(compiled.scopes).toContain('relayfile:fs:write:/secret.txt');
-    expect(compiled.scopes).toContain('relayfile:fs:read:/src/index.ts');
-    expect(compiled.scopes).toContain('relayfile:fs:write:/src/index.ts');
-    expect(compiled.scopes).toContain('custom:relay:debug');
-    expect(compiled.network).toBe(false);
-    expect(compiled.exec).toEqual(['npm test']);
-    expect(compiled.summary).toEqual({
-      readonly: 0,
-      readwrite: 5,
-      denied: 0,
-      customScopes: 1,
-    });
-  });
-
-  it('preserves backwards-compatible default resolution when permissions are undefined', async () => {
-    const workspace = await createWorkspace({
-      '.agentignore': 'blocked.txt\n',
-      '.agentreadonly': 'locked.txt\n',
-      'blocked.txt': 'do not read\n',
-      'locked.txt': 'read only\n',
-      'writable.txt': 'can edit\n',
-    });
-
-    const compiled = resolveAgentPermissions('legacy-worker', undefined, workspace, 'relay-test');
-
-    expect(compiled.effectiveAccess).toBe('readwrite');
-    expect(compiled.inherited).toBe(true);
-    expect(compiled.readonlyPaths).toEqual(['locked.txt']);
-    expect(compiled.readwritePaths).toEqual(['.agentignore', '.agentreadonly', 'writable.txt']);
-    expect(compiled.deniedPaths).toEqual(['blocked.txt']);
-  });
-
-  it('keeps legacy workflow step aliases compatible with WorkflowStep guards', () => {
-    const agentStep: AgentWorkflowStep = {
-      name: 'draft',
-      agent: 'worker',
-      task: 'Draft the summary',
-    };
-    const deterministicStep: DeterministicWorkflowStep = {
-      name: 'check',
-      type: 'deterministic',
-      command: 'npm test',
-    };
-
-    expect(isAgentStep(agentStep)).toBe(true);
-    expect(isDeterministicStep(agentStep)).toBe(false);
-    expect(isDeterministicStep(deterministicStep)).toBe(true);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/permissions-integration.test.ts b/packages/sdk/src/workflows/__tests__/permissions-integration.test.ts
deleted file mode 100644
index 3fe7690a2..000000000
--- a/packages/sdk/src/workflows/__tests__/permissions-integration.test.ts
+++ /dev/null
@@ -1,701 +0,0 @@
-import { EventEmitter } from 'node:events';
-import { beforeEach, afterEach, describe, expect, it, vi } from 'vitest';
-import { mkdtempSync, mkdirSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import type { WorkflowDb } from '../runner.js';
-import type { AgentPermissions, RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../types.js';
-
-const tempDirs: string[] = [];
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-let lastProvisionResult:
-  | {
-      scopes: Map<string, string[]>;
-      tokens: Map<string, string>;
-    }
-  | undefined;
-
-const mockProvisionWorkflowAgents = vi.fn();
-
-vi.mock('../../provisioner/index.js', async () => {
-  const actual = await vi.importActual<typeof import('../../provisioner/index.js')>(
-    '../../provisioner/index.js'
-  );
-
-  mockProvisionWorkflowAgents.mockImplementation(async (config) => {
-    const scopes = new Map<string, string[]>();
-    const tokens = new Map<string, string>();
-    const agents: Record<string, unknown> = {};
-    let readonly = 0;
-    let readwrite = 0;
-    let denied = 0;
-    let customScopes = 0;
-
-    for (const [agentName, permissions] of Object.entries(config.agents ?? {}) as [
-      string,
-      AgentPermissions,
-    ][]) {
-      const compiled = actual.resolveAgentPermissions(
-        agentName,
-        permissions,
-        config.projectDir,
-        config.workspace
-      );
-      const token = `token:${agentName}`;
-
-      scopes.set(agentName, [...compiled.scopes]);
-      tokens.set(agentName, token);
-      readonly += compiled.summary.readonly;
-      readwrite += compiled.summary.readwrite;
-      denied += compiled.summary.denied;
-      customScopes += compiled.summary.customScopes;
-
-      agents[agentName] = {
-        name: agentName,
-        tokenPath: path.resolve(config.projectDir, '.relay', 'tokens', `${agentName}.jwt`),
-        token,
-        scopes: [...compiled.scopes],
-        compiled,
-      };
-    }
-
-    const result = {
-      agents,
-      agentNames: Object.keys(config.agents ?? {}),
-      adminToken: 'admin-token',
-      seededFileCount: 0,
-      seededAclCount: 0,
-      summary: { readonly, readwrite, denied, customScopes },
-      mounts: new Map(),
-      tokens,
-      scopes,
-    };
-
-    lastProvisionResult = { scopes, tokens };
-    return result;
-  });
-
-  return {
-    ...actual,
-    provisionWorkflowAgents: mockProvisionWorkflowAgents,
-  };
-});
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn(),
-  RelayError: class RelayError extends Error {},
-}));
-
-function never<T>(): Promise<T> {
-  return new Promise(() => {});
-}
-
-let queuedPtyOutputs: string[] = [];
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-let waitForIdleFn: (ms?: number) => Promise<'idle' | 'timeout' | 'exited'>;
-
-const mockAgent = {
-  name: 'workflow-agent',
-  exitCode: 0,
-  exitSignal: undefined as string | undefined,
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return waitForIdleFn;
-  },
-  release: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockListeners = new Map<string, Set<(...args: any[]) => void>>();
-function emitMockEvent(event: string, ...args: any[]): void {
-  const set = mockListeners.get(event);
-  if (set) for (const cb of set) cb(...args);
-}
-
-const mockRelayInstance = {
-  spawnPty: vi.fn(),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-  addListener: vi.fn((event: string, cb: (...args: any[]) => void) => {
-    let set = mockListeners.get(event);
-    if (!set) {
-      set = new Set();
-      mockListeners.set(event, set);
-    }
-    set.add(cb);
-    return () => set!.delete(cb);
-  }),
-};
-
-const defaultSpawnPtyImplementation = async ({ name, task }: { name: string; task?: string }) => {
-  const queued = queuedPtyOutputs.shift();
-  const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/u)?.[1]?.trim();
-  const output = queued ?? (stepComplete ? `STEP_COMPLETE:${stepComplete}\n` : 'STEP_COMPLETE:done\n');
-
-  queueMicrotask(() => {
-    emitMockEvent('workerOutput', { name, chunk: output });
-  });
-
-  return { ...mockAgent, name };
-};
-
-vi.mock('../../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-type QueuedSubprocessResult = {
-  stdout?: string;
-  stderr?: string;
-  code?: number | null;
-  signal?: string | null;
-  error?: Error;
-};
-
-let queuedSubprocessResults: QueuedSubprocessResult[] = [];
-
-const mockSubprocessSpawn = vi.fn().mockImplementation((_cmd, _args, _options) => {
-  const result = queuedSubprocessResults.shift() ?? { stdout: 'non-interactive complete\n', code: 0 };
-  const child = new EventEmitter() as EventEmitter & {
-    stdout: EventEmitter;
-    stderr: EventEmitter;
-    pid: number;
-    kill: ReturnType<typeof vi.fn>;
-  };
-
-  child.stdout = new EventEmitter();
-  child.stderr = new EventEmitter();
-  child.pid = 4321;
-  child.kill = vi.fn();
-
-  queueMicrotask(() => {
-    if (result.error) {
-      child.emit('error', result.error);
-      return;
-    }
-    if (result.stdout) {
-      child.stdout.emit('data', Buffer.from(result.stdout));
-    }
-    if (result.stderr) {
-      child.stderr.emit('data', Buffer.from(result.stderr));
-    }
-    child.emit('close', result.code ?? 0, result.signal ?? null);
-  });
-
-  return child;
-});
-
-vi.mock('node:child_process', async () => {
-  const actual = await vi.importActual<typeof import('node:child_process')>('node:child_process');
-  return {
-    ...actual,
-    spawn: mockSubprocessSpawn,
-  };
-});
-
-const { WorkflowRunner } = await import('../runner.js');
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((step) => step.runId === runId);
-    }),
-  };
-}
-
-function createProject(files: Record<string, string>): string {
-  const dir = mkdtempSync(path.join(os.tmpdir(), 'relay-permissions-integration-'));
-  tempDirs.push(dir);
-
-  for (const [relativePath, contents] of Object.entries(files)) {
-    const absolutePath = path.join(dir, relativePath);
-    mkdirSync(path.dirname(absolutePath), { recursive: true });
-    writeFileSync(absolutePath, contents);
-  }
-
-  return dir;
-}
-
-function createBaseProject(): string {
-  return createProject({
-    'src/app.ts': 'export const app = true;\n',
-    'docs/review.md': '# review\n',
-    '.env': 'SECRET=1\n',
-  });
-}
-
-function makeRunner(cwd: string): InstanceType<typeof WorkflowRunner> {
-  return new WorkflowRunner({
-    cwd,
-    db: makeDb(),
-    workspaceId: 'ws-test',
-    relay: {
-      env: {
-        AGENT_RELAY_WORKFLOW_DISABLE_RELAYCAST: '1',
-      },
-    },
-  });
-}
-
-function makeConfig(
-  agents: RelayYamlConfig['agents'],
-  steps?: NonNullable<RelayYamlConfig['workflows']>[number]['steps'],
-  permissionProfiles?: RelayYamlConfig['permission_profiles']
-): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'permissions-integration',
-    permission_profiles: permissionProfiles,
-    swarm: { pattern: 'dag' },
-    agents,
-    workflows: [
-      {
-        name: 'default',
-        steps:
-          steps ??
-          agents.map((agent, index) => ({
-            name: `step-${index + 1}`,
-            agent: agent.name,
-            task: `Complete work for ${agent.name}`,
-          })),
-      },
-    ],
-    trajectories: false,
-  };
-}
-
-function getProvisionedScopes(agentName: string): string[] {
-  expect(lastProvisionResult).toBeDefined();
-  const scopes = lastProvisionResult?.scopes.get(agentName);
-  expect(scopes).toBeDefined();
-  return scopes ?? [];
-}
-
-beforeEach(() => {
-  vi.clearAllMocks();
-  lastProvisionResult = undefined;
-  queuedPtyOutputs = [];
-  queuedSubprocessResults = [];
-  waitForExitFn = vi.fn().mockResolvedValue('exited');
-  waitForIdleFn = vi.fn().mockImplementation(() => never());
-  mockAgent.release.mockResolvedValue(undefined);
-  mockRelayInstance.spawnPty.mockImplementation(defaultSpawnPtyImplementation);
-  mockListeners.clear();
-});
-
-afterEach(() => {
-  while (tempDirs.length > 0) {
-    rmSync(tempDirs.pop()!, { recursive: true, force: true });
-  }
-});
-
-describe('WorkflowRunner permission lifecycle integration', () => {
-  it('mints workflow tokens before spawning interactive agents', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'writer',
-        cli: 'claude',
-        permissions: { access: 'readwrite' },
-      },
-    ]);
-
-    const run = await runner.execute(config, 'default');
-
-    expect(run.status).toBe('completed');
-    expect(mockProvisionWorkflowAgents).toHaveBeenCalledTimes(1);
-    expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(1);
-    expect(mockProvisionWorkflowAgents.mock.invocationCallOrder[0]).toBeLessThan(
-      mockRelayInstance.spawnPty.mock.invocationCallOrder[0]
-    );
-  });
-
-  it('skips provisioning entirely when no agent permissions are configured', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([{ name: 'legacy-agent', cli: 'claude' }]);
-
-    const run = await runner.execute(config, 'default');
-
-    expect(run.status).toBe('completed');
-    expect(mockProvisionWorkflowAgents).not.toHaveBeenCalled();
-    expect(mockRelayInstance.spawnPty).toHaveBeenCalledTimes(1);
-  });
-
-  it('provisions reviewer agents with readonly scopes only', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'reviewer-agent',
-        cli: 'claude',
-        permissions: { access: 'readonly' },
-      },
-    ]);
-
-    const run = await runner.execute(config, 'default');
-    const scopes = getProvisionedScopes('reviewer-agent');
-
-    expect(run.status).toBe('completed');
-    expect(lastProvisionResult?.tokens.get('reviewer-agent')).toBe('token:reviewer-agent');
-    expect(scopes.length).toBeGreaterThan(0);
-    expect(scopes.every((scope) => !scope.includes(':write:'))).toBe(true);
-    expect(scopes.every((scope) => scope.includes(':read:'))).toBe(true);
-  });
-
-  it('provisions worker agents with readwrite scopes', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'worker-agent',
-        cli: 'claude',
-        permissions: { access: 'readwrite' },
-      },
-    ]);
-
-    const run = await runner.execute(config, 'default');
-    const scopes = getProvisionedScopes('worker-agent');
-
-    expect(run.status).toBe('completed');
-    expect(scopes).toContain('relayfile:fs:write:/src/app.ts');
-    expect(scopes).toContain('relayfile:fs:write:/docs/review.md');
-  });
-
-  it('provisions lead agents with full-access scopes', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'lead-agent',
-        cli: 'claude',
-        permissions: { access: 'full' },
-      },
-    ]);
-
-    const run = await runner.execute(config, 'default');
-    const scopes = getProvisionedScopes('lead-agent');
-
-    expect(run.status).toBe('completed');
-    expect(scopes).toContain('relayfile:fs:write:/.env');
-    expect(scopes).toContain('relayfile:fs:write:/src/app.ts');
-    expect(scopes).toContain('relayfile:fs:write:/docs/review.md');
-  });
-
-  it('passes the workflow agent token through to spawnPty', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'interactive-agent',
-        cli: 'claude',
-        permissions: { access: 'readwrite' },
-      },
-    ]);
-
-    const run = await runner.execute(config, 'default');
-
-    expect(run.status).toBe('completed');
-    expect(mockRelayInstance.spawnPty).toHaveBeenCalledWith(
-      expect.objectContaining({
-        agentToken: 'token:interactive-agent',
-      })
-    );
-  });
-
-  it('merges permission profiles into agent permissions before provisioning', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig(
-      [
-        {
-          name: 'profiled-agent',
-          cli: 'claude',
-          permissions: {
-            profile: 'reviewer',
-            why: 'Needs shared reviewer constraints with one extra scope',
-            files: {
-              read: ['docs/**'],
-            },
-            scopes: ['relay:custom:use:/review'],
-          },
-        },
-      ],
-      undefined,
-      {
-        reviewer: {
-          description: 'Reusable reviewer profile',
-          access: 'readonly',
-          files: {
-            read: ['src/**'],
-            deny: ['.env'],
-          },
-          exec: ['git diff'],
-        },
-      }
-    );
-
-    const run = await runner.execute(config, 'default');
-    const provisionedPermissions = mockProvisionWorkflowAgents.mock.calls[0]?.[0]?.agents?.['profiled-agent'];
-
-    expect(run.status).toBe('completed');
-    expect(provisionedPermissions).toEqual({
-      description: 'Reusable reviewer profile',
-      profile: 'reviewer',
-      why: 'Needs shared reviewer constraints with one extra scope',
-      access: 'readonly',
-      files: {
-        read: ['src/**', 'docs/**'],
-        deny: ['.env'],
-      },
-      scopes: ['relay:custom:use:/review'],
-      exec: ['git diff'],
-    });
-  });
-
-  it('injects RELAY_AGENT_TOKEN into non-interactive agent environments', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'headless-agent',
-        cli: 'claude',
-        interactive: false,
-        permissions: { access: 'readwrite' },
-      },
-    ]);
-
-    const run = await runner.execute(config, 'default');
-    const spawnOptions = mockSubprocessSpawn.mock.calls[0]?.[2] as
-      | { env?: Record<string, string> }
-      | undefined;
-
-    expect(run.status).toBe('completed');
-    expect(mockRelayInstance.spawnPty).not.toHaveBeenCalled();
-    expect(mockSubprocessSpawn).toHaveBeenCalledTimes(1);
-    expect(spawnOptions?.env?.RELAY_AGENT_TOKEN).toBe('token:headless-agent');
-    expect(spawnOptions?.env?.RELAYFILE_TOKEN).toBe('token:headless-agent');
-  });
-
-  it('merges relay.env with inherited process env for non-interactive agents', async () => {
-    const projectDir = createBaseProject();
-    const inheritedEnvKey = 'WORKFLOW_RUNNER_RELAY_ENV_MERGE_TEST';
-    const originalInheritedValue = process.env[inheritedEnvKey];
-    process.env[inheritedEnvKey] = 'inherited-value';
-
-    try {
-      const runner = new WorkflowRunner({
-        cwd: projectDir,
-        db: makeDb(),
-        workspaceId: 'ws-test',
-        relay: {
-          env: {
-            AGENT_RELAY_WORKFLOW_DISABLE_RELAYCAST: '1',
-            RELAYFILE_BASE_URL: 'https://relay.example.test',
-          },
-        },
-      });
-      const config = makeConfig([
-        {
-          name: 'env-merge-agent',
-          cli: 'claude',
-          interactive: false,
-          permissions: { access: 'readwrite' },
-        },
-      ]);
-
-      const run = await runner.execute(config, 'default');
-      const spawnOptions = mockSubprocessSpawn.mock.calls[0]?.[2] as { env?: NodeJS.ProcessEnv } | undefined;
-
-      expect(run.status).toBe('completed');
-      expect(mockSubprocessSpawn).toHaveBeenCalledTimes(1);
-      expect(spawnOptions?.env?.[inheritedEnvKey]).toBe('inherited-value');
-      expect(spawnOptions?.env?.RELAYFILE_BASE_URL).toBe('https://relay.example.test');
-      expect(spawnOptions?.env?.AGENT_RELAY_WORKFLOW_DISABLE_RELAYCAST).toBe('1');
-    } finally {
-      if (originalInheritedValue === undefined) {
-        delete process.env[inheritedEnvKey];
-      } else {
-        process.env[inheritedEnvKey] = originalInheritedValue;
-      }
-    }
-  });
-
-  it('clears workflow-scoped tokens after successful completion', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'cleanup-agent',
-        cli: 'claude',
-        permissions: { access: 'readwrite' },
-      },
-    ]);
-
-    const run = await runner.execute(config, 'default');
-
-    expect(run.status).toBe('completed');
-    expect((runner as any).agentTokens.size).toBe(0);
-  });
-
-  it('clears workflow-scoped tokens after failed workflows', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'failing-agent',
-        cli: 'claude',
-        permissions: { access: 'readwrite' },
-      },
-    ]);
-
-    mockRelayInstance.spawnPty.mockRejectedValueOnce(new Error('spawn failed'));
-
-    const run = await runner.execute(config, 'default');
-
-    expect(run.status).toBe('failed');
-    expect((runner as any).agentTokens.size).toBe(0);
-  });
-
-  it('reports resolved permissions during dry-run without minting tokens', () => {
-    const projectDir = createProject({
-      'src/app.ts': 'export const app = true;\n',
-      '.agentreadonly': 'src/app.ts\n',
-    });
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'dry-run-agent',
-        cli: 'claude',
-        permissions: {
-          access: 'readonly',
-          files: {
-            read: ['src/**'],
-          },
-          scopes: ['relay:custom:use:/feature'],
-        },
-      },
-    ]);
-
-    const report = runner.dryRun(config, 'default');
-    const permissionEntry = report.permissions?.find((entry) => entry.agent === 'dry-run-agent');
-
-    expect(report.valid).toBe(true);
-    expect(permissionEntry).toMatchObject({
-      agent: 'dry-run-agent',
-      access: 'readonly',
-      source: 'yaml',
-    });
-    expect(permissionEntry?.scopes ?? 0).toBeGreaterThan(0);
-    expect(mockProvisionWorkflowAgents).not.toHaveBeenCalled();
-    expect(mockRelayInstance.spawnPty).not.toHaveBeenCalled();
-    expect((runner as any).agentTokens.size).toBe(0);
-  });
-
-  it('rejects invalid permission config during validation before provisioning', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'invalid-agent',
-        cli: 'claude',
-        permissions: {
-          access: 'bogus' as any,
-        },
-      },
-    ]);
-
-    await expect(runner.execute(config, 'default')).rejects.toThrow('Permission validation failed');
-    expect(mockProvisionWorkflowAgents).not.toHaveBeenCalled();
-    expect(mockRelayInstance.spawnPty).not.toHaveBeenCalled();
-  });
-
-  it('rejects unknown permission profiles during validation before provisioning', async () => {
-    const projectDir = createBaseProject();
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'invalid-profile-agent',
-        cli: 'claude',
-        permissions: {
-          profile: 'missing-reviewer',
-        },
-      },
-    ]);
-
-    await expect(runner.execute(config, 'default')).rejects.toThrow('Permission validation failed');
-    expect(mockProvisionWorkflowAgents).not.toHaveBeenCalled();
-    expect(mockRelayInstance.spawnPty).not.toHaveBeenCalled();
-  });
-
-  it('merges dotfile rules with YAML overrides into the expected scopes', async () => {
-    const projectDir = createProject({
-      '.agentignore': 'blocked.txt\n',
-      '.agentreadonly': 'locked.txt\n',
-      'blocked.txt': 'blocked\n',
-      'locked.txt': 'locked\n',
-      'plain.txt': 'plain\n',
-    });
-    const runner = makeRunner(projectDir);
-    const config = makeConfig([
-      {
-        name: 'override-agent',
-        cli: 'claude',
-        permissions: {
-          access: 'restricted',
-          files: {
-            read: ['blocked.txt'],
-            write: ['locked.txt'],
-          },
-        },
-      },
-    ]);
-
-    const run = await runner.execute(config, 'default');
-    const scopes = getProvisionedScopes('override-agent');
-
-    expect(run.status).toBe('completed');
-    expect(scopes).toEqual([
-      'relayfile:fs:read:/blocked.txt',
-      'relayfile:fs:read:/locked.txt',
-      'relayfile:fs:write:/locked.txt',
-    ]);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/process-backend-executor.test.ts b/packages/sdk/src/workflows/__tests__/process-backend-executor.test.ts
deleted file mode 100644
index ddc6d284e..000000000
--- a/packages/sdk/src/workflows/__tests__/process-backend-executor.test.ts
+++ /dev/null
@@ -1,125 +0,0 @@
-import { describe, it, expect, vi } from 'vitest';
-
-import { createProcessBackendExecutor } from '../process-backend-executor.js';
-import type { ProcessBackend, ProcessEnvironment, WorkflowStep, AgentDefinition } from '../types.js';
-
-function makeEnv(
-  exec: ProcessEnvironment['exec'],
-  destroy: ProcessEnvironment['destroy'] = vi.fn(async () => undefined)
-): ProcessEnvironment {
-  return {
-    id: 'env-1',
-    homeDir: '/home/runner',
-    exec,
-    uploadFile: vi.fn(async () => undefined),
-    destroy,
-  };
-}
-
-function makeBackend(env: ProcessEnvironment): ProcessBackend {
-  return { createEnvironment: vi.fn(async () => env) };
-}
-
-function makeStep(overrides: Partial<WorkflowStep> = {}): WorkflowStep {
-  return { name: 'step-1', ...overrides } as WorkflowStep;
-}
-
-function makeAgent(overrides: Partial<AgentDefinition> = {}): AgentDefinition {
-  return { name: 'worker-1', cli: 'claude', ...overrides } as AgentDefinition;
-}
-
-describe('createProcessBackendExecutor', () => {
-  it('creates an environment, runs the built command, and destroys the env', async () => {
-    const destroy = vi.fn<ProcessEnvironment['destroy']>(async () => undefined);
-    const exec = vi.fn<ProcessEnvironment['exec']>(async () => ({ output: 'hello\n', exitCode: 0 }));
-    const env = makeEnv(exec, destroy);
-    const backend = makeBackend(env);
-
-    const executor = createProcessBackendExecutor(backend);
-    const output = await executor.executeAgentStep(
-      makeStep({ name: 'planner' }),
-      makeAgent({ cli: 'claude' }),
-      'do the thing',
-      30_000
-    );
-
-    expect(backend.createEnvironment).toHaveBeenCalledWith('planner');
-    expect(exec).toHaveBeenCalledTimes(1);
-    const [command, opts] = exec.mock.calls[0]!;
-    expect(typeof command).toBe('string');
-    expect(command).toContain('claude');
-    expect(opts?.timeoutSeconds).toBe(30);
-    expect(destroy).toHaveBeenCalledTimes(1);
-    expect(output).toBe('hello\n');
-  });
-
-  it('passes injected env and agent cwd through execOpts (not baked into the command)', async () => {
-    const exec = vi.fn<ProcessEnvironment['exec']>(async () => ({ output: 'ok', exitCode: 0 }));
-    const env = makeEnv(exec);
-    const backend = makeBackend(env);
-
-    const executor = createProcessBackendExecutor(backend, {
-      env: { ANTHROPIC_API_KEY: 'sk-test', RELAY_WORKSPACE: 'ws_123' },
-    });
-
-    await executor.executeAgentStep(
-      makeStep({ name: 'planner' }),
-      makeAgent({ cli: 'claude', cwd: '/work/repo' }),
-      'do the thing',
-      5_000
-    );
-
-    const [command, opts] = exec.mock.calls[0]!;
-    expect(command.startsWith('claude ') || command.startsWith("'claude'")).toBe(true);
-    expect(command).not.toMatch(/ANTHROPIC_API_KEY=/);
-    expect(opts?.env).toEqual({ ANTHROPIC_API_KEY: 'sk-test', RELAY_WORKSPACE: 'ws_123' });
-    expect(opts?.cwd).toBe('/work/repo');
-    expect(opts?.timeoutSeconds).toBe(5);
-  });
-
-  it('throws when the remote command exits non-zero and still destroys', async () => {
-    const destroy = vi.fn<ProcessEnvironment['destroy']>(async () => undefined);
-    const exec = vi.fn<ProcessEnvironment['exec']>(async () => ({ output: 'boom', exitCode: 2 }));
-    const env = makeEnv(exec, destroy);
-    const backend = makeBackend(env);
-
-    const executor = createProcessBackendExecutor(backend);
-
-    await expect(executor.executeAgentStep(makeStep(), makeAgent(), 'task')).rejects.toThrow(
-      /exited with code 2/
-    );
-    expect(destroy).toHaveBeenCalledTimes(1);
-  });
-
-  it('rejects cli:"api" because it does not run as a subprocess', async () => {
-    const env = makeEnv(vi.fn<ProcessEnvironment['exec']>());
-    const backend = makeBackend(env);
-    const executor = createProcessBackendExecutor(backend);
-
-    await expect(executor.executeAgentStep(makeStep(), makeAgent({ cli: 'api' }), 'task')).rejects.toThrow(
-      /cli "api"/
-    );
-  });
-
-  it('passes injected env through to exec for deterministic steps', async () => {
-    const exec = vi.fn<ProcessEnvironment['exec']>(async () => ({ output: 'ok', exitCode: 0 }));
-    const env = makeEnv(exec);
-    const backend = makeBackend(env);
-
-    const executor = createProcessBackendExecutor(backend, {
-      env: { RELAY_WORKSPACE: 'ws_123' },
-    });
-
-    const result = await executor.executeDeterministicStep!(
-      makeStep({ type: 'deterministic', command: 'echo hi', timeoutMs: 5_000 }),
-      'echo hi',
-      '/work'
-    );
-
-    expect(result).toEqual({ output: 'ok', exitCode: 0 });
-    const [, opts] = exec.mock.calls[0]!;
-    expect(opts?.cwd).toBe('/work');
-    expect(opts?.env).toEqual({ RELAY_WORKSPACE: 'ws_123' });
-    expect(opts?.timeoutSeconds).toBe(5);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/proxy-env.test.ts b/packages/sdk/src/workflows/__tests__/proxy-env.test.ts
deleted file mode 100644
index a0147fd29..000000000
--- a/packages/sdk/src/workflows/__tests__/proxy-env.test.ts
+++ /dev/null
@@ -1,178 +0,0 @@
-import { afterEach, describe, expect, it, vi } from 'vitest';
-
-import type { AgentDefinition, SwarmConfig } from '../types.js';
-import {
-  buildNormalizedProxyEnv,
-  createProxyEnvResolver,
-  getStrippedApiKeyVars,
-  isProxyEnabled,
-  RELAY_PROXY_TOKEN_ENV,
-  RELAY_PROXY_TOKEN_ENV_ALIAS,
-  RELAY_PROXY_URL_ENV,
-  RELAY_PROXY_URL_ENV_ALIAS,
-  resolveProxyTokenFromEnv,
-  resolveProxyUrlFromEnv,
-  resolveProxyEnv,
-  type ProxyEnvRegistry,
-} from '../proxy-env.js';
-import { WorkflowRunner } from '../runner.js';
-
-describe('proxy-env', () => {
-  afterEach(() => {
-    vi.restoreAllMocks();
-  });
-
-  it.each([
-    ['claude', { ANTHROPIC_BASE_URL: 'https://proxy.local', ANTHROPIC_API_KEY: 'proxy-token' }],
-    ['codex', { OPENAI_BASE_URL: 'https://proxy.local', OPENAI_API_KEY: 'proxy-token' }],
-    ['opencode', { OPENAI_BASE_URL: 'https://proxy.local', OPENAI_API_KEY: 'proxy-token' }],
-    ['aider', { OPENAI_API_BASE: 'https://proxy.local', OPENAI_API_KEY: 'proxy-token' }],
-    ['gemini', { GOOGLE_API_BASE: 'https://proxy.local', GOOGLE_API_KEY: 'proxy-token' }],
-    ['goose', { OPENAI_BASE_URL: 'https://proxy.local', OPENAI_API_KEY: 'proxy-token' }],
-    ['droid', { OPENAI_BASE_URL: 'https://proxy.local', OPENAI_API_KEY: 'proxy-token' }],
-    ['cursor', { OPENAI_BASE_URL: 'https://proxy.local', OPENAI_API_KEY: 'proxy-token' }],
-  ] as const)('returns the correct env overrides for %s', (cli, expected) => {
-    expect(resolveProxyEnv(cli, 'https://proxy.local', 'proxy-token')).toEqual(expected);
-  });
-
-  it('normalizes cli variants before resolving proxy env', () => {
-    expect(resolveProxyEnv('codex:gpt-5.4', 'https://proxy.local', 'proxy-token')).toEqual({
-      OPENAI_BASE_URL: 'https://proxy.local',
-      OPENAI_API_KEY: 'proxy-token',
-    });
-    expect(resolveProxyEnv('cursor-agent', 'https://proxy.local', 'proxy-token')).toEqual({
-      OPENAI_BASE_URL: 'https://proxy.local',
-      OPENAI_API_KEY: 'proxy-token',
-    });
-  });
-
-  it('falls back to dual-provider overrides for unknown CLIs and logs a warning', () => {
-    const warn = vi.spyOn(console, 'warn').mockImplementation(() => {});
-
-    expect(resolveProxyEnv('mystery-cli', 'https://proxy.local', 'proxy-token')).toEqual({
-      OPENAI_BASE_URL: 'https://proxy.local',
-      OPENAI_API_KEY: 'proxy-token',
-      ANTHROPIC_BASE_URL: 'https://proxy.local',
-      ANTHROPIC_API_KEY: 'proxy-token',
-    });
-    expect(warn).toHaveBeenCalledTimes(1);
-    expect(warn).toHaveBeenCalledWith(
-      expect.stringContaining('Falling back to generic OpenAI/Anthropic proxy env overrides.')
-    );
-  });
-
-  it('returns the full provider/base-url strip list', () => {
-    expect(getStrippedApiKeyVars()).toEqual([
-      'OPENAI_API_KEY',
-      'ANTHROPIC_API_KEY',
-      'OPENROUTER_API_KEY',
-      'GOOGLE_API_KEY',
-      'OPENAI_BASE_URL',
-      'ANTHROPIC_BASE_URL',
-      'OPENAI_API_BASE',
-      'GOOGLE_API_BASE',
-    ]);
-  });
-
-  it('does not strip canonical or legacy relay proxy env vars', () => {
-    expect(getStrippedApiKeyVars()).not.toContain(RELAY_PROXY_URL_ENV);
-    expect(getStrippedApiKeyVars()).not.toContain(RELAY_PROXY_URL_ENV_ALIAS);
-    expect(getStrippedApiKeyVars()).not.toContain(RELAY_PROXY_TOKEN_ENV);
-    expect(getStrippedApiKeyVars()).not.toContain(RELAY_PROXY_TOKEN_ENV_ALIAS);
-  });
-
-  it('prefers the canonical relay proxy URL env name', () => {
-    expect(
-      resolveProxyUrlFromEnv({
-        [RELAY_PROXY_URL_ENV]: 'https://cloud.proxy',
-        [RELAY_PROXY_URL_ENV_ALIAS]: 'https://legacy.proxy',
-      })
-    ).toBe('https://cloud.proxy');
-  });
-
-  it('falls back to the legacy relay proxy URL env name', () => {
-    expect(
-      resolveProxyUrlFromEnv({
-        [RELAY_PROXY_URL_ENV_ALIAS]: 'https://legacy.proxy',
-      })
-    ).toBe('https://legacy.proxy');
-  });
-
-  it('prefers the canonical relay proxy token env name', () => {
-    expect(
-      resolveProxyTokenFromEnv({
-        [RELAY_PROXY_TOKEN_ENV]: 'cloud-token',
-        [RELAY_PROXY_TOKEN_ENV_ALIAS]: 'legacy-token',
-      })
-    ).toBe('cloud-token');
-  });
-
-  it('falls back to the legacy relay proxy token env name', () => {
-    expect(
-      resolveProxyTokenFromEnv({
-        [RELAY_PROXY_TOKEN_ENV_ALIAS]: 'legacy-token',
-      })
-    ).toBe('legacy-token');
-  });
-
-  it('emits canonical and legacy relay proxy env vars together', () => {
-    expect(buildNormalizedProxyEnv('https://proxy.local', 'proxy-token')).toEqual({
-      RELAY_LLM_PROXY: 'https://proxy.local',
-      RELAY_LLM_PROXY_URL: 'https://proxy.local',
-      CREDENTIAL_PROXY_TOKEN: 'proxy-token',
-      RELAY_LLM_PROXY_TOKEN: 'proxy-token',
-    });
-  });
-
-  it('enables proxy mode only when both agent and swarm opt in', () => {
-    const agentWithProxy = { credentials: { proxy: true } } as AgentDefinition;
-    const agentWithoutProxy = { credentials: { proxy: false } } as AgentDefinition;
-    const swarmWithProxy = {
-      credentialProxy: {
-        proxyUrl: 'https://proxy.local',
-        providers: {},
-      },
-    } as SwarmConfig;
-    const swarmWithoutProxy = {} as SwarmConfig;
-
-    expect(isProxyEnabled(agentWithProxy, swarmWithProxy)).toBe(true);
-    expect(isProxyEnabled(agentWithoutProxy, swarmWithProxy)).toBe(false);
-    expect(isProxyEnabled(agentWithProxy, swarmWithoutProxy)).toBe(false);
-    expect(isProxyEnabled(undefined, swarmWithProxy)).toBe(false);
-    expect(isProxyEnabled(agentWithProxy, undefined)).toBe(false);
-  });
-
-  it('supports adding a new CLI by supplying one registry entry', () => {
-    const customRegistry = {
-      'custom-cli': [{ baseUrlVar: 'CUSTOM_API_BASE', apiKeyVar: 'CUSTOM_API_KEY' }],
-    } satisfies ProxyEnvRegistry;
-    const resolveCustomProxyEnv = createProxyEnvResolver(customRegistry);
-
-    expect(resolveCustomProxyEnv('custom-cli', 'https://proxy.local', 'proxy-token')).toEqual({
-      CUSTOM_API_BASE: 'https://proxy.local',
-      CUSTOM_API_KEY: 'proxy-token',
-    });
-  });
-
-  it('normalizes inherited proxy env before child-process propagation', () => {
-    const runner = new WorkflowRunner({
-      relay: {
-        env: {
-          RELAY_LLM_PROXY_URL: 'https://legacy.proxy',
-          RELAY_LLM_PROXY_TOKEN: 'legacy-token',
-          OPENAI_API_KEY: 'should-strip',
-        },
-      },
-    });
-
-    const env = (runner as any).getRelayEnv();
-
-    expect(env).toMatchObject({
-      RELAY_LLM_PROXY: 'https://legacy.proxy',
-      RELAY_LLM_PROXY_URL: 'https://legacy.proxy',
-      CREDENTIAL_PROXY_TOKEN: 'legacy-token',
-      RELAY_LLM_PROXY_TOKEN: 'legacy-token',
-    });
-    expect(env.OPENAI_API_KEY).toBeUndefined();
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/run-script.test.ts b/packages/sdk/src/workflows/__tests__/run-script.test.ts
deleted file mode 100644
index aba29fc43..000000000
--- a/packages/sdk/src/workflows/__tests__/run-script.test.ts
+++ /dev/null
@@ -1,551 +0,0 @@
-import { describe, expect, it } from 'vitest';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import {
-  parseTsxStderr,
-  formatWorkflowParseError,
-  runScriptWorkflow,
-  findLocalSdkWorkspace,
-  ensureLocalSdkWorkflowRuntime,
-  shouldSkipNodeStripTypesPreflight,
-} from '../run-script.js';
-
-describe('parseTsxStderr', () => {
-  it('extracts file/line/col/message from inline `file:line:col: ERROR:` format', () => {
-    const stderr = '/repo/workflow.ts:42:7: ERROR: Expected "}" but found end of file\n';
-    const parsed = parseTsxStderr(stderr);
-
-    expect(parsed).toEqual({
-      file: '/repo/workflow.ts',
-      line: 42,
-      column: 7,
-      message: 'Expected "}" but found end of file',
-    });
-  });
-
-  it('extracts pretty-printed `✘ [ERROR]` format', () => {
-    const stderr = `✘ [ERROR] Unexpected "$"
-
-    /repo/workflow.ts:10:4:
-      10 │   command: \`echo \${VAR}\`
-         ╵     ^
-`;
-    const parsed = parseTsxStderr(stderr);
-
-    expect(parsed).toMatchObject({
-      file: '/repo/workflow.ts',
-      line: 10,
-      column: 4,
-      message: 'Unexpected "$"',
-    });
-  });
-
-  it('strips ANSI color codes before matching', () => {
-    const stderr = '\x1b[31m/repo/workflow.ts:1:1: ERROR: bad token\x1b[0m\n';
-    const parsed = parseTsxStderr(stderr);
-
-    expect(parsed?.file).toBe('/repo/workflow.ts');
-    expect(parsed?.message).toBe('bad token');
-  });
-
-  it('returns null when stderr does not look like a parse error', () => {
-    expect(parseTsxStderr('Error: Cannot find module foo')).toBeNull();
-    expect(parseTsxStderr('')).toBeNull();
-  });
-});
-
-describe('formatWorkflowParseError', () => {
-  it('produces a WORKFLOW_PARSE_ERROR with template-literal hints when applicable', () => {
-    const err = formatWorkflowParseError({
-      file: '/repo/workflow.ts',
-      line: 12,
-      column: 4,
-      message: 'Unterminated template literal',
-    });
-
-    expect((err as Error & { code?: string }).code).toBe('WORKFLOW_PARSE_ERROR');
-    expect(err.message).toContain('/repo/workflow.ts:12:4');
-    expect(err.message).toMatch(/template literal/i);
-  });
-
-  it('falls back to the bare error when no hint is applicable', () => {
-    const err = formatWorkflowParseError({
-      file: '/repo/workflow.ts',
-      message: 'TypeScript parse error (see tsx output above)',
-    });
-
-    expect(err.message).toContain('TypeScript parse error');
-    expect(err.message).not.toMatch(/Hint:/);
-  });
-});
-
-describe('runScriptWorkflow', () => {
-  const nodeSupportsStripTypes = (() => {
-    const [major = 0, minor = 0] = process.versions.node.split('.').map((part) => Number(part));
-    return major > 22 || (major === 22 && minor >= 6);
-  })();
-
-  it('throws when the file does not exist', async () => {
-    await expect(runScriptWorkflow('/definitely/does/not/exist.ts')).rejects.toThrow(/File not found/);
-  });
-
-  it('rejects unsupported extensions', async () => {
-    // Use a file that exists (this test file itself) but with an unsupported ext —
-    // there is no way to make the extension unsupported on a real path other than
-    // pointing at one. Use the README as a stand-in.
-    const fakePath = path.resolve(__dirname, '../../../README.md');
-    await expect(runScriptWorkflow(fakePath)).rejects.toThrow(/Unsupported file type/);
-  });
-
-  it('falls back past Node strip-only mode for valid TypeScript enums', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'enum-workflow.ts');
-    fs.writeFileSync(
-      workflowPath,
-      `
-enum Step {
-  Done = 'done',
-}
-if (Step.Done !== 'done') {
-  throw new Error('enum did not execute');
-}
-`,
-      'utf8'
-    );
-
-    try {
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-    // Skips Node strip-only, then cold-starts tsx to actually compile and run
-    // the enum — well over Vitest's default 5s budget on a cold runner.
-  }, 30000);
-
-  it('falls back past Node strip-only mode for enums in static local imports', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'main.ts');
-    const enumModulePath = path.join(tmpDir, 'enum-module.ts');
-    fs.writeFileSync(
-      enumModulePath,
-      `
-export enum ImportedStep {
-  Done = 'done',
-}
-`,
-      'utf8'
-    );
-    fs.writeFileSync(
-      workflowPath,
-      `
-import { ImportedStep } from './enum-module.ts';
-if (ImportedStep.Done !== 'done') {
-  throw new Error('imported step did not execute');
-}
-`,
-      'utf8'
-    );
-
-    try {
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('falls back past Node strip-only mode for parameter properties and namespaces', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'parameter-property-workflow.ts');
-    fs.writeFileSync(
-      workflowPath,
-      `
-class Box {
-  constructor(public value: string) {}
-}
-namespace WorkflowValues {
-  export const done = 'done';
-}
-if (new Box(WorkflowValues.done).value !== 'done') {
-  throw new Error('unsupported syntax did not execute');
-}
-`,
-      'utf8'
-    );
-
-    try {
-      expect(shouldSkipNodeStripTypesPreflight(workflowPath)).toBe(true);
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('falls back past Node strip-only mode for unsupported syntax in static local imports', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'main.ts');
-    const helperPath = path.join(tmpDir, 'helper.ts');
-    fs.writeFileSync(
-      helperPath,
-      `
-export class ImportedBox {
-  constructor(public value: string) {}
-}
-export namespace ImportedValues {
-  export const done = 'done';
-}
-`,
-      'utf8'
-    );
-    fs.writeFileSync(
-      workflowPath,
-      `
-import { ImportedBox, ImportedValues } from './helper.ts';
-if (new ImportedBox(ImportedValues.done).value !== 'done') {
-  throw new Error('imported unsupported syntax did not execute');
-}
-`,
-      'utf8'
-    );
-
-    try {
-      expect(shouldSkipNodeStripTypesPreflight(workflowPath)).toBe(true);
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('falls back past Node strip-only mode for import-equals syntax', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'import-equals-workflow.ts');
-    fs.writeFileSync(
-      workflowPath,
-      `
-import fs = require('node:fs');
-if (!fs.existsSync(${JSON.stringify(tmpDir)})) {
-  throw new Error('import-equals workflow did not execute');
-}
-`,
-      'utf8'
-    );
-
-    try {
-      expect(shouldSkipNodeStripTypesPreflight(workflowPath)).toBe(true);
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('falls back past Node strip-only mode for import-equals syntax in static local imports', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'main.ts');
-    const helperPath = path.join(tmpDir, 'helper.ts');
-    fs.writeFileSync(
-      helperPath,
-      `
-import path = require('node:path');
-export const basename = path.basename('done.txt', '.txt');
-`,
-      'utf8'
-    );
-    fs.writeFileSync(
-      workflowPath,
-      `
-import { basename } from './helper.ts';
-if (basename !== 'done') {
-  throw new Error('imported import-equals syntax did not execute');
-}
-`,
-      'utf8'
-    );
-
-    try {
-      expect(shouldSkipNodeStripTypesPreflight(workflowPath)).toBe(true);
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('does not treat enum text in comments or strings as unsupported strip-types syntax', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'enum-text.ts');
-    fs.writeFileSync(
-      workflowPath,
-      `
-// enum CommentOnly { Value = 'value' }
-const message = "enum StringOnly { Value = 'value' }";
-const template = \`enum TemplateOnly { Value = 'value' }\`;
-if (!message || !template) {
-  throw new Error('missing values');
-}
-`,
-      'utf8'
-    );
-
-    try {
-      expect(shouldSkipNodeStripTypesPreflight(workflowPath)).toBe(false);
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('falls back for NodeNext .js specifiers backed by TypeScript source', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'main.ts');
-    const enumModulePath = path.join(tmpDir, 'enum-module.ts');
-    fs.writeFileSync(
-      enumModulePath,
-      `
-export enum ImportedStep {
-  Done = 'done',
-}
-`,
-      'utf8'
-    );
-    fs.writeFileSync(
-      workflowPath,
-      `
-import { ImportedStep } from './enum-module.js';
-if (ImportedStep.Done !== 'done') {
-  throw new Error('imported step did not execute');
-}
-`,
-      'utf8'
-    );
-
-    try {
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('handles circular static imports during strip-types preflight', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'main.ts');
-    const helperPath = path.join(tmpDir, 'helper.ts');
-    fs.writeFileSync(
-      workflowPath,
-      `
-import { helperValue } from './helper.ts';
-if (helperValue !== 'ok') {
-  throw new Error('helper did not execute');
-}
-`,
-      'utf8'
-    );
-    fs.writeFileSync(
-      helperPath,
-      `
-import type {} from './main.ts';
-export enum HelperStep {
-  Done = 'done',
-}
-export const helperValue = HelperStep.Done === 'done' ? 'ok' : 'bad';
-`,
-      'utf8'
-    );
-
-    try {
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('terminates strip-types preflight for circular imports without unsupported syntax', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'main.ts');
-    const helperPath = path.join(tmpDir, 'helper.ts');
-    fs.writeFileSync(
-      workflowPath,
-      `
-import { helperReady } from './helper.ts';
-void helperReady;
-export function mainReady() {
-  return true;
-}
-`,
-      'utf8'
-    );
-    fs.writeFileSync(
-      helperPath,
-      `
-import { mainReady } from './main.ts';
-void mainReady;
-export const helperReady = true;
-`,
-      'utf8'
-    );
-
-    try {
-      expect(shouldSkipNodeStripTypesPreflight(workflowPath)).toBe(false);
-      await expect(runScriptWorkflow(workflowPath)).resolves.toBeUndefined();
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('skips node strip-types when a transitive TypeScript import cannot be read', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'main.ts');
-    const helperPath = path.join(tmpDir, 'helper.ts');
-    fs.writeFileSync(workflowPath, "import './helper.ts';\n", 'utf8');
-    fs.mkdirSync(helperPath);
-
-    try {
-      expect(shouldSkipNodeStripTypesPreflight(workflowPath)).toBe(true);
-      await expect(runScriptWorkflow(workflowPath)).rejects.toThrow(
-        /tsx exited with code 1|EISDIR|directory/i
-      );
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  }, 30000);
-
-  it('does not mask ordinary runtime failures by falling back to another TypeScript runner', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'runtime-failure.ts');
-    fs.writeFileSync(workflowPath, "throw new Error('intentional runtime failure');\n", 'utf8');
-
-    try {
-      await expect(runScriptWorkflow(workflowPath)).rejects.toThrow(
-        nodeSupportsStripTypes
-          ? /node --experimental-strip-types exited with code 1/
-          : /(?:tsx|ts-node|npx tsx) exited with code 1/
-      );
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  });
-
-  it('does not retry side-effecting user code that only prints strip-types text', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'spoofed-strip-types.ts');
-    const markerPath = path.join(tmpDir, 'marker.txt');
-    fs.writeFileSync(
-      workflowPath,
-      `
-import fs from 'node:fs';
-fs.appendFileSync(${JSON.stringify(markerPath)}, 'ran\\n');
-console.error('ERR_UNSUPPORTED_TYPESCRIPT_SYNTAX');
-process.exit(7);
-`,
-      'utf8'
-    );
-
-    try {
-      await expect(runScriptWorkflow(workflowPath)).rejects.toThrow(
-        nodeSupportsStripTypes
-          ? /node --experimental-strip-types exited with code 7/
-          : /(?:tsx|ts-node|npx tsx) exited with code 7/
-      );
-      expect(fs.readFileSync(markerPath, 'utf8')).toBe('ran\n');
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  });
-
-  it('does not retry after user code dynamically imports unsupported strip-types syntax', async () => {
-    const tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-runner-'));
-    const workflowPath = path.join(tmpDir, 'dynamic-enum-import.ts');
-    const enumModulePath = path.join(tmpDir, 'enum-module.ts');
-    const markerPath = path.join(tmpDir, 'marker.txt');
-    fs.writeFileSync(
-      enumModulePath,
-      `
-export enum ImportedStep {
-  Done = 'done',
-}
-`,
-      'utf8'
-    );
-    fs.writeFileSync(
-      workflowPath,
-      `
-import fs from 'node:fs';
-fs.appendFileSync(${JSON.stringify(markerPath)}, 'ran\\n');
-await import(${JSON.stringify(enumModulePath)});
-`,
-      'utf8'
-    );
-
-    try {
-      await expect(runScriptWorkflow(workflowPath)).rejects.toThrow();
-      if (nodeSupportsStripTypes) {
-        expect(fs.readFileSync(markerPath, 'utf8')).toBe('ran\n');
-      }
-    } finally {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    }
-  });
-});
-
-describe('findLocalSdkWorkspace', () => {
-  it('returns null when no agent-relay workspace is in the ancestor chain', () => {
-    expect(findLocalSdkWorkspace('/tmp')).toBeNull();
-  });
-});
-
-describe('ensureLocalSdkWorkflowRuntime', () => {
-  function createTempWorkspace(): { rootDir: string; startDir: string; workflowsEntry: string } {
-    const rootDir = fs.mkdtempSync(path.join(os.tmpdir(), 'agent-relay-workspace-'));
-    const sdkDir = path.join(rootDir, 'packages', 'sdk');
-    const startDir = path.join(sdkDir, 'src', 'workflows');
-    fs.mkdirSync(startDir, { recursive: true });
-    fs.writeFileSync(path.join(rootDir, 'package.json'), JSON.stringify({ name: 'agent-relay' }), 'utf8');
-    fs.writeFileSync(path.join(sdkDir, 'package.json'), JSON.stringify({ name: '@agent-relay/sdk' }), 'utf8');
-    return {
-      rootDir,
-      startDir,
-      workflowsEntry: path.join(sdkDir, 'dist', 'workflows', 'index.js'),
-    };
-  }
-
-  it('runs local workflow runtime build commands in dependency order', () => {
-    const workspace = createTempWorkspace();
-    const calls: string[][] = [];
-    const expectedCommands = [
-      ['run', 'build:config'],
-      ['--prefix', 'packages/workflow-types', 'run', 'build'],
-      ['--prefix', 'packages/github-primitive', 'run', 'build'],
-      ['--prefix', 'packages/slack-primitive', 'run', 'build'],
-      ['--prefix', 'packages/cloud', 'run', 'build'],
-      ['run', 'build:sdk'],
-    ];
-
-    try {
-      const execRunner = ((_file: string, args?: readonly string[]) => {
-        calls.push([...(args ?? [])]);
-        if (calls.length === expectedCommands.length) {
-          fs.mkdirSync(path.dirname(workspace.workflowsEntry), { recursive: true });
-          fs.writeFileSync(workspace.workflowsEntry, '', 'utf8');
-        }
-        return Buffer.from('');
-      }) as any;
-
-      ensureLocalSdkWorkflowRuntime(workspace.startDir, execRunner);
-
-      expect(calls).toEqual(expectedCommands);
-    } finally {
-      fs.rmSync(workspace.rootDir, { recursive: true, force: true });
-    }
-  });
-
-  it('throws when local workflow runtime is still missing after build commands', () => {
-    const workspace = createTempWorkspace();
-
-    try {
-      expect(() => ensureLocalSdkWorkflowRuntime(workspace.startDir, (() => Buffer.from('')) as any)).toThrow(
-        /Local SDK workflows runtime is still missing after build/
-      );
-    } finally {
-      fs.rmSync(workspace.rootDir, { recursive: true, force: true });
-    }
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/run-summary-table.test.ts b/packages/sdk/src/workflows/__tests__/run-summary-table.test.ts
deleted file mode 100644
index 24f7e95c8..000000000
--- a/packages/sdk/src/workflows/__tests__/run-summary-table.test.ts
+++ /dev/null
@@ -1,168 +0,0 @@
-import { describe, expect, it, vi } from 'vitest';
-
-import { formatRunSummaryTable } from '../run-summary-table.js';
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn(),
-  RelayError: class RelayError extends Error {},
-}));
-
-vi.mock('../../relay.js', () => ({
-  AgentRelay: vi.fn(),
-}));
-
-const { WorkflowRunner } = await import('../runner.js');
-
-describe('formatRunSummaryTable', () => {
-  it('renders all-passing steps', () => {
-    const output = formatRunSummaryTable(
-      [
-        { name: 'plan', agent: 'lead', status: 'completed', attempts: 1, durationMs: 1_000 },
-        { name: 'implement', agent: 'worker', status: 'completed', attempts: 1, durationMs: 2_000 },
-      ],
-      new Map([
-        [
-          'plan',
-          {
-            cli: 'claude',
-            sessionId: 's1',
-            model: 'claude-sonnet-4',
-            provider: 'anthropic',
-            durationMs: 1_200,
-            cost: 0.75,
-            tokens: { input: 100, output: 50, cacheRead: 10 },
-            turns: 2,
-            toolCalls: [],
-            errors: [],
-            finalStatus: 'completed',
-            summary: 'planned',
-          },
-        ],
-        [
-          'implement',
-          {
-            cli: 'codex',
-            sessionId: 's2',
-            model: 'gpt-5',
-            provider: 'openai',
-            durationMs: 3_400,
-            cost: 1.25,
-            tokens: { input: 300, output: 90, cacheRead: 20 },
-            turns: 4,
-            toolCalls: [],
-            errors: [{ turn: 2, text: 'Error: recovered after retry' }],
-            finalStatus: 'completed',
-            summary: 'implemented',
-          },
-        ],
-      ])
-    );
-
-    expect(output).toMatchInlineSnapshot(`
-      "  Step                  Status  Model                 Cost      Tokens    Duration      Errors
-        plan                  pass    claude-sonnet-4      $0.75         160          1s          --
-        implement             pass    gpt-5                $1.25         410          3s   1 (fixed)
-        ────────────────────────────────────────────────────────────────────────────────────────────
-        Total                                              $2.00         570          5s            "
-    `);
-  });
-
-  it('renders a failed step with the first error line', () => {
-    const output = formatRunSummaryTable(
-      [
-        {
-          name: 'broken-step',
-          agent: 'worker',
-          status: 'failed',
-          attempts: 1,
-          durationMs: 1_500,
-          error: 'boom',
-        },
-      ],
-      new Map([
-        [
-          'broken-step',
-          {
-            cli: 'opencode',
-            sessionId: 's3',
-            model: 'gpt-5',
-            provider: 'openai',
-            durationMs: 1_500,
-            cost: 0.01,
-            tokens: { input: 10, output: 5, cacheRead: 0 },
-            turns: 1,
-            toolCalls: [],
-            errors: [{ turn: 1, text: 'Error: database locked' }],
-            finalStatus: 'failed',
-            summary: null,
-          },
-        ],
-      ])
-    );
-
-    expect(output).toContain('broken-step           FAIL');
-    expect(output).toContain('  └─ Error [turn 1] Error: database locked');
-  });
-
-  it('renders deterministic steps without reports using placeholder columns', () => {
-    const output = formatRunSummaryTable(
-      [{ name: 'lint', agent: 'shell', status: 'completed', attempts: 1, durationMs: 900 }],
-      new Map()
-    );
-
-    expect(output).toContain('lint                  pass    --');
-    expect(output).toContain('--');
-    // No reports means no cost column
-    expect(output).not.toContain('Cost');
-  });
-
-  it('hides Cost column when no report has reliable cost data', () => {
-    const output = formatRunSummaryTable(
-      [{ name: 'gen-code', agent: 'worker', status: 'completed', attempts: 1, durationMs: 5_000 }],
-      new Map([
-        [
-          'gen-code',
-          {
-            cli: 'claude',
-            sessionId: 's1',
-            model: 'claude-sonnet-4',
-            provider: 'anthropic',
-            durationMs: 5_000,
-            cost: null,
-            tokens: { input: 200, output: 80, cacheRead: 0 },
-            turns: 3,
-            toolCalls: [],
-            errors: [],
-            finalStatus: 'completed',
-            summary: 'done',
-          },
-        ],
-      ])
-    );
-
-    expect(output).not.toContain('Cost');
-    expect(output).toContain('Tokens');
-    expect(output).toContain('280');
-  });
-});
-
-describe('WorkflowRunner logRunSummary', () => {
-  it('uses the table summary format even when no reports exist', () => {
-    const runner = new WorkflowRunner({ cwd: '/tmp/workflow-runner' });
-    const logSpy = vi.spyOn(console, 'log').mockImplementation(() => {});
-
-    (runner as any).logRunSummary(
-      'sample-workflow',
-      [{ name: 'lint', agent: 'shell', status: 'completed', attempts: 1, output: 'ok' }],
-      'run-1'
-    );
-
-    const combined = logSpy.mock.calls.flat().join('\n');
-    expect(combined).toContain('Workflow "sample-workflow"');
-    expect(combined).toContain('Step                  Status');
-    expect(combined).toContain('lint');
-    expect(combined).toContain('pass');
-
-    logSpy.mockRestore();
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/scrub-pty-chrome.test.ts b/packages/sdk/src/workflows/__tests__/scrub-pty-chrome.test.ts
deleted file mode 100644
index e9aeefec5..000000000
--- a/packages/sdk/src/workflows/__tests__/scrub-pty-chrome.test.ts
+++ /dev/null
@@ -1,125 +0,0 @@
-/**
- * Regression tests for WorkflowRunner.scrubForChannel — the function that
- * strips PTY/TUI chrome from interactive-agent step output before it gets
- * surfaced in workflow logs and channel messages.
- *
- * The patterns covered here are taken from a real captured run of a
- * multi-turn workflow against Claude Code's PTY: when its TUI footer
- * overwrites itself faster than the PTY flushes whitespace, lines like
- * `bypasspermissionson`, `--INSERT--⏵⏵`, and `Opus 4.7 (1M context) ctx:5%
- * $1.45` end up in the captured stream. Before these regex additions, the
- * step "Output:" block was unreadable on interactive-agent steps.
- */
-import { describe, it, expect } from 'vitest';
-
-import { WorkflowRunner } from '../runner.js';
-
-// scrubForChannel is `private static` — the cast is the minimal-invasive way
-// to exercise it from a test without exporting an internal-only helper.
-const scrub = (text: string): string =>
-  (WorkflowRunner as unknown as { scrubForChannel(t: string): string }).scrubForChannel(text);
-
-describe('WorkflowRunner.scrubForChannel — PTY chrome stripping', () => {
-  it('strips the Claude Code bottom status bar (model + ctx% + cost)', () => {
-    const input = [
-      'real content line',
-      'workflows git:(main) Opus 4.7 (1M context) ctx:5% $1.45',
-      'Opus4.7(1Mcontext) ctx:6% $1.54',
-      'another real line',
-    ].join('\n');
-    const out = scrub(input);
-    expect(out).toContain('real content line');
-    expect(out).toContain('another real line');
-    expect(out).not.toMatch(/ctx\s*:\s*\d+%/);
-    expect(out).not.toMatch(/\$\d+\.\d+/);
-  });
-
-  it('strips vim-style mode indicators emitted by the input bar', () => {
-    const input = [
-      'pre-mode line',
-      '--INSERT--',
-      '--INSERT--⏵⏵bypasspermissionson (shift+tabtocycle)',
-      'post-mode line',
-    ].join('\n');
-    const out = scrub(input);
-    expect(out).toContain('pre-mode line');
-    expect(out).toContain('post-mode line');
-    expect(out).not.toMatch(/--INSERT--/);
-  });
-
-  it('strips no-whitespace TUI hint variants (bypasspermissionson, pasteagaintoexpand)', () => {
-    const input = ['before', 'bypasspermissionson', 'pasteagaintoexpand', 'shifttabto cycle', 'after'].join(
-      '\n'
-    );
-    const out = scrub(input);
-    expect(out).toContain('before');
-    expect(out).toContain('after');
-    expect(out).not.toMatch(/bypasspermissionson/);
-    expect(out).not.toMatch(/pasteagaintoexpand/);
-  });
-
-  it('strips thinking-status fragments without ellipsis anchors', () => {
-    const input = [
-      'meaningful: round 3 codex-player guess=19 feedback=correct',
-      'thinking with high effort',
-      '↓ 13 tokens · thinking with high effort',
-      'Crunched for 32s',
-      'Sautéed for 4s',
-      'Gitifying…55',
-    ].join('\n');
-    const out = scrub(input);
-    expect(out).toContain('feedback=correct');
-    expect(out).not.toMatch(/thinking with high effort/);
-    expect(out).not.toMatch(/Crunched for/);
-    expect(out).not.toMatch(/Gitifying/);
-  });
-
-  it('strips malformed overwritten q0/qW0 PTY frame runs', () => {
-    const input = [
-      'first useful line',
-      'qW0 | q0 / ql0 _ qqm ~ lqq = qW0 | q0 / ql0 _ qqm',
-      'summary: kept qW0 | q0 / ql0 _ qqm ~ lqq = qW0 | q0 done',
-      'last useful line',
-    ].join('\n');
-    const out = scrub(input);
-    expect(out).toContain('first useful line');
-    expect(out).toContain('last useful line');
-    expect(out).toMatch(/summary: kept\s+done/);
-    expect(out).not.toMatch(/qW0|ql0|qqm|lqq/);
-  });
-
-  it('redacts secrets in the runner public preview path', () => {
-    const out = scrub('deploy succeeded\napi_key=sk-abcdefghijklmnopqrstuvwxyz123456\n');
-    expect(out).toContain('deploy succeeded');
-    expect(out).toContain('[REDACTED]');
-    expect(out).not.toContain('sk-abcdefghijklmnopqrstuvwxyz123456');
-  });
-
-  it('preserves real content and OWNER_DECISION signals', () => {
-    const input = [
-      'Read 1 file, calling relaycast 2 times',
-      'Transcript verification reports TRANSCRIPT_OK with all 6 lines well-formed.',
-      'OWNER_DECISION: COMPLETE',
-      'REASON: All 6 turns executed, history.log has 6 lines.',
-      'STEP_COMPLETE: repair-transcript',
-    ].join('\n');
-    const out = scrub(input);
-    expect(out).toContain('TRANSCRIPT_OK');
-    expect(out).toContain('OWNER_DECISION: COMPLETE');
-    expect(out).toContain('STEP_COMPLETE: repair-transcript');
-    expect(out).toContain('All 6 turns executed');
-  });
-
-  it('does not strip lines that merely mention model names in prose', () => {
-    // Guard against the new claudeFooterRe (which looks for `Opus|Sonnet|Haiku <num>
-    // (...context...) ctx:N%`) being too eager and removing prose that
-    // mentions a model name.
-    const input = [
-      'Compared output from Opus 4.7 against Sonnet 4.6 — both passed.',
-      'We chose Haiku 4.5 for its latency profile.',
-    ].join('\n');
-    const out = scrub(input);
-    expect(out).toContain('Opus 4.7 against Sonnet 4.6');
-    expect(out).toContain('Haiku 4.5 for its latency profile');
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/sibling-links.test.ts b/packages/sdk/src/workflows/__tests__/sibling-links.test.ts
deleted file mode 100644
index 2ec049be5..000000000
--- a/packages/sdk/src/workflows/__tests__/sibling-links.test.ts
+++ /dev/null
@@ -1,185 +0,0 @@
-import { describe, expect, it, vi } from 'vitest';
-
-import { applySiblingLinks, buildSiblingLinkScript } from '../sibling-links.js';
-
-describe('buildSiblingLinkScript', () => {
-  it('detects npm manifest and emits an npm link block', () => {
-    const script = buildSiblingLinkScript([{ name: '@scope/pkg', path: '../sibling/packages/pkg' }]);
-    expect(script).toContain('-f "$SIBLING_PATH/package.json"');
-    expect(script).toContain('npm link --silent');
-    expect(script).toContain('@scope/pkg');
-    expect(script).toContain('../sibling/packages/pkg');
-  });
-
-  it('detects python manifest and emits a pip install -e block', () => {
-    const script = buildSiblingLinkScript([{ name: 'my_pkg', path: '../py/pkg' }]);
-    expect(script).toContain('-f "$SIBLING_PATH/pyproject.toml"');
-    expect(script).toContain('pip install -e');
-    expect(script).toContain('uv pip install --system -e');
-  });
-
-  it('fails-fast shell: script uses set -euo pipefail', () => {
-    const script = buildSiblingLinkScript([{ name: 'x', path: './x' }]);
-    expect(script.startsWith('set -euo pipefail')).toBe(true);
-  });
-
-  it('guards missing sibling path with explicit error', () => {
-    const script = buildSiblingLinkScript([{ name: 'x', path: '../missing' }]);
-    expect(script).toContain('SIBLING_PATH_MISSING');
-    expect(script).toContain('exit 1');
-  });
-
-  it('guards unknown manifest with explicit error', () => {
-    const script = buildSiblingLinkScript([{ name: 'x', path: './x' }]);
-    expect(script).toContain('UNKNOWN_MANIFEST');
-  });
-
-  it('emits one verify block per link with expected exports', () => {
-    const script = buildSiblingLinkScript([
-      { name: 'pkg-a', path: '../a', expect: ['foo', 'bar'] },
-      { name: 'pkg-b', path: '../b' },
-      { name: 'pkg-c', path: '../c', expect: ['baz'] },
-    ]);
-    const verifyCount = (script.match(/APPLY_SIBLING_LINKS_EXPECT/g) ?? []).length;
-    // Two verify blocks (for pkg-a + pkg-c), each referenced at least twice
-    // (env var declaration + two command variants for node/python fallback).
-    expect(verifyCount).toBeGreaterThanOrEqual(4);
-    expect(script).toContain('APPLY_SIBLING_LINKS_OK');
-  });
-
-  it('expects-list survives bash env var round-trip via single-quoted JSON payload', () => {
-    const script = buildSiblingLinkScript([{ name: 'p', path: './p', expect: ["it's-ok", 'with"quote'] }]);
-    // Assignment is `EXPECT='<JSON>'` where the JSON is single-quoted so
-    // bash leaves it literal (no `$` / backtick substitution), then
-    // Node/Python JSON.parse it back to the original array. Embedded `'`
-    // gets the '\'' POSIX-escape treatment.
-    const jsonPayload = JSON.stringify(["it's-ok", 'with"quote']);
-    const shellArg = `'${jsonPayload.replace(/'/g, `'\\''`)}'`;
-    expect(script).toContain(`EXPECT=${shellArg}`);
-  });
-
-  it('emits both node and python verifiers wrapped in manifest-conditional', () => {
-    const script = buildSiblingLinkScript([{ name: 'p', path: './p', expect: ['x'] }]);
-    expect(script).toContain('node --input-type=module');
-    expect(script).toContain('python3 -c');
-    // The wrapping if/elif/else pattern keeps python as a fallback inside
-    // the non-package.json branch.
-    expect(script).toMatch(/if \[ -f "\$SIBLING_PATH\/package\.json" \]; then[\s\S]+?else[\s\S]+?python/);
-  });
-
-  it('assignments use single-quoted literals so $() / backticks do not substitute (review: shell injection)', () => {
-    // Two-stage review fix:
-    //   (1) echo happens AFTER assignments and references the shell vars,
-    //       not raw link.name / link.path template interpolation.
-    //   (2) assignments themselves use SINGLE-quoted bash literals so that
-    //       `$(cmd)` and backticks inside the value are NOT interpreted as
-    //       command substitution (which JSON.stringify / double-quoted form
-    //       did NOT protect against).
-    const script = buildSiblingLinkScript([{ name: 'pkg$(evil)', path: '../path`also-evil`' }]);
-    const echoLines = script.split('\n').filter((l) => l.startsWith('echo "--- link:'));
-    expect(echoLines).toHaveLength(1);
-    expect(echoLines[0]).toBe('echo "--- link: $SIBLING_NAME <- $SIBLING_PATH ---"');
-    const assignmentLines = script
-      .split('\n')
-      .filter((l) => l.startsWith('SIBLING_NAME=') || l.startsWith('SIBLING_PATH='));
-    // Assignments should wrap the value in single quotes — the exact literal
-    // passes through bash. `$(evil)` sits inside single quotes → no
-    // substitution; same for backticks.
-    expect(assignmentLines.some((l) => l === "SIBLING_NAME='pkg$(evil)'")).toBe(true);
-    expect(assignmentLines.some((l) => l === "SIBLING_PATH='../path`also-evil`'")).toBe(true);
-    // Sanity: no double-quoted assignment form present for these lines.
-    expect(assignmentLines.some((l) => l.startsWith('SIBLING_NAME="'))).toBe(false);
-    expect(assignmentLines.some((l) => l.startsWith('SIBLING_PATH="'))).toBe(false);
-  });
-
-  it("escapes embedded single quotes in link values via POSIX '\\'' idiom", () => {
-    const script = buildSiblingLinkScript([{ name: "pkg'q", path: "../p'q" }]);
-    expect(script).toContain("SIBLING_NAME='pkg'\\''q'");
-    expect(script).toContain("SIBLING_PATH='../p'\\''q'");
-  });
-
-  it('uv is invoked with --system and falls through to pip on failure (review: non-venv)', () => {
-    // Fix for review: uv refuses to install outside a venv without --system.
-    // The dispatch now uses --system AND wraps the uv attempt in an `if` so
-    // failure falls through to pip/pip3 instead of exiting under `set -e`.
-    const script = buildSiblingLinkScript([{ name: 'p', path: '../p' }]);
-    expect(script).toContain('uv pip install --system -e');
-    expect(script).toMatch(
-      /if command -v uv[^\n]+uv pip install --system[^\n]+; then\s*\n\s*:\s*\n\s*elif command -v pip/
-    );
-  });
-
-  it('python verifier avoids backslashes inside f-string expressions (review: Python < 3.12 SyntaxError)', () => {
-    // Fix for review: backslashes (e.g. `\",\"`) inside f-string expression
-    // braces are a SyntaxError on Python < 3.12. We bind `sep = ","` outside
-    // the f-string and reference it from inside. The old escaped form must
-    // not appear anywhere in the emitted script.
-    const script = buildSiblingLinkScript([{ name: 'p', path: './p', expect: ['foo'] }]);
-    expect(script).toContain('sep = ","');
-    expect(script).toContain('sep.join(missing)');
-    expect(script).toContain('sep.join(want)');
-    expect(script).not.toContain('\\",\\".join(');
-  });
-});
-
-describe('applySiblingLinks', () => {
-  it('is a no-op when links is empty', () => {
-    const builder = { step: vi.fn() };
-    const result = applySiblingLinks(builder, { links: [] });
-    expect(builder.step).not.toHaveBeenCalled();
-    expect(result).toBe(builder);
-  });
-
-  it('adds a single deterministic step named setup-sibling-links by default', () => {
-    const builder = { step: vi.fn(() => builder) };
-    applySiblingLinks(builder, {
-      links: [{ name: 'pkg', path: '../pkg' }],
-    });
-    expect(builder.step).toHaveBeenCalledTimes(1);
-    const call = builder.step.mock.calls[0] as unknown as
-      | [string, { command: string; [k: string]: unknown }]
-      | undefined;
-    if (!call) throw new Error('expected step call');
-    const [stepName, cfg] = call;
-    expect(stepName).toBe('setup-sibling-links');
-    expect(cfg).toMatchObject({
-      type: 'deterministic',
-      dependsOn: ['install-deps'],
-      captureOutput: true,
-      failOnError: true,
-    });
-    expect(cfg.command).toContain("bash -c '");
-  });
-
-  it('honors custom stepName and dependsOn', () => {
-    const builder = { step: vi.fn(() => builder) };
-    applySiblingLinks(builder, {
-      links: [{ name: 'pkg', path: '../pkg' }],
-      stepName: 'custom-name',
-      dependsOn: ['setup-branch'],
-    });
-    const call = builder.step.mock.calls[0] as unknown as
-      | [string, { command: string; [k: string]: unknown }]
-      | undefined;
-    if (!call) throw new Error('expected step call');
-    const [stepName, cfg] = call;
-    expect(stepName).toBe('custom-name');
-    expect(cfg).toMatchObject({ dependsOn: ['setup-branch'] });
-  });
-
-  it('escapes single quotes in the embedded script safely for bash -c', () => {
-    const builder = { step: vi.fn(() => builder) };
-    applySiblingLinks(builder, {
-      links: [{ name: "has'quote", path: "./path'with-quote" }],
-    });
-    const call = builder.step.mock.calls[0] as unknown as [string, { command: string }] | undefined;
-    if (!call) throw new Error('expected step call');
-    const command = call[1].command;
-    // Verify the bash -c wrapper is well-formed: starts with bash -c ' and
-    // ends with matching close quote. The POSIX escape pattern is '\''
-    // (close-quote, escaped-quote, re-open-quote) — the end result should
-    // not have an odd number of unescaped single quotes.
-    expect(command.startsWith(`bash -c '`)).toBe(true);
-    expect(command.endsWith(`'`)).toBe(true);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/step-cwd.test.ts b/packages/sdk/src/workflows/__tests__/step-cwd.test.ts
deleted file mode 100644
index 4f9700b13..000000000
--- a/packages/sdk/src/workflows/__tests__/step-cwd.test.ts
+++ /dev/null
@@ -1,72 +0,0 @@
-import { describe, it, expect, vi } from 'vitest';
-import path from 'node:path';
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn(),
-  RelayError: class RelayError extends Error {},
-}));
-
-vi.mock('../../relay.js', () => ({
-  AgentRelay: vi.fn(),
-}));
-
-const { WorkflowRunner } = await import('../runner.js');
-
-describe('WorkflowRunner step cwd resolution', () => {
-  it('prefers step.cwd over agent.cwd and runner cwd', () => {
-    const runnerRoot = '/runner-root';
-    const runner = new WorkflowRunner({ cwd: runnerRoot });
-
-    const resolved = (runner as any).resolveEffectiveCwd(
-      { name: 'generate', agent: 'worker', task: 'Generate', cwd: 'steps/generate' },
-      { name: 'worker', cli: 'claude', cwd: 'agents/worker' }
-    );
-
-    expect(resolved).toBe(path.resolve(runnerRoot, 'steps/generate'));
-  });
-
-  it('respects step.cwd for deterministic steps', () => {
-    const runnerRoot = '/runner-root';
-    const runner = new WorkflowRunner({ cwd: runnerRoot });
-
-    const resolved = (runner as any).resolveEffectiveCwd({
-      name: 'scaffold',
-      type: 'deterministic',
-      command: 'mkdir -p out',
-      cwd: 'deterministic/setup',
-    });
-
-    expect(resolved).toBe(path.resolve(runnerRoot, 'deterministic/setup'));
-  });
-
-  it('falls back through step.cwd to step.workdir to agent.cwd to runner.cwd', () => {
-    const runnerRoot = '/runner-root';
-    const namedPath = '/named/workdir';
-    const runner = new WorkflowRunner({ cwd: runnerRoot });
-    (runner as any).resolvedPaths.set('generated', namedPath);
-
-    const agentDef = { name: 'worker', cli: 'claude', cwd: 'agents/worker' } as const;
-
-    expect(
-      (runner as any).resolveEffectiveCwd(
-        { name: 's1', agent: 'worker', task: 'Do work', cwd: 'steps/explicit', workdir: 'generated' },
-        agentDef
-      )
-    ).toBe(path.resolve(runnerRoot, 'steps/explicit'));
-
-    expect(
-      (runner as any).resolveEffectiveCwd(
-        { name: 's2', agent: 'worker', task: 'Do work', workdir: 'generated' },
-        agentDef
-      )
-    ).toBe(namedPath);
-
-    expect(
-      (runner as any).resolveEffectiveCwd({ name: 's3', agent: 'worker', task: 'Do work' }, agentDef)
-    ).toBe(path.resolve(runnerRoot, 'agents/worker'));
-
-    expect((runner as any).resolveEffectiveCwd({ name: 's4', type: 'deterministic', command: 'pwd' })).toBe(
-      runnerRoot
-    );
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/step-executor.test.ts b/packages/sdk/src/workflows/__tests__/step-executor.test.ts
deleted file mode 100644
index 7b289b95b..000000000
--- a/packages/sdk/src/workflows/__tests__/step-executor.test.ts
+++ /dev/null
@@ -1,456 +0,0 @@
-import { describe, it, expect, vi, beforeEach } from 'vitest';
-
-import { StepExecutor, type StepExecutorDeps, type StepResult } from '../step-executor.js';
-import type { ProcessSpawner } from '../process-spawner.js';
-import { createProcessSpawner } from '../process-spawner.js';
-import type { WorkflowStep, AgentDefinition, WorkflowStepStatus } from '../types.js';
-
-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-function makeStep(overrides: Partial<WorkflowStep> = {}): WorkflowStep {
-  return {
-    name: 'step-1',
-    type: 'deterministic',
-    command: 'echo hello',
-    ...overrides,
-  } as WorkflowStep;
-}
-
-function makeAgent(overrides: Partial<AgentDefinition> = {}): AgentDefinition {
-  return {
-    name: 'worker-1',
-    cli: 'claude',
-    role: 'specialist',
-    ...overrides,
-  } as AgentDefinition;
-}
-
-function mockSpawner(overrides: Partial<ProcessSpawner> = {}): ProcessSpawner {
-  return {
-    spawnShell: vi.fn(async () => ({ output: 'hello\n', exitCode: 0 })),
-    spawnAgent: vi.fn(async () => ({ output: 'done', exitCode: 0 })),
-    spawnInteractive: vi.fn(async () => ({ output: 'completed', exitCode: 0 })),
-    buildCommand: vi.fn(() => ({ bin: 'claude', args: ['--task', 'x'] })),
-    ...overrides,
-  };
-}
-
-function makeDeps(overrides: Partial<StepExecutorDeps> = {}): StepExecutorDeps {
-  return {
-    cwd: '/tmp/test-project',
-    runId: 'run-001',
-    postToChannel: vi.fn(),
-    persistStepRow: vi.fn(),
-    persistStepOutput: vi.fn(),
-    resolveTemplate: vi.fn((s: string) => s),
-    getStepOutput: vi.fn(() => ''),
-    checkAborted: vi.fn(),
-    waitIfPaused: vi.fn(async () => {}),
-    log: vi.fn(),
-    processSpawner: mockSpawner(),
-    ...overrides,
-  };
-}
-
-function createExecutor(overrides: Partial<StepExecutorDeps> = {}): StepExecutor {
-  return new StepExecutor(makeDeps(overrides));
-}
-
-// ── 1. Deterministic step execution ──────────────────────────────────────────
-
-describe('StepExecutor — deterministic steps', () => {
-  it('runs a shell command and captures stdout', async () => {
-    const executor = createExecutor();
-    const step = makeStep({ command: 'echo hello' });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.status).toBe('completed');
-    expect(result.output).toContain('hello');
-    expect(result.exitCode).toBe(0);
-  });
-
-  it('marks step failed on non-zero exit code', async () => {
-    const executor = createExecutor({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => ({ output: 'err', exitCode: 1 })),
-      }),
-    });
-    const step = makeStep({ command: 'false' });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.status).toBe('failed');
-    expect(result.exitCode).toBe(1);
-  });
-
-  it('succeeds with non-zero exit when failOnError is false', async () => {
-    const executor = createExecutor({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => ({ output: 'warn', exitCode: 1 })),
-      }),
-    });
-    const step = makeStep({ command: 'maybe-fail', failOnError: false });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.status).toBe('completed');
-  });
-});
-
-// ── 2. Non-interactive agent step ────────────────────────────────────────────
-
-describe('StepExecutor — non-interactive agent steps', () => {
-  it('spawns a codex worker and captures output', async () => {
-    const spawner = mockSpawner();
-    const executor = createExecutor({ processSpawner: spawner });
-    const agent = makeAgent({ cli: 'codex', name: 'codex-worker', interactive: false });
-    const step = makeStep({
-      name: 'codex-step',
-      type: 'agent',
-      agent: 'codex-worker',
-      task: 'Fix the bug',
-      command: undefined,
-    });
-    const agentMap = new Map([['codex-worker', agent]]);
-
-    const result = await executor.executeOne(step, agentMap);
-    expect(spawner.spawnAgent).toHaveBeenCalledWith(
-      agent,
-      'Fix the bug',
-      expect.objectContaining({ cwd: '/tmp/test-project' })
-    );
-    expect(result.status).toBe('completed');
-  });
-
-  it('fails when agent is not found in agentMap', async () => {
-    const executor = createExecutor();
-    const step = makeStep({
-      name: 'orphan',
-      type: 'agent',
-      agent: 'missing-agent',
-      task: 'Do stuff',
-      command: undefined,
-    });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.status).toBe('failed');
-    expect(result.error).toContain('not found');
-  });
-});
-
-// ── 3. Interactive agent step ────────────────────────────────────────────────
-
-describe('StepExecutor — interactive agent steps', () => {
-  it('spawns a claude lead via spawnInteractive', async () => {
-    const spawner = mockSpawner();
-    const executor = createExecutor({ processSpawner: spawner });
-    const agent = makeAgent({ cli: 'claude', name: 'lead-agent' });
-    const step = makeStep({
-      name: 'lead-step',
-      type: 'agent',
-      agent: 'lead-agent',
-      task: 'Coordinate work',
-      command: undefined,
-    });
-    const agentMap = new Map([['lead-agent', agent]]);
-
-    const result = await executor.executeOne(step, agentMap);
-    expect(spawner.spawnInteractive).toHaveBeenCalled();
-    expect(result.status).toBe('completed');
-  });
-});
-
-// ── 4. Step timeout handling ─────────────────────────────────────────────────
-
-describe('StepExecutor — timeout handling', () => {
-  it('passes timeoutMs through to process spawner', async () => {
-    const spawner = mockSpawner();
-    const executor = createExecutor({ processSpawner: spawner });
-    const step = makeStep({ command: 'sleep 60', timeoutMs: 5000 });
-
-    await executor.executeOne(step, new Map());
-    expect(spawner.spawnShell).toHaveBeenCalledWith('sleep 60', expect.objectContaining({ timeoutMs: 5000 }));
-  });
-
-  it('fails step when spawn rejects due to timeout', async () => {
-    const executor = createExecutor({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => {
-          throw new Error('Process timed out');
-        }),
-      }),
-    });
-    const step = makeStep({ command: 'sleep 60', timeoutMs: 100 });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.status).toBe('failed');
-    expect(result.error).toContain('timed out');
-  });
-});
-
-// ── 5. Step dependency resolution (dependsOn) ────────────────────────────────
-
-describe('StepExecutor — dependency resolution', () => {
-  it('returns only steps whose deps are all completed', () => {
-    const executor = createExecutor();
-    const steps = [
-      makeStep({ name: 'a' }),
-      makeStep({ name: 'b', dependsOn: ['a'] }),
-      makeStep({ name: 'c', dependsOn: ['a', 'b'] }),
-    ];
-    const statuses = new Map<string, WorkflowStepStatus>([
-      ['a', 'completed'],
-      ['b', 'pending'],
-      ['c', 'pending'],
-    ]);
-    const ready = executor.findReady(steps, statuses);
-    expect(ready.map((s) => s.name)).toEqual(['b']);
-  });
-
-  it('treats skipped deps as satisfied', () => {
-    const executor = createExecutor();
-    const steps = [makeStep({ name: 'a' }), makeStep({ name: 'b', dependsOn: ['a'] })];
-    const statuses = new Map<string, WorkflowStepStatus>([
-      ['a', 'skipped'],
-      ['b', 'pending'],
-    ]);
-    const ready = executor.findReady(steps, statuses);
-    expect(ready.map((s) => s.name)).toEqual(['b']);
-  });
-
-  it('returns steps with no deps when all are pending', () => {
-    const executor = createExecutor();
-    const steps = [makeStep({ name: 'a' }), makeStep({ name: 'b', dependsOn: ['a'] })];
-    const statuses = new Map<string, WorkflowStepStatus>([
-      ['a', 'pending'],
-      ['b', 'pending'],
-    ]);
-    const ready = executor.findReady(steps, statuses);
-    expect(ready.map((s) => s.name)).toEqual(['a']);
-  });
-
-  it('returns nothing when all deps are failed', () => {
-    const executor = createExecutor();
-    const steps = [makeStep({ name: 'a' }), makeStep({ name: 'b', dependsOn: ['a'] })];
-    const statuses = new Map<string, WorkflowStepStatus>([
-      ['a', 'failed'],
-      ['b', 'pending'],
-    ]);
-    const ready = executor.findReady(steps, statuses);
-    expect(ready.map((s) => s.name)).toEqual([]);
-  });
-});
-
-// ── 6. Step output capture and storage ───────────────────────────────────────
-
-describe('StepExecutor — output capture', () => {
-  it('persists step output after successful completion', async () => {
-    const deps = makeDeps();
-    const executor = new StepExecutor(deps);
-    const step = makeStep({ command: 'echo result-data' });
-
-    await executor.executeOne(step, new Map());
-    expect(deps.persistStepOutput).toHaveBeenCalledWith(
-      'run-001',
-      'step-1',
-      expect.stringContaining('hello')
-    );
-  });
-
-  it('persists step row status on completion', async () => {
-    const deps = makeDeps();
-    const executor = new StepExecutor(deps);
-    const step = makeStep({ command: 'echo ok' });
-
-    await executor.executeOne(step, new Map());
-    expect(deps.persistStepRow).toHaveBeenCalledWith(
-      expect.any(String),
-      expect.objectContaining({ status: 'completed' })
-    );
-  });
-
-  it('captures output on failure', async () => {
-    const deps = makeDeps({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => ({ output: 'error: not found', exitCode: 1 })),
-      }),
-    });
-    const executor = new StepExecutor(deps);
-    const step = makeStep({ command: 'bad-command' });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.output).toContain('error: not found');
-  });
-
-  it('suppresses output when captureOutput is false', async () => {
-    const executor = createExecutor();
-    const step = makeStep({ command: 'echo secret', captureOutput: false });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.output).toContain('Command completed');
-    expect(result.output).not.toContain('hello');
-  });
-});
-
-// ── 7. Step retry on failure ─────────────────────────────────────────────────
-
-describe('StepExecutor — retry logic', () => {
-  // Note: monitorStep retries on thrown errors (spawn failures), not on non-zero exit codes.
-  // Non-zero exit codes are handled by toCompletionResult and produce immediate failure.
-
-  it('retries when spawn throws an error', async () => {
-    let attempt = 0;
-    const executor = createExecutor({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => {
-          attempt++;
-          if (attempt < 3) throw new Error('connection refused');
-          return { output: 'ok', exitCode: 0 };
-        }),
-      }),
-    });
-    const step = makeStep({ command: 'flaky', retries: 3 });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.status).toBe('completed');
-    expect(result.retries).toBe(2);
-  });
-
-  it('fails after exhausting retries on thrown errors', async () => {
-    const executor = createExecutor({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => {
-          throw new Error('always fails');
-        }),
-      }),
-    });
-    const step = makeStep({ command: 'always-fail', retries: 2 });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.status).toBe('failed');
-    expect(result.retries).toBe(2);
-    expect(result.error).toContain('always fails');
-  });
-
-  it('does not retry on non-zero exit code (immediate failure)', async () => {
-    const spawnShell = vi.fn(async () => ({ output: 'fail', exitCode: 1 }));
-    const executor = createExecutor({
-      processSpawner: mockSpawner({ spawnShell }),
-    });
-    const step = makeStep({ command: 'bad', retries: 3 });
-    const result = await executor.executeOne(step, new Map());
-    expect(result.status).toBe('failed');
-    // Called only once — no retries for clean non-zero exits
-    expect(spawnShell).toHaveBeenCalledTimes(1);
-  });
-
-  it('calls onStepRetried callback on each retry', async () => {
-    const onStepRetried = vi.fn();
-    let attempt = 0;
-    const executor = createExecutor({
-      onStepRetried,
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => {
-          attempt++;
-          if (attempt < 2) throw new Error('transient');
-          return { output: 'ok', exitCode: 0 };
-        }),
-      }),
-    });
-    const step = makeStep({ command: 'flaky', retries: 2 });
-    await executor.executeOne(step, new Map());
-    expect(onStepRetried).toHaveBeenCalledTimes(1);
-  });
-});
-
-// ── 8. Process spawner — command building ────────────────────────────────────
-
-describe('ProcessSpawner — buildCommand', () => {
-  it('builds claude CLI command', () => {
-    const spawner = createProcessSpawner({ cwd: '/tmp' });
-    const agent = makeAgent({ cli: 'claude', name: 'claude-worker' });
-    const cmd = spawner.buildCommand(agent, 'Do the task');
-    expect(cmd.bin).toBe('claude');
-    expect(cmd.args).toContain('Do the task');
-  });
-
-  it('builds codex CLI command', () => {
-    const spawner = createProcessSpawner({ cwd: '/tmp' });
-    const agent = makeAgent({ cli: 'codex', name: 'codex-worker' });
-    const cmd = spawner.buildCommand(agent, 'Fix bug');
-    expect(cmd.bin).toBe('codex');
-    expect(cmd.args).toContain('Fix bug');
-  });
-
-  it('builds aider CLI command', () => {
-    const spawner = createProcessSpawner({ cwd: '/tmp' });
-    const agent = makeAgent({ cli: 'aider', name: 'aider-worker' });
-    const cmd = spawner.buildCommand(agent, 'Refactor');
-    expect(cmd.bin).toBe('aider');
-    expect(cmd.args).toContain('Refactor');
-  });
-
-  it('builds gemini CLI command', () => {
-    const spawner = createProcessSpawner({ cwd: '/tmp' });
-    const agent = makeAgent({ cli: 'gemini', name: 'gemini-worker' });
-    const cmd = spawner.buildCommand(agent, 'Analyze');
-    expect(cmd.bin).toBe('gemini');
-    expect(cmd.args).toContain('Analyze');
-  });
-});
-
-// ── 9. executeAll — DAG orchestration ────────────────────────────────────────
-
-describe('StepExecutor — executeAll', () => {
-  it('executes steps in dependency order', async () => {
-    const order: string[] = [];
-    const executor = createExecutor({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => {
-          return { output: 'ok', exitCode: 0 };
-        }),
-      }),
-      onStepStarted: vi.fn((step) => {
-        order.push(step.name);
-      }),
-    });
-    const steps = [
-      makeStep({ name: 'a', command: 'echo a' }),
-      makeStep({ name: 'b', command: 'echo b', dependsOn: ['a'] }),
-    ];
-
-    const results = await executor.executeAll(steps, new Map());
-    expect(results.size).toBe(2);
-    expect(order).toEqual(['a', 'b']);
-    expect(results.get('a')?.status).toBe('completed');
-    expect(results.get('b')?.status).toBe('completed');
-  });
-
-  it('skips downstream steps on fail-fast', async () => {
-    const executor = createExecutor({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => ({ output: 'err', exitCode: 1 })),
-      }),
-      markDownstreamSkipped: vi.fn(),
-    });
-    const steps = [
-      makeStep({ name: 'a', command: 'fail' }),
-      makeStep({ name: 'b', command: 'echo b', dependsOn: ['a'] }),
-    ];
-
-    await expect(executor.executeAll(steps, new Map(), { strategy: 'fail-fast' })).rejects.toThrow(
-      'Step "a" failed'
-    );
-  });
-
-  it('continues past failures with continue strategy', async () => {
-    let callCount = 0;
-    const executor = createExecutor({
-      processSpawner: mockSpawner({
-        spawnShell: vi.fn(async () => {
-          callCount++;
-          if (callCount === 1) return { output: 'err', exitCode: 1 };
-          return { output: 'ok', exitCode: 0 };
-        }),
-      }),
-      markDownstreamSkipped: vi.fn(),
-    });
-    const steps = [
-      makeStep({ name: 'a', command: 'fail' }),
-      makeStep({ name: 'c', command: 'echo c' }), // no dependency on a
-    ];
-
-    const results = await executor.executeAll(steps, new Map(), { strategy: 'continue' });
-    expect(results.get('a')?.status).toBe('failed');
-    expect(results.get('c')?.status).toBe('completed');
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/template-resolver.test.ts b/packages/sdk/src/workflows/__tests__/template-resolver.test.ts
deleted file mode 100644
index 0d0076c8b..000000000
--- a/packages/sdk/src/workflows/__tests__/template-resolver.test.ts
+++ /dev/null
@@ -1,164 +0,0 @@
-import { describe, expect, it } from 'vitest';
-
-// Import from the module that will be extracted from runner.ts
-import { resolveStepOutputRef, resolveTemplate, TemplateResolver } from '../template-resolver.js';
-
-describe('TemplateResolver', () => {
-  const resolver = new TemplateResolver();
-
-  describe('resolveTemplate', () => {
-    it('replaces non-step placeholders and preserves deferred step outputs', () => {
-      const result = resolveTemplate('Deploy {{env}} after {{steps.plan.output}}', { env: 'prod' });
-      expect(result).toBe('Deploy prod after {{steps.plan.output}}');
-    });
-
-    it('throws on unresolved placeholders', () => {
-      expect(() => resolveTemplate('Deploy {{missing}}', {})).toThrow('Unresolved variable: {{missing}}');
-    });
-  });
-
-  describe('resolveStepOutputRef', () => {
-    it('resolves a completed step output by reference', () => {
-      const stepOutputs = new Map([['plan', 'Build a REST API']]);
-      expect(resolveStepOutputRef('steps.plan.output', stepOutputs)).toBe('Build a REST API');
-    });
-
-    it('accepts references wrapped in template braces', () => {
-      const stepOutputs = new Map([['code', 'Created 3 files']]);
-      expect(resolveStepOutputRef('{{steps.code.output}}', stepOutputs)).toBe('Created 3 files');
-    });
-  });
-
-  describe('resolveVariables', () => {
-    it('replaces simple {{var}} placeholders in agent tasks', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { mode: 'coordinate' as const },
-        agents: [{ name: 'a1', cli: 'claude', task: 'Deploy {{env}} to {{region}}' }],
-      };
-      const result = resolver.resolveVariables(config as any, { env: 'staging', region: 'us-east-1' });
-      expect(result.agents[0].task).toBe('Deploy staging to us-east-1');
-    });
-
-    it('replaces variables in workflow step tasks and commands', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { mode: 'coordinate' as const },
-        agents: [],
-        workflows: [
-          {
-            name: 'wf1',
-            steps: [
-              { name: 's1', task: 'Build {{project}}', agent: 'a1' },
-              { name: 's2', command: 'deploy --env={{env}}' },
-            ],
-          },
-        ],
-      };
-      const result = resolver.resolveVariables(config as any, { project: 'relay', env: 'prod' });
-      expect(result.workflows![0].steps[0].task).toBe('Build relay');
-      expect(result.workflows![0].steps[1].command).toBe("deploy --env='prod'");
-    });
-
-    it('replaces variables in step params', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { mode: 'coordinate' as const },
-        agents: [],
-        workflows: [
-          {
-            name: 'wf1',
-            steps: [{ name: 's1', agent: 'a1', params: { url: '{{base_url}}/api', count: 42 } }],
-          },
-        ],
-      };
-      const result = resolver.resolveVariables(config as any, { base_url: 'https://example.com' });
-      expect((result.workflows![0].steps[0].params as any).url).toBe('https://example.com/api');
-      // Non-string params are left untouched
-      expect((result.workflows![0].steps[0].params as any).count).toBe(42);
-    });
-
-    it('preserves {{steps.X.output}} placeholders for later resolution', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { mode: 'coordinate' as const },
-        agents: [{ name: 'a1', cli: 'claude', task: 'Use {{steps.plan.output}} for {{env}}' }],
-      };
-      const result = resolver.resolveVariables(config as any, { env: 'prod' });
-      expect(result.agents[0].task).toBe('Use {{steps.plan.output}} for prod');
-    });
-
-    it('throws on unresolved non-step variables', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { mode: 'coordinate' as const },
-        agents: [{ name: 'a1', cli: 'claude', task: 'Deploy to {{missing_var}}' }],
-      };
-      expect(() => resolver.resolveVariables(config as any, {})).toThrow(
-        'Unresolved variable: {{missing_var}}'
-      );
-    });
-
-    it('does not mutate the original config', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { mode: 'coordinate' as const },
-        agents: [{ name: 'a1', cli: 'claude', task: 'Deploy {{env}}' }],
-      };
-      resolver.resolveVariables(config as any, { env: 'staging' });
-      expect(config.agents[0].task).toBe('Deploy {{env}}');
-    });
-  });
-
-  describe('resolveDotPath', () => {
-    it('resolves nested dot-path variables', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { mode: 'coordinate' as const },
-        agents: [{ name: 'a1', cli: 'claude', task: 'Region: {{aws.region}}' }],
-      };
-      const vars = { aws: { region: 'us-west-2' } } as any;
-      const result = resolver.resolveVariables(config as any, vars);
-      expect(result.agents[0].task).toBe('Region: us-west-2');
-    });
-
-    it('throws for undefined nested paths', () => {
-      const config = {
-        version: '1',
-        name: 'test',
-        swarm: { mode: 'coordinate' as const },
-        agents: [{ name: 'a1', cli: 'claude', task: '{{a.b.c}}' }],
-      };
-      expect(() => resolver.resolveVariables(config as any, { a: { b: {} } } as any)).toThrow(
-        'Unresolved variable: {{a.b.c}}'
-      );
-    });
-  });
-
-  describe('interpolateStepTask', () => {
-    it('resolves step output references from completed steps', () => {
-      const template = 'Review: {{steps.plan.output}} and {{steps.code.output}}';
-      const context = {
-        steps: {
-          plan: { output: 'Build a REST API' },
-          code: { output: 'Created 3 files' },
-        },
-      } as any;
-      const result = resolver.interpolateStepTask(template, context);
-      expect(result).toBe('Review: Build a REST API and Created 3 files');
-    });
-
-    it('leaves unresolved step references intact', () => {
-      const template = 'Use {{steps.future.output}} later';
-      const result = resolver.interpolateStepTask(template, { steps: {} } as any);
-      expect(result).toBe('Use {{steps.future.output}} later');
-    });
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/verification-custom.test.ts b/packages/sdk/src/workflows/__tests__/verification-custom.test.ts
deleted file mode 100644
index 0c737cc90..000000000
--- a/packages/sdk/src/workflows/__tests__/verification-custom.test.ts
+++ /dev/null
@@ -1,292 +0,0 @@
-import { EventEmitter } from 'node:events';
-import { mkdtempSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import { afterEach, beforeEach, describe, expect, it, vi } from 'vitest';
-
-import type { WorkflowDb } from '../runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../types.js';
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: {
-    register: vi.fn().mockResolvedValue({ token: 'token-1' }),
-  },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: class RelayError extends Error {},
-}));
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockRelayInstance = {
-  spawnPty: vi.fn(),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-  addListener: vi.fn(() => () => {}),
-};
-
-vi.mock('../../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-type QueuedSubprocessResult = {
-  stdout?: string;
-  stderr?: string;
-  code?: number | null;
-  signal?: string | null;
-  error?: Error;
-  beforeClose?: () => void;
-};
-
-let queuedSubprocessResults: QueuedSubprocessResult[] = [];
-
-const mockSubprocessSpawn = vi.fn().mockImplementation((_cmd, _args, _options) => {
-  const result = queuedSubprocessResults.shift() ?? { stdout: 'done\n', code: 0 };
-  const child = new EventEmitter() as EventEmitter & {
-    stdout: EventEmitter;
-    stderr: EventEmitter;
-    pid: number;
-    kill: ReturnType<typeof vi.fn>;
-  };
-
-  child.stdout = new EventEmitter();
-  child.stderr = new EventEmitter();
-  child.pid = 4321;
-  child.kill = vi.fn();
-
-  queueMicrotask(() => {
-    if (result.error) {
-      child.emit('error', result.error);
-      return;
-    }
-    if (result.stdout) {
-      child.stdout.emit('data', Buffer.from(result.stdout));
-    }
-    if (result.stderr) {
-      child.stderr.emit('data', Buffer.from(result.stderr));
-    }
-    result.beforeClose?.();
-    child.emit('close', result.code ?? 0, result.signal ?? null);
-  });
-
-  return child;
-});
-
-vi.mock('node:child_process', async () => {
-  const actual = await vi.importActual<typeof import('node:child_process')>('node:child_process');
-  return {
-    ...actual,
-    spawn: mockSubprocessSpawn,
-  };
-});
-
-const { WorkflowRunner } = await import('../runner.js');
-const { runVerification } = await import('../verification.js');
-
-const noopSideEffects = {
-  recordStepToolSideEffect: vi.fn(),
-  getOrCreateStepEvidenceRecord: vi.fn(() => ({
-    evidence: { coordinationSignals: [] },
-  })),
-  log: vi.fn(),
-};
-
-const tempDirs: string[] = [];
-
-function run(check: Parameters<typeof runVerification>[0], output = 'worker output', cwd?: string) {
-  return runVerification(
-    check,
-    output,
-    'custom-step',
-    undefined,
-    { allowFailure: true, cwd },
-    noopSideEffects
-  );
-}
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (runRow: WorkflowRunRow) => {
-      runs.set(runRow.id, { ...runRow });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const runRow = runs.get(id);
-      return runRow ? { ...runRow } : null;
-    }),
-    insertStep: vi.fn(async (stepRow: WorkflowStepRow) => {
-      steps.set(stepRow.id, { ...stepRow });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((stepRow) => stepRow.runId === runId);
-    }),
-  };
-}
-
-function makeConfig(projectDir: string, verificationValue: string): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'verification-custom',
-    swarm: { pattern: 'dag' },
-    errorHandling: {
-      strategy: 'retry',
-      retryDelayMs: 0,
-    },
-    agents: [{ name: 'worker', cli: 'claude', interactive: false }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'custom-step',
-            agent: 'worker',
-            task: 'Implement the requested change',
-            retries: 1,
-            cwd: projectDir,
-            verification: {
-              type: 'custom',
-              value: verificationValue,
-            },
-          },
-        ],
-      },
-    ],
-    trajectories: false,
-  };
-}
-
-describe('custom verification', () => {
-  beforeEach(() => {
-    vi.clearAllMocks();
-    queuedSubprocessResults = [];
-  });
-
-  afterEach(() => {
-    while (tempDirs.length > 0) {
-      const dir = tempDirs.pop();
-      if (dir) rmSync(dir, { recursive: true, force: true });
-    }
-  });
-
-  it('custom verification with command that exits 0 passes', () => {
-    const result = run({ type: 'custom', value: 'echo ok' });
-
-    expect(result.passed).toBe(true);
-    expect(result.completionReason).toBe('completed_verified');
-  });
-
-  it('custom verification with command that exits non-zero fails', () => {
-    const result = run({ type: 'custom', value: 'exit 1' });
-
-    expect(result.passed).toBe(false);
-    expect(result.completionReason).toBe('failed_verification');
-    expect(result.error).toContain('custom check "exit 1" failed');
-    expect(result.error).toContain('Command failed: exit 1');
-  });
-
-  it('custom verification captures stderr in failure message', () => {
-    const result = run({
-      type: 'custom',
-      value: "echo 'compile error: missing semicolon' >&2; exit 1",
-    });
-
-    expect(result.passed).toBe(false);
-    expect(result.error).toContain('compile error: missing semicolon');
-  });
-
-  it('custom verification with no value preserves legacy no-op', () => {
-    const result = run({ type: 'custom', value: '' });
-
-    expect(result).toEqual({ passed: false });
-  });
-
-  it('custom verification respects cwd', () => {
-    const tempDir = mkdtempSync(path.join(os.tmpdir(), 'verification-custom-cwd-'));
-    tempDirs.push(tempDir);
-    writeFileSync(path.join(tempDir, 'myfile.txt'), 'present');
-
-    const result = run({ type: 'custom', value: 'test -f myfile.txt' }, 'worker output', tempDir);
-
-    expect(result.passed).toBe(true);
-    expect(result.completionReason).toBe('completed_verified');
-  });
-
-  it('custom verification timeout kills long-running command', () => {
-    const result = run({ type: 'custom', value: 'sleep 60', timeoutMs: 1000 });
-
-    expect(result.passed).toBe(false);
-    expect(result.completionReason).toBe('failed_verification');
-    expect(result.error).toContain('sleep 60');
-    expect(result.error).toMatch(/ETIMEDOUT|timed out/i);
-  });
-
-  it('verification failure output appears in retry prompt', async () => {
-    const projectDir = mkdtempSync(path.join(os.tmpdir(), 'verification-custom-runner-'));
-    tempDirs.push(projectDir);
-
-    const verificationValue =
-      `sh -c 'if [ -f ready.txt ]; then exit 0; ` +
-      `else echo "compile error: missing semicolon" >&2; exit 1; fi'`;
-
-    queuedSubprocessResults = [
-      {
-        stdout: 'first attempt\n',
-        code: 0,
-      },
-      {
-        stdout: 'second attempt\n',
-        code: 0,
-        beforeClose: () => {
-          writeFileSync(path.join(projectDir, 'ready.txt'), 'ok');
-        },
-      },
-    ];
-
-    const runner = new WorkflowRunner({
-      cwd: projectDir,
-      db: makeDb(),
-      workspaceId: 'ws-test',
-    });
-
-    const result = await runner.execute(makeConfig(projectDir, verificationValue), 'default');
-
-    expect(result.status, result.error).toBe('completed');
-    expect(mockSubprocessSpawn).toHaveBeenCalledTimes(2);
-
-    const retryArgs = mockSubprocessSpawn.mock.calls[1]?.[1] as string[] | undefined;
-    const retryPrompt = retryArgs?.find((arg) => arg.includes('[RETRY')) ?? retryArgs?.join('\n') ?? '';
-
-    expect(retryPrompt).toContain('[VERIFICATION FAILED]');
-    expect(retryPrompt).toContain(`Command: ${verificationValue}`);
-    expect(retryPrompt).toContain('compile error: missing semicolon');
-    expect(retryPrompt).toContain('Fix the issues above before proceeding.');
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/verification-traceback.test.ts b/packages/sdk/src/workflows/__tests__/verification-traceback.test.ts
deleted file mode 100644
index 4661ad932..000000000
--- a/packages/sdk/src/workflows/__tests__/verification-traceback.test.ts
+++ /dev/null
@@ -1,558 +0,0 @@
-import { EventEmitter } from 'node:events';
-import { mkdtempSync, mkdirSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import { afterAll, beforeEach, describe, expect, it, vi } from 'vitest';
-
-import type { BudgetTracker } from '../budget-tracker.js';
-import type { CliSessionQuery, CliSessionReport } from '../cli-session-collector.js';
-import type { WorkflowDb } from '../runner.js';
-import type { AgentDefinition, RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../types.js';
-
-type WorkflowConfigStep = NonNullable<RelayYamlConfig['workflows']>[number]['steps'][number];
-
-const tempDirs: string[] = [];
-
-type QueuedSubprocessResult = {
-  stdout?: string;
-  stderr?: string;
-  code?: number | null;
-  signal?: string | null;
-  delayMs?: number;
-  error?: Error;
-  beforeClose?: () => void;
-};
-
-type CollectorResult =
-  | CliSessionReport
-  | null
-  | ((query: CliSessionQuery) => CliSessionReport | null | Promise<CliSessionReport | null>);
-
-let queuedSubprocessResults: QueuedSubprocessResult[] = [];
-let queuedCollectorResults: CollectorResult[] = [];
-
-const mockCollectCliSession = vi.fn(async (query: CliSessionQuery): Promise<CliSessionReport | null> => {
-  const next = queuedCollectorResults.shift();
-  if (typeof next === 'function') {
-    return next(query);
-  }
-  return next ?? null;
-});
-
-vi.mock('../cli-session-collector.js', () => ({
-  collectCliSession: mockCollectCliSession,
-}));
-
-const mockSubprocessSpawn = vi.fn().mockImplementation((_cmd, _args, _options) => {
-  const result = queuedSubprocessResults.shift() ?? {
-    stdout: 'completed\n',
-    code: 0,
-  };
-
-  const child = new EventEmitter() as EventEmitter & {
-    stdout: EventEmitter;
-    stderr: EventEmitter;
-    pid: number;
-    kill: ReturnType<typeof vi.fn>;
-  };
-
-  child.stdout = new EventEmitter();
-  child.stderr = new EventEmitter();
-  child.pid = 4321;
-
-  let closed = false;
-  let delayTimer: ReturnType<typeof setTimeout> | undefined;
-  const clearPending = () => {
-    if (delayTimer) {
-      clearTimeout(delayTimer);
-      delayTimer = undefined;
-    }
-  };
-  const closeChild = (
-    code: number | null = result.code ?? 0,
-    signal: string | null = result.signal ?? null
-  ) => {
-    if (closed) return;
-    closed = true;
-    clearPending();
-    child.emit('close', code, signal);
-  };
-
-  child.kill = vi.fn((signal?: string | number) => {
-    clearPending();
-    queueMicrotask(() => closeChild(null, typeof signal === 'string' ? signal : null));
-    return true;
-  });
-
-  const emitResult = () => {
-    if (closed) return;
-    if (result.error) {
-      closed = true;
-      child.emit('error', result.error);
-      return;
-    }
-    if (result.stdout) {
-      child.stdout.emit('data', Buffer.from(result.stdout));
-    }
-    if (result.stderr) {
-      child.stderr.emit('data', Buffer.from(result.stderr));
-    }
-    result.beforeClose?.();
-    closeChild(result.code ?? 0, result.signal ?? null);
-  };
-
-  if (result.delayMs && result.delayMs > 0) {
-    delayTimer = setTimeout(emitResult, result.delayMs);
-  } else {
-    queueMicrotask(emitResult);
-  }
-
-  return child;
-});
-
-vi.mock('node:child_process', async () => {
-  const actual = await vi.importActual<typeof import('node:child_process')>('node:child_process');
-  return {
-    ...actual,
-    spawn: mockSubprocessSpawn,
-  };
-});
-
-const mockHuman = {
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockRelayInstance = {
-  spawnPty: vi.fn(),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-  listAgents: vi.fn().mockResolvedValue([]),
-  addListener: vi.fn(() => () => {}),
-};
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn(),
-  RelayError: class RelayError extends Error {},
-}));
-
-vi.mock('../../relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-const { workflow } = await import('../builder.js');
-const { WorkflowRunner } = await import('../runner.js');
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (runRow: WorkflowRunRow) => {
-      runs.set(runRow.id, { ...runRow });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) {
-        runs.set(id, { ...existing, ...patch });
-      }
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (stepRow: WorkflowStepRow) => {
-      steps.set(stepRow.id, { ...stepRow });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) {
-        steps.set(id, { ...existing, ...patch });
-      }
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((step) => step.runId === runId).map((step) => ({ ...step }));
-    }),
-  };
-}
-
-function createWorkspace(subdirs: string[] = []): string {
-  const dir = mkdtempSync(path.join(os.tmpdir(), 'relay-verification-traceback-'));
-  tempDirs.push(dir);
-  for (const subdir of subdirs) {
-    mkdirSync(path.join(dir, subdir), { recursive: true });
-  }
-  return dir;
-}
-
-function makeRunner(cwd: string): InstanceType<typeof WorkflowRunner> {
-  return new WorkflowRunner({
-    cwd,
-    db: makeDb(),
-    workspaceId: 'ws-test',
-    relay: {
-      env: {
-        AGENT_RELAY_WORKFLOW_DISABLE_RELAYCAST: '1',
-      },
-    },
-  });
-}
-
-function makeReport(
-  tokens: Partial<NonNullable<CliSessionReport['tokens']>>,
-  overrides: Partial<CliSessionReport> = {}
-): CliSessionReport {
-  return {
-    cli: 'claude',
-    sessionId: 'session-1',
-    model: 'claude-sonnet-4',
-    provider: 'anthropic',
-    durationMs: 1_000,
-    cost: null,
-    tokens: {
-      input: tokens.input ?? 0,
-      output: tokens.output ?? 0,
-      cacheRead: tokens.cacheRead ?? 0,
-    },
-    turns: 1,
-    toolCalls: [],
-    errors: [],
-    finalStatus: 'completed',
-    summary: 'done',
-    ...overrides,
-  };
-}
-
-function makeConfig(input: {
-  workspace: string;
-  verification: WorkflowConfigStep['verification'];
-  retries?: number;
-  swarm?: Partial<RelayYamlConfig['swarm']>;
-  includeDiagnosticAgent?: boolean;
-}): RelayYamlConfig {
-  const workerCwd = path.join(input.workspace, 'worker');
-  const diagCwd = path.join(input.workspace, 'diag');
-
-  return {
-    version: '1',
-    name: 'verification-traceback',
-    swarm: {
-      pattern: 'dag',
-      ...input.swarm,
-    },
-    errorHandling: {
-      strategy: 'retry',
-      retryDelayMs: 0,
-    },
-    agents: [
-      {
-        name: 'worker',
-        cli: 'claude',
-        interactive: false,
-        cwd: workerCwd,
-      },
-      ...(input.includeDiagnosticAgent === false
-        ? []
-        : [
-            {
-              name: 'diag',
-              cli: 'claude',
-              interactive: false,
-              cwd: diagCwd,
-            } satisfies AgentDefinition,
-          ]),
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'implement',
-            agent: 'worker',
-            task: 'Implement the requested change',
-            retries: input.retries ?? 1,
-            verification: input.verification,
-          },
-        ],
-      },
-    ],
-    trajectories: false,
-  };
-}
-
-function verificationCommand(): string {
-  return (
-    `sh -c 'if [ -f ready.txt ]; then exit 0; ` +
-    `else echo "compile error: missing semicolon" >&2; exit 1; fi'`
-  );
-}
-
-function taskFromExecCall(execSpy: ReturnType<typeof vi.spyOn>, callIndex: number): string {
-  const call = execSpy.mock.calls[callIndex] as [AgentDefinition, { task?: string }] | undefined;
-  return String(call?.[1]?.task ?? '');
-}
-
-function getBudgetTracker(runner: InstanceType<typeof WorkflowRunner>): BudgetTracker | undefined {
-  return (runner as any).budgetTracker as BudgetTracker | undefined;
-}
-
-describe('verification traceback retry handling', () => {
-  beforeEach(() => {
-    vi.clearAllMocks();
-    queuedSubprocessResults = [];
-    queuedCollectorResults = [];
-    mockRelayInstance.shutdown.mockResolvedValue(undefined);
-    mockRelayInstance.onBrokerStderr.mockReturnValue(() => {});
-    mockRelayInstance.listAgents.mockResolvedValue([]);
-    mockRelayInstance.listAgentsRaw.mockResolvedValue([]);
-  });
-
-  afterAll(async () => {
-    await new Promise((resolve) => setTimeout(resolve, 250));
-    while (tempDirs.length > 0) {
-      rmSync(tempDirs.pop()!, { recursive: true, force: true });
-    }
-  });
-
-  it('verification failure without diagnosticAgent uses standard retry', async () => {
-    const workspace = createWorkspace(['worker']);
-    const runner = makeRunner(workspace);
-    const execSpy = vi.spyOn(runner as any, 'execNonInteractive');
-
-    queuedSubprocessResults = [
-      { stdout: 'first attempt\n', code: 0 },
-      {
-        stdout: 'second attempt\n',
-        code: 0,
-        beforeClose: () => {
-          writeFileSync(path.join(workspace, 'ready.txt'), 'ok');
-        },
-      },
-    ];
-
-    const result = await runner.execute(
-      makeConfig({
-        workspace,
-        includeDiagnosticAgent: false,
-        verification: {
-          type: 'custom',
-          value: verificationCommand(),
-        },
-      }),
-      'default'
-    );
-
-    expect(result.status, result.error).toBe('completed');
-    expect(execSpy).toHaveBeenCalledTimes(2);
-
-    const retryTask = taskFromExecCall(execSpy, 1);
-    expect(retryTask).toContain('[VERIFICATION FAILED]');
-    expect(retryTask).toContain(`Command: ${verificationCommand()}`);
-    expect(retryTask).toContain('compile error: missing semicolon');
-    expect(retryTask).not.toContain('Diagnostic analysis:');
-  });
-
-  it('verification failure with diagnosticAgent runs diagnostic before retry', async () => {
-    const workspace = createWorkspace(['worker', 'diag']);
-    const runner = makeRunner(workspace);
-    const execSpy = vi.spyOn(runner as any, 'execNonInteractive');
-
-    queuedSubprocessResults = [
-      { stdout: 'first attempt\n', code: 0 },
-      { stdout: 'The issue is in file X, line Y: missing semicolon\n', code: 0 },
-      { stdout: 'second attempt\n', code: 0 },
-    ];
-
-    const result = await runner.execute(
-      makeConfig({
-        workspace,
-        verification: {
-          type: 'custom',
-          value: 'exit 1',
-          diagnosticAgent: 'diag',
-        },
-      }),
-      'default'
-    );
-
-    expect(result.status).toBe('failed');
-    expect(result.error).toContain('Step "implement" failed after 1 retries');
-
-    expect(execSpy).toHaveBeenCalledTimes(3);
-
-    const diagnosticCall = execSpy.mock.calls[1] as [AgentDefinition, { task?: string }];
-    expect(diagnosticCall[0].name).toBe('diag');
-    expect(String(diagnosticCall[1].task)).toContain(
-      'Analyze what went wrong. Be specific. Do NOT fix the code.'
-    );
-
-    const retryTask = taskFromExecCall(execSpy, 2);
-    expect(retryTask).toContain('Diagnostic analysis:');
-    expect(retryTask).toContain('The issue is in file X, line Y: missing semicolon');
-  });
-
-  it('diagnostic agent timeout falls back to standard retry', async () => {
-    const workspace = createWorkspace(['worker', 'diag']);
-    const runner = makeRunner(workspace);
-    const execSpy = vi.spyOn(runner as any, 'execNonInteractive');
-    const logSpy = vi.spyOn(runner as any, 'log').mockImplementation(() => {});
-
-    queuedSubprocessResults = [
-      { stdout: 'first attempt\n', code: 0 },
-      { stdout: 'slow diagnostic\n', code: 0, delayMs: 5_000 },
-      {
-        stdout: 'second attempt\n',
-        code: 0,
-        beforeClose: () => {
-          writeFileSync(path.join(workspace, 'ready.txt'), 'ok');
-        },
-      },
-    ];
-
-    const result = await runner.execute(
-      makeConfig({
-        workspace,
-        verification: {
-          type: 'custom',
-          value: verificationCommand(),
-          diagnosticAgent: 'diag',
-          diagnosticTimeout: 100,
-        },
-      }),
-      'default'
-    );
-
-    expect(result.status, result.error).toBe('completed');
-    expect(execSpy).toHaveBeenCalledTimes(3);
-
-    const retryTask = taskFromExecCall(execSpy, 2);
-    expect(retryTask).toContain('[VERIFICATION FAILED]');
-    expect(retryTask).toContain('compile error: missing semicolon');
-    expect(retryTask).not.toContain('Diagnostic analysis:');
-    expect(logSpy).toHaveBeenCalledWith(expect.stringContaining('Diagnostic timed out'));
-  });
-
-  it('diagnostic agent failure falls back to standard retry', async () => {
-    const workspace = createWorkspace(['worker', 'diag']);
-    const runner = makeRunner(workspace);
-    const execSpy = vi.spyOn(runner as any, 'execNonInteractive');
-    const logSpy = vi.spyOn(runner as any, 'log').mockImplementation(() => {});
-
-    queuedSubprocessResults = [
-      { stdout: 'first attempt\n', code: 0 },
-      { error: new Error('diagnostic exploded') },
-      {
-        stdout: 'second attempt\n',
-        code: 0,
-        beforeClose: () => {
-          writeFileSync(path.join(workspace, 'ready.txt'), 'ok');
-        },
-      },
-    ];
-
-    const result = await runner.execute(
-      makeConfig({
-        workspace,
-        verification: {
-          type: 'custom',
-          value: verificationCommand(),
-          diagnosticAgent: 'diag',
-        },
-      }),
-      'default'
-    );
-
-    expect(result.status, result.error).toBe('completed');
-    expect(execSpy).toHaveBeenCalledTimes(3);
-
-    const retryTask = taskFromExecCall(execSpy, 2);
-    expect(retryTask).toContain('[VERIFICATION FAILED]');
-    expect(retryTask).toContain('compile error: missing semicolon');
-    expect(retryTask).not.toContain('Diagnostic analysis:');
-    expect(logSpy).toHaveBeenCalledWith(expect.stringContaining('Diagnostic failed'));
-  });
-
-  it('diagnosticAgent name validated against agent list', () => {
-    expect(() => {
-      workflow('traceback')
-        .agent('worker', { cli: 'claude' })
-        .step('implement', {
-          agent: 'worker',
-          task: 'Implement the requested change',
-          retries: 1,
-          verification: {
-            type: 'custom',
-            value: 'exit 1',
-            diagnosticAgent: 'nonexistent',
-          },
-        })
-        .toConfig();
-    }).toThrow('Step "implement" references unknown diagnosticAgent "nonexistent"');
-  });
-
-  it('diagnostic token usage recorded in budget tracker', async () => {
-    const workspace = createWorkspace(['worker', 'diag']);
-    const runner = makeRunner(workspace);
-
-    queuedSubprocessResults = [
-      { stdout: 'first attempt\n', code: 0 },
-      { stdout: 'The issue is in file X, line Y: missing semicolon\n', code: 0 },
-      {
-        stdout: 'second attempt\n',
-        code: 0,
-        beforeClose: () => {
-          writeFileSync(path.join(workspace, 'ready.txt'), 'ok');
-        },
-      },
-    ];
-    queuedCollectorResults = [null, makeReport({ input: 40, output: 10 }), null];
-
-    const result = await runner.execute(
-      makeConfig({
-        workspace,
-        swarm: { tokenBudget: 1_000 },
-        verification: {
-          type: 'custom',
-          value: verificationCommand(),
-          diagnosticAgent: 'diag',
-        },
-      }),
-      'default'
-    );
-
-    const tracker = getBudgetTracker(runner);
-
-    expect(result.status, result.error).toBe('completed');
-    expect(mockCollectCliSession).toHaveBeenCalledTimes(3);
-    expect(tracker?.getTotalUsage()).toEqual({
-      input: 40,
-      output: 10,
-      cacheRead: 0,
-      total: 50,
-    });
-  });
-
-  it('no retries configured with diagnosticAgent logs warning', () => {
-    const warnSpy = vi.spyOn(console, 'warn').mockImplementation(() => {});
-
-    workflow('traceback')
-      .agent('worker', { cli: 'claude' })
-      .agent('diag', { cli: 'claude' })
-      .step('implement', {
-        agent: 'worker',
-        task: 'Implement the requested change',
-        retries: 0,
-        verification: {
-          type: 'custom',
-          value: 'exit 1',
-          diagnosticAgent: 'diag',
-        },
-      })
-      .toConfig();
-
-    expect(warnSpy).toHaveBeenCalledWith(
-      'Step "implement": diagnosticAgent configured but no retries — diagnostic will never run'
-    );
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/verification.test.ts b/packages/sdk/src/workflows/__tests__/verification.test.ts
deleted file mode 100644
index 935451afb..000000000
--- a/packages/sdk/src/workflows/__tests__/verification.test.ts
+++ /dev/null
@@ -1,381 +0,0 @@
-import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
-import fs from 'node:fs';
-import path from 'node:path';
-import os from 'node:os';
-
-// The module under test — does not exist yet (red phase).
-import {
-  runVerification,
-  stripInjectedTaskEcho,
-  checkOutputContains,
-  checkFileExists,
-  checkCustom,
-  execCustomVerification,
-  findPrUrl,
-  type VerificationCheck,
-  type VerificationResult,
-  type VerificationOptions,
-  WorkflowCompletionError,
-} from '../verification.js';
-
-// ── helpers ───────────────────────────────────────────────────────────────────
-
-const noopSideEffects = {
-  recordStepToolSideEffect: vi.fn(),
-  getOrCreateStepEvidenceRecord: vi.fn(() => ({
-    evidence: { coordinationSignals: [] },
-  })),
-  log: vi.fn(),
-};
-
-function run(
-  check: VerificationCheck,
-  output: string,
-  stepName = 'test-step',
-  options?: VerificationOptions
-): VerificationResult {
-  return runVerification(check, output, stepName, undefined, options, noopSideEffects);
-}
-
-// ── tests ─────────────────────────────────────────────────────────────────────
-
-describe('verification logic', () => {
-  beforeEach(() => {
-    vi.clearAllMocks();
-  });
-
-  // 1. exit_code — pass on exit 0 (implicit success)
-  describe('exit_code', () => {
-    it('should pass when agent exited successfully (exit 0 implicit)', () => {
-      const result = run({ type: 'exit_code', value: '0' }, 'some output');
-      expect(result.passed).toBe(true);
-      expect(result.completionReason).toBe('completed_verified');
-    });
-
-    it('should still pass for non-zero value (exit_code is implicitly satisfied)', () => {
-      // per existing logic, exit_code case is a no-op — always passes if we reach it
-      const result = run({ type: 'exit_code', value: '1' }, 'output');
-      expect(result.passed).toBe(true);
-    });
-  });
-
-  // 2. output_contains — case-sensitive substring match
-  describe('output_contains', () => {
-    it('should pass when output contains the token', () => {
-      const result = run(
-        { type: 'output_contains', value: 'BUILD_SUCCESS' },
-        'Starting build...\nBUILD_SUCCESS\nDone.'
-      );
-      expect(result.passed).toBe(true);
-      expect(result.completionReason).toBe('completed_verified');
-    });
-
-    it('should fail when output does not contain the token', () => {
-      expect(() => run({ type: 'output_contains', value: 'BUILD_SUCCESS' }, 'build failed')).toThrow(
-        WorkflowCompletionError
-      );
-    });
-
-    it('should be case-sensitive', () => {
-      expect(() => run({ type: 'output_contains', value: 'BUILD_SUCCESS' }, 'build_success')).toThrow(
-        WorkflowCompletionError
-      );
-    });
-
-    it('should return failure result instead of throwing when allowFailure is set', () => {
-      const result = run({ type: 'output_contains', value: 'MISSING' }, 'no match here', 'test-step', {
-        allowFailure: true,
-      });
-      expect(result.passed).toBe(false);
-      expect(result.completionReason).toBe('failed_verification');
-      expect(result.error).toContain('MISSING');
-    });
-  });
-
-  // 3. file_exists — checks file presence at path
-  describe('file_exists', () => {
-    let tmpDir: string;
-    let tmpFile: string;
-
-    beforeEach(() => {
-      tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'verify-test-'));
-      tmpFile = path.join(tmpDir, 'artifact.txt');
-    });
-
-    afterEach(() => {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    });
-
-    it('should pass when the file exists', () => {
-      fs.writeFileSync(tmpFile, 'content');
-      // file_exists resolves relative to cwd; pass absolute path as value
-      const result = run({ type: 'file_exists', value: tmpFile }, '');
-      expect(result.passed).toBe(true);
-    });
-
-    it('should fail when the file does not exist', () => {
-      expect(() => run({ type: 'file_exists', value: path.join(tmpDir, 'nope.txt') }, '')).toThrow(
-        WorkflowCompletionError
-      );
-    });
-  });
-
-  // 4. custom verification — shell command execution
-  describe('custom', () => {
-    it('should pass when shell command exits 0', () => {
-      const result = run({ type: 'custom', value: 'true' }, 'output');
-      expect(result.passed).toBe(true);
-      expect(result.completionReason).toBe('completed_verified');
-    });
-
-    it('should fail when shell command exits non-zero', () => {
-      expect(() => run({ type: 'custom', value: 'false' }, 'output')).toThrow(WorkflowCompletionError);
-    });
-
-    it('should return failure with allowFailure', () => {
-      const result = run({ type: 'custom', value: 'false' }, 'output', 'test-step', {
-        allowFailure: true,
-      });
-      expect(result.passed).toBe(false);
-      expect(result.completionReason).toBe('failed_verification');
-    });
-
-    it('should preserve legacy no-op behavior when no command is provided', () => {
-      const result = run({ type: 'custom', value: '' }, 'output');
-      expect(result).toEqual({ passed: false });
-    });
-
-    it('should include command output in the failure message', () => {
-      const result = run(
-        { type: 'custom', value: 'printf "compile failed" >&2; exit 1' },
-        'output',
-        'test-step',
-        {
-          allowFailure: true,
-        }
-      );
-      expect(result.error).toContain('custom check "printf "compile failed" >&2; exit 1" failed');
-      expect(result.error).toContain('compile failed');
-    });
-  });
-
-  describe('execCustomVerification', () => {
-    it('should return passed true for exit-0 command', () => {
-      expect(execCustomVerification('true', process.cwd())).toEqual({ passed: true, output: '' });
-    });
-
-    it('should return passed false for exit-1 command', () => {
-      const result = execCustomVerification('false', process.cwd());
-      expect(result.passed).toBe(false);
-      expect(result.output.length).toBeGreaterThanOrEqual(0);
-    });
-
-    it('should capture stdout from command', () => {
-      const result = execCustomVerification('echo hello', process.cwd());
-      expect(result.passed).toBe(true);
-      expect(result.output).toBe('hello');
-    });
-
-    it('should capture stderr from a failing command', () => {
-      const result = execCustomVerification('printf "boom" >&2; exit 1', process.cwd());
-      expect(result.passed).toBe(false);
-      expect(result.output).toContain('boom');
-    });
-  });
-
-  // 4b. checkCustom unit tests
-  describe('checkCustom', () => {
-    it('should return passed true for exit-0 command', () => {
-      expect(checkCustom('true', 'any')).toEqual({ passed: true, stdout: '' });
-    });
-
-    it('should return passed false for exit-1 command', () => {
-      const result = checkCustom('false', 'any');
-      expect(result.passed).toBe(false);
-      expect(result.error).toBeDefined();
-    });
-
-    it('should capture stdout from command', () => {
-      const result = checkCustom('echo hello', 'any');
-      expect(result.passed).toBe(true);
-      expect(result.stdout).toBe('hello');
-    });
-
-    it('should handle regex matching', () => {
-      expect(checkCustom('regex:^foo', 'foobar')).toEqual({ passed: true });
-      expect(checkCustom('regex:^foo', 'barfoo').passed).toBe(false);
-    });
-
-    it('should handle invalid regex gracefully', () => {
-      const result = checkCustom('regex:[', 'any');
-      expect(result.passed).toBe(false);
-      expect(result.error).toContain('invalid regex');
-    });
-  });
-
-  // 5. Invalid/unknown verification type — falls through gracefully
-  describe('unknown type', () => {
-    it('should fall through and pass for unknown verification types', () => {
-      const result = run({ type: 'nonexistent' as VerificationCheck['type'], value: 'x' }, 'output');
-      // falls through the switch with no match, reaches success path
-      expect(result.passed).toBe(true);
-    });
-  });
-
-  // 6. completionMarkerFound option
-  describe('completionMarkerFound option', () => {
-    it('should log legacy marker message when completionMarkerFound is false', () => {
-      const result = run({ type: 'exit_code', value: '0' }, 'output', 'my-step', {
-        completionMarkerFound: false,
-      });
-      expect(result.passed).toBe(true);
-      expect(noopSideEffects.log).toHaveBeenCalledWith(
-        expect.stringContaining('without legacy STEP_COMPLETE marker')
-      );
-    });
-  });
-
-  // 7. stripInjectedTaskEcho
-  describe('stripInjectedTaskEcho', () => {
-    it('should return output unchanged when no injectedTaskText', () => {
-      expect(stripInjectedTaskEcho('hello world')).toBe('hello world');
-      expect(stripInjectedTaskEcho('hello world', undefined)).toBe('hello world');
-    });
-
-    it('should strip the injected task text from output', () => {
-      const task = 'Please run the build';
-      const output = 'Starting...\nPlease run the build\nBUILD_SUCCESS';
-      expect(stripInjectedTaskEcho(output, task)).toBe('Starting...\n\nBUILD_SUCCESS');
-    });
-
-    it('should handle CRLF normalization', () => {
-      const task = 'Run task\r\nwith newlines';
-      const output = 'prefix Run task\nwith newlines suffix';
-      expect(stripInjectedTaskEcho(output, task)).toBe('prefix  suffix');
-    });
-
-    it('should handle LF to CRLF normalization', () => {
-      const task = 'Run task\nwith newlines';
-      const output = 'prefix Run task\r\nwith newlines suffix';
-      expect(stripInjectedTaskEcho(output, task)).toBe('prefix  suffix');
-    });
-
-    it('should return output unchanged when task text is not found', () => {
-      expect(stripInjectedTaskEcho('output text', 'not present')).toBe('output text');
-    });
-
-    it('should handle empty injected task text', () => {
-      expect(stripInjectedTaskEcho('output', '')).toBe('output');
-    });
-  });
-
-  // 8. checkOutputContains with injectedTaskText
-  describe('checkOutputContains with injectedTaskText', () => {
-    it('should not match token that only appears in injected task echo', () => {
-      const task = 'Verify BUILD_SUCCESS appears';
-      const output = 'Verify BUILD_SUCCESS appears\nDone.';
-      expect(checkOutputContains(output, 'BUILD_SUCCESS', task)).toBe(false);
-    });
-
-    it('should match token that appears outside injected task echo', () => {
-      const task = 'Run the build';
-      const output = 'Run the build\nBUILD_SUCCESS';
-      expect(checkOutputContains(output, 'BUILD_SUCCESS', task)).toBe(true);
-    });
-
-    it('should return false for empty token', () => {
-      expect(checkOutputContains('anything', '', undefined)).toBe(false);
-    });
-  });
-
-  // 9. checkFileExists path traversal protection
-  describe('checkFileExists path traversal', () => {
-    let tmpDir: string;
-
-    beforeEach(() => {
-      tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), 'verify-traversal-'));
-    });
-
-    afterEach(() => {
-      fs.rmSync(tmpDir, { recursive: true, force: true });
-    });
-
-    it('should reject path traversal with ../', () => {
-      expect(checkFileExists('../../etc/passwd', tmpDir)).toBe(false);
-    });
-
-    it('should reject relative path with .. that resolves outside cwd', () => {
-      expect(checkFileExists('../../../etc/passwd', tmpDir)).toBe(false);
-    });
-
-    it('should allow files within cwd', () => {
-      const file = path.join(tmpDir, 'ok.txt');
-      fs.writeFileSync(file, 'ok');
-      expect(checkFileExists('ok.txt', tmpDir)).toBe(true);
-    });
-  });
-
-  describe('pr_url verification', () => {
-    it('passes when a github PR URL appears in the worker output', () => {
-      const result = run(
-        { type: 'pr_url', value: '' },
-        'shipped: https://github.com/AgentWorkforce/cloud/pull/606 ready for review'
-      );
-      expect(result.passed).toBe(true);
-      expect(result.completionReason).toBe('completed_verified');
-    });
-
-    it('fails with a WorkflowCompletionError when no PR URL is present', () => {
-      expect(() =>
-        run(
-          { type: 'pr_url', value: '' },
-          'All tests pass and the build is clean.\nfiles modified: foo.ts, bar.ts'
-        )
-      ).toThrow(WorkflowCompletionError);
-    });
-
-    it('rejects PR URLs for a different repository when a qualifier is provided', () => {
-      expect(() =>
-        run(
-          { type: 'pr_url', value: 'AgentWorkforce/relaycast' },
-          'Migration done: https://github.com/AgentWorkforce/cloud/pull/606'
-        )
-      ).toThrow(WorkflowCompletionError);
-    });
-
-    it('accepts a PR URL whose repo matches the qualifier case-insensitively', () => {
-      const result = run(
-        { type: 'pr_url', value: 'agentworkforce/relaycast' },
-        'See https://github.com/AgentWorkforce/relaycast/pull/128 for the SDK change.'
-      );
-      expect(result.passed).toBe(true);
-    });
-  });
-
-  describe('findPrUrl', () => {
-    it('returns the first matching URL when no qualifier is given', () => {
-      const url = findPrUrl(
-        'first https://github.com/foo/bar/pull/1 second https://github.com/foo/bar/pull/2'
-      );
-      expect(url).toBe('https://github.com/foo/bar/pull/1');
-    });
-
-    it('filters by repository qualifier', () => {
-      const url = findPrUrl(
-        'wrong https://github.com/foo/bar/pull/1 right https://github.com/baz/qux/pull/9',
-        'baz/qux'
-      );
-      expect(url).toBe('https://github.com/baz/qux/pull/9');
-    });
-
-    it('returns null when no PR URL is present', () => {
-      expect(findPrUrl('OWNER_DECISION: COMPLETE\nfiles modified: foo.ts')).toBeNull();
-    });
-
-    it('ignores PR URLs echoed inside the injected task text', () => {
-      const injected = 'Reference: https://github.com/foo/bar/pull/42';
-      const output = injected + '\nWorker said: tests pass, no PR opened, all good';
-      expect(findPrUrl(output, undefined, injected)).toBeNull();
-    });
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/workflow-reliability-contract.test.ts b/packages/sdk/src/workflows/__tests__/workflow-reliability-contract.test.ts
deleted file mode 100644
index 276027387..000000000
--- a/packages/sdk/src/workflows/__tests__/workflow-reliability-contract.test.ts
+++ /dev/null
@@ -1,637 +0,0 @@
-import { afterEach, describe, expect, it, vi } from 'vitest';
-import { mkdirSync, mkdtempSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import { workflow } from '../builder.js';
-import { WorkflowRunner, type WorkflowDb } from '../runner.js';
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowStepRow } from '../types.js';
-
-afterEach(() => {
-  vi.unstubAllGlobals();
-});
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) =>
-      [...steps.values()].filter((step) => step.runId === runId).map((step) => ({ ...step }))
-    ),
-  };
-}
-
-function baseConfig(overrides: Partial<RelayYamlConfig> = {}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'workflow-reliability-contract',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'fixer', cli: 'claude', role: 'implementation engineer', interactive: false }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'verify',
-            type: 'deterministic',
-            command: 'verify',
-            captureOutput: true,
-          },
-        ],
-      },
-    ],
-    trajectories: false,
-    ...overrides,
-  };
-}
-
-describe('workflow reliability contract', () => {
-  it('makes SDK builder workflows repairable by default', () => {
-    const config = workflow('default-reliable')
-      .agent('fixer', { cli: 'claude', role: 'implementation engineer' })
-      .step('verify', { type: 'deterministic', command: 'npm test' })
-      .toConfig();
-
-    expect(config.errorHandling).toMatchObject({
-      strategy: 'retry',
-      maxRetries: 2,
-      retryDelayMs: 1000,
-      repairRetries: 2,
-    });
-  });
-
-  it('offers reliable and repairable presets for workflow authors', () => {
-    const reliable = workflow('reliable')
-      .agent('fixer', { cli: 'claude', role: 'implementation engineer' })
-      .step('verify', { type: 'deterministic', command: 'npm test' })
-      .reliable({ repairAgent: 'fixer', repairRetries: 3 })
-      .toConfig();
-    const repairable = workflow('repairable')
-      .agent('fixer', { cli: 'claude', role: 'implementation engineer' })
-      .step('verify', { type: 'deterministic', command: 'npm test' })
-      .repairable({ maxRetries: 4 })
-      .toConfig();
-
-    expect(reliable.errorHandling).toMatchObject({
-      strategy: 'retry',
-      maxRetries: 3,
-      repairAgent: 'fixer',
-      repairRetries: 3,
-    });
-    expect(repairable.errorHandling).toMatchObject({
-      strategy: 'retry',
-      maxRetries: 4,
-      repairRetries: 4,
-    });
-  });
-
-  it('applies repair-aware defaults to raw runner configs with agents', async () => {
-    const executeDeterministicStep = vi
-      .fn()
-      .mockResolvedValueOnce({ output: 'missing artifact', exitCode: 1 })
-      .mockResolvedValueOnce({ output: 'artifact exists', exitCode: 0 });
-    const executeAgentStep = vi.fn(async () => 'created artifact');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(baseConfig(), 'default');
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeAgentStep).toHaveBeenCalledTimes(1);
-    expect(executeDeterministicStep).toHaveBeenCalledTimes(2);
-  });
-
-  it('routes repairable deterministic failures through a repair agent before retrying', async () => {
-    const executeDeterministicStep = vi
-      .fn()
-      .mockResolvedValueOnce({ output: 'missing generated artifact', exitCode: 1 })
-      .mockResolvedValueOnce({ output: 'artifact exists', exitCode: 0 });
-    const executeAgentStep = vi.fn(async () => 'created generated artifact');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        errorHandling: { strategy: 'retry', repairRetries: 1, retryDelayMs: 1, repairAgent: 'fixer' },
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeAgentStep).toHaveBeenCalledTimes(1);
-    expect((executeAgentStep as any).mock.calls[0][2]).toContain('A deterministic workflow gate failed');
-    expect(executeDeterministicStep).toHaveBeenCalledTimes(2);
-  });
-
-  it('still retries the deterministic gate when the repair agent attempt throws', async () => {
-    const executeDeterministicStep = vi
-      .fn()
-      .mockResolvedValueOnce({ output: 'transient failure', exitCode: 1 })
-      .mockResolvedValueOnce({ output: 'passed after retry', exitCode: 0 });
-    const executeAgentStep = vi.fn(async () => {
-      throw new Error('repair model unavailable');
-    });
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        errorHandling: { strategy: 'retry', repairRetries: 1, retryDelayMs: 1, repairAgent: 'fixer' },
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeAgentStep).toHaveBeenCalledTimes(1);
-    expect(executeDeterministicStep).toHaveBeenCalledTimes(2);
-  });
-
-  it('fails only after the deterministic repair retry budget is exhausted', async () => {
-    const executeDeterministicStep = vi.fn(async () => ({ output: 'still broken', exitCode: 1 }));
-    const executeAgentStep = vi.fn(async () => 'attempted repair');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        errorHandling: { strategy: 'retry', repairRetries: 2, retryDelayMs: 1, repairAgent: 'fixer' },
-      }),
-      'default'
-    );
-
-    expect(run.status).toBe('failed');
-    expect(run.error).toContain('verify');
-    expect(executeAgentStep).toHaveBeenCalledTimes(2);
-    expect(executeDeterministicStep).toHaveBeenCalledTimes(3);
-  });
-
-  it('keeps soft deterministic checks non-terminal so a later agent step can fix them', async () => {
-    const executeDeterministicStep = vi.fn(async () => ({ output: 'typecheck failed', exitCode: 1 }));
-    const executeAgentStep = vi.fn(async () => 'fixed typecheck');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'soft-validation',
-                type: 'deterministic',
-                command: 'npm run typecheck',
-                captureOutput: true,
-                failOnError: false,
-              },
-              {
-                name: 'fix-validation',
-                agent: 'fixer',
-                task: 'Fix validation using {{steps.soft-validation.output}}',
-                dependsOn: ['soft-validation'],
-              },
-            ],
-          },
-        ],
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeAgentStep).toHaveBeenCalledTimes(1);
-    expect((executeAgentStep as any).mock.calls[0][2]).toContain('typecheck failed');
-  });
-
-  it('treats final hard validation as repairable before terminal failure', async () => {
-    const executeDeterministicStep = vi
-      .fn()
-      .mockResolvedValueOnce({ output: 'final typecheck failed', exitCode: 1 })
-      .mockResolvedValueOnce({ output: 'final validation passed', exitCode: 0 });
-    const executeAgentStep = vi.fn(async () => 'fixed final validation');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        errorHandling: { strategy: 'retry', repairRetries: 1, retryDelayMs: 1, repairAgent: 'fixer' },
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'final-hard-validation',
-                type: 'deterministic',
-                command: 'npm run typecheck && npm test',
-                captureOutput: true,
-                failOnError: true,
-              },
-            ],
-          },
-        ],
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeAgentStep).toHaveBeenCalledTimes(1);
-    expect((executeAgentStep as any).mock.calls[0][2]).toContain('final-hard-validation');
-    expect(executeDeterministicStep).toHaveBeenCalledTimes(2);
-  });
-
-  it('keeps sibling branches independent when one branch captures a soft failure for repair', async () => {
-    const executeDeterministicStep = vi.fn(async (_step, command: string) => {
-      if (command === 'branch-a-soft-check') return { output: 'branch A needs repair', exitCode: 1 };
-      return { output: `${command} ok`, exitCode: 0 };
-    });
-    const executeAgentStep = vi.fn(async () => 'merged branch evidence and fixed branch A');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        swarm: { pattern: 'fan-out' },
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'branch-a-validation',
-                type: 'deterministic',
-                command: 'branch-a-soft-check',
-                captureOutput: true,
-                failOnError: false,
-              },
-              {
-                name: 'branch-b-validation',
-                type: 'deterministic',
-                command: 'branch-b-check',
-                captureOutput: true,
-                failOnError: true,
-              },
-              {
-                name: 'merge-and-fix',
-                agent: 'fixer',
-                task: 'Use {{steps.branch-a-validation.output}} and {{steps.branch-b-validation.output}}.',
-                dependsOn: ['branch-a-validation', 'branch-b-validation'],
-              },
-            ],
-          },
-        ],
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeDeterministicStep).toHaveBeenCalledTimes(2);
-    expect(executeAgentStep).toHaveBeenCalledTimes(1);
-    expect((executeAgentStep as any).mock.calls[0][2]).toContain('branch A needs repair');
-    expect((executeAgentStep as any).mock.calls[0][2]).toContain('branch-b-check ok');
-  });
-
-  it('uses the best available workflow agent when no explicit repairAgent is configured', async () => {
-    const executeDeterministicStep = vi
-      .fn()
-      .mockResolvedValueOnce({ output: 'needs repair', exitCode: 1 })
-      .mockResolvedValueOnce({ output: 'fixed', exitCode: 0 });
-    const executeAgentStep = vi.fn(async () => 'fixed by fallback agent');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        errorHandling: { strategy: 'retry', repairRetries: 1, retryDelayMs: 1 },
-        agents: [
-          { name: 'reviewer', cli: 'claude', role: 'reviewer' },
-          { name: 'implementer', cli: 'claude', role: 'implementation engineer', interactive: false },
-        ],
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect((executeAgentStep as any).mock.calls[0][1]).toMatchObject({ name: 'implementer' });
-  });
-
-  it('falls back to a suitable workflow agent when the configured repairAgent is invalid', async () => {
-    const executeDeterministicStep = vi
-      .fn()
-      .mockResolvedValueOnce({ output: 'needs repair', exitCode: 1 })
-      .mockResolvedValueOnce({ output: 'fixed', exitCode: 0 });
-    const executeAgentStep = vi.fn(async () => 'fixed by fallback agent');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        errorHandling: {
-          strategy: 'retry',
-          repairRetries: 1,
-          retryDelayMs: 1,
-          repairAgent: 'missing-repair-agent',
-        },
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect((executeAgentStep as any).mock.calls[0][1]).toMatchObject({ name: 'fixer' });
-  });
-
-  it('preserves cached step output when resuming from a later repair step', async () => {
-    const tmpDir = mkdtempSync(path.join(os.tmpdir(), 'relay-reliability-start-from-'));
-    const previousRunId = 'previous-run-with-soft-validation';
-    const outputDir = path.join(tmpDir, '.agent-relay', 'step-outputs', previousRunId);
-    mkdirSync(outputDir, { recursive: true });
-    writeFileSync(path.join(outputDir, 'soft-validation.md'), 'cached typecheck failure');
-
-    const executeAgentStep = vi.fn(async () => 'fixed cached validation failure');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: tmpDir,
-      executor: { executeAgentStep },
-    });
-
-    try {
-      const run = await runner.execute(
-        baseConfig({
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'soft-validation',
-                  type: 'deterministic',
-                  command: 'npm run typecheck',
-                  captureOutput: true,
-                  failOnError: false,
-                },
-                {
-                  name: 'fix-validation',
-                  agent: 'fixer',
-                  task: 'Fix this prior output: {{steps.soft-validation.output}}',
-                  dependsOn: ['soft-validation'],
-                },
-              ],
-            },
-          ],
-        }),
-        'default',
-        undefined,
-        { startFrom: 'fix-validation', previousRunId }
-      );
-
-      expect(run.status, run.error).toBe('completed');
-      expect(executeAgentStep).toHaveBeenCalledTimes(1);
-      expect((executeAgentStep as any).mock.calls[0][2]).toContain('cached typecheck failure');
-    } finally {
-      rmSync(tmpDir, { recursive: true, force: true });
-    }
-  });
-
-  it('repairs malformed agent artifacts before retrying the agent step', async () => {
-    const executeAgentStep = vi.fn(async (step) => {
-      if (step.name.includes('-repair-')) return 'patched artifact instructions';
-      if (
-        (executeAgentStep as any).mock.calls.filter(([s]: any[]) => s.name === 'write-artifact').length === 1
-      ) {
-        return 'plain prose without required metadata';
-      }
-      return 'artifact complete\nRICKY_MASTER_CHILD_RUN_VERIFIED';
-    });
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'write-artifact',
-                agent: 'fixer',
-                task: 'Write a structured workflow artifact.',
-                verification: {
-                  type: 'output_contains',
-                  value: 'RICKY_MASTER_CHILD_RUN_VERIFIED',
-                },
-              },
-            ],
-          },
-        ],
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeAgentStep).toHaveBeenCalledTimes(3);
-    expect((executeAgentStep as any).mock.calls[1][0]).toMatchObject({ name: 'write-artifact-repair-1' });
-    expect((executeAgentStep as any).mock.calls[1][2]).toContain('invalid artifact');
-  });
-
-  it('repairs child INVALID_ARTIFACT failures instead of stopping the master at attempt one', async () => {
-    const executeAgentStep = vi.fn(async (step) => {
-      if (step.name.includes('-repair-')) return 'repaired child workflow artifact';
-      const childAttempts = (executeAgentStep as any).mock.calls.filter(
-        ([s]: any[]) => s.name === 'run-update-config-2'
-      ).length;
-      if (childAttempts === 1) {
-        return 'Execution: blocked — INVALID_ARTIFACT at final-hard-validation';
-      }
-      return 'Execution: success — run child-fixed\nRICKY_MASTER_CHILD_RUN_VERIFIED';
-    });
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'run-update-config-2',
-                agent: 'fixer',
-                task: 'Run the child workflow and return structured evidence.',
-                verification: {
-                  type: 'output_contains',
-                  value: 'RICKY_MASTER_CHILD_RUN_VERIFIED',
-                },
-              },
-              {
-                name: 'final-signoff',
-                type: 'deterministic',
-                command: 'true',
-                dependsOn: ['run-update-config-2'],
-              },
-            ],
-          },
-        ],
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeAgentStep).toHaveBeenCalledTimes(3);
-    expect((executeAgentStep as any).mock.calls[1][2]).toContain('INVALID_ARTIFACT');
-  });
-
-  it('keeps retrying the failed gate when a repair agent returns an unusable fix', async () => {
-    const executeDeterministicStep = vi
-      .fn()
-      .mockResolvedValueOnce({ output: 'INVALID_ARTIFACT', exitCode: 1 })
-      .mockResolvedValueOnce({ output: 'still INVALID_ARTIFACT', exitCode: 1 })
-      .mockResolvedValueOnce({ output: 'artifact valid', exitCode: 0 });
-    const executeAgentStep = vi
-      .fn()
-      .mockResolvedValueOnce('malformed repair response without fenced artifact')
-      .mockResolvedValueOnce('valid repair response with metadata');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(
-      baseConfig({
-        errorHandling: { strategy: 'retry', repairRetries: 2, retryDelayMs: 1, repairAgent: 'fixer' },
-      }),
-      'default'
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(executeAgentStep).toHaveBeenCalledTimes(2);
-    expect(executeDeterministicStep).toHaveBeenCalledTimes(3);
-  });
-
-  it('runs supervised api owners without spawning an interactive owner process', async () => {
-    const fetch = vi.fn(async () => {
-      return new Response(
-        JSON.stringify({
-          content: [{ type: 'text', text: 'OWNER_DECISION: COMPLETE\nReason: worker output verified' }],
-          model: 'claude-sonnet-4-20250514',
-        }),
-        { status: 200, headers: { 'content-type': 'application/json' } }
-      );
-    });
-    vi.stubGlobal('fetch', fetch);
-
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      envSecrets: { ANTHROPIC_API_KEY: 'test-api-key' },
-    });
-    const spawnAndWait = vi.fn(async (agent: any, _step: any, _timeoutMs: any, options: any) => {
-      options?.onSpawned?.({ actualName: agent.name, agent: { release: async () => undefined } });
-      if (agent.name === 'worker') {
-        return { output: 'DONE', exitCode: 0, promptTaskText: 'worker task' };
-      }
-      throw new Error('api owner should not use spawnAndWait');
-    });
-    (runner as any).spawnAndWait = spawnAndWait;
-
-    const result = await (runner as any).executeSupervisedAgentStep(
-      {
-        name: 'supervised-api-owner',
-        agent: 'worker',
-        task: 'produce done',
-        verification: { type: 'output_contains', value: 'DONE' },
-      },
-      {
-        specialist: { name: 'worker', cli: 'claude', role: 'worker' },
-        owner: { name: 'owner', cli: 'api', role: 'owner' },
-      },
-      'produce done'
-    );
-
-    expect(result).toMatchObject({
-      specialistOutput: 'DONE',
-      completionReason: 'completed_by_owner_decision',
-    });
-    expect(fetch).toHaveBeenCalledTimes(1);
-    expect(spawnAndWait).toHaveBeenCalledTimes(1);
-  });
-
-  it('does not run repair agents for fail-fast workflows even when agents are present', async () => {
-    const executeDeterministicStep = vi.fn(async () => ({ output: 'hard failure', exitCode: 1 }));
-    const executeAgentStep = vi.fn(async () => 'unexpected repair');
-    const runner = new WorkflowRunner({
-      db: makeDb(),
-      workspaceId: 'ws-test',
-      cwd: process.cwd(),
-      executor: { executeDeterministicStep, executeAgentStep },
-    });
-
-    const run = await runner.execute(baseConfig({ errorHandling: { strategy: 'fail-fast' } }), 'default');
-
-    expect(run.status).toBe('failed');
-    expect(executeAgentStep).not.toHaveBeenCalled();
-    expect(executeDeterministicStep).toHaveBeenCalledTimes(1);
-  });
-});
diff --git a/packages/sdk/src/workflows/__tests__/workflow-reliability-e2e.test.ts b/packages/sdk/src/workflows/__tests__/workflow-reliability-e2e.test.ts
deleted file mode 100644
index a9ef17163..000000000
--- a/packages/sdk/src/workflows/__tests__/workflow-reliability-e2e.test.ts
+++ /dev/null
@@ -1,248 +0,0 @@
-import { describe, expect, it } from 'vitest';
-import { execSync } from 'node:child_process';
-import { mkdirSync, mkdtempSync, rmSync, writeFileSync } from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import { WorkflowRunner } from '../runner.js';
-import type { AgentDefinition, RelayYamlConfig, WorkflowStep } from '../types.js';
-
-const CHECK_MARKER =
-  "node -e \"const fs=require('fs');const v=fs.readFileSync('marker.txt','utf8').trim();if(v!=='fixed'){console.log('marker='+v);process.exit(1)}console.log('ok')\"";
-
-function baseConfig(
-  name: string,
-  pattern: RelayYamlConfig['swarm']['pattern'],
-  steps: NonNullable<RelayYamlConfig['workflows']>[number]['steps']
-): RelayYamlConfig {
-  return {
-    version: '1',
-    name,
-    swarm: { pattern },
-    agents: [
-      {
-        name: 'fixer',
-        cli: 'claude',
-        role: 'implementation engineer',
-        interactive: false,
-      },
-    ],
-    workflows: [{ name: 'default', steps }],
-    trajectories: false,
-  };
-}
-
-function makeWorkspace(): string {
-  const cwd = mkdtempSync(path.join(os.tmpdir(), 'relay-workflow-reliability-e2e-'));
-  writeFileSync(path.join(cwd, 'marker.txt'), 'broken\n');
-  return cwd;
-}
-
-async function runReliabilityWorkflow(config: RelayYamlConfig, cwd = makeWorkspace()) {
-  const callsByStep = new Map<string, number>();
-  const executeAgentStep = async (
-    step: WorkflowStep,
-    _agent: AgentDefinition,
-    resolvedTask: string
-  ): Promise<string> => {
-    const count = (callsByStep.get(step.name) ?? 0) + 1;
-    callsByStep.set(step.name, count);
-
-    if (step.name.includes('-repair-')) {
-      writeFileSync(path.join(step.cwd ?? cwd, 'marker.txt'), 'fixed\n');
-      return `repair complete for ${step.name}`;
-    }
-
-    if (/invalid[- ]artifact/i.test(step.name) && count === 1) {
-      return 'Execution: blocked — INVALID_ARTIFACT at final-hard-validation';
-    }
-
-    if (/child/i.test(resolvedTask) && count === 1) {
-      return 'Execution: blocked — INVALID_ARTIFACT at final-hard-validation';
-    }
-
-    return `Execution: success\nRICKY_MASTER_CHILD_RUN_VERIFIED\n${resolvedTask.slice(0, 80)}`;
-  };
-
-  const runner = new WorkflowRunner({
-    workspaceId: 'ws-e2e',
-    cwd,
-    executor: { executeAgentStep },
-  });
-
-  try {
-    const run = await runner.execute(config, 'default');
-    return { run, callsByStep };
-  } finally {
-    rmSync(cwd, { recursive: true, force: true });
-  }
-}
-
-describe('workflow reliability e2e shapes', () => {
-  it('repairs a failing deterministic gate in a pipeline workflow', async () => {
-    const { run, callsByStep } = await runReliabilityWorkflow(
-      baseConfig('reliable-pipeline', 'pipeline', [
-        { name: 'prepare', agent: 'fixer', task: 'Prepare inputs.' },
-        {
-          name: 'verify',
-          type: 'deterministic',
-          command: CHECK_MARKER,
-          dependsOn: ['prepare'],
-          captureOutput: true,
-        },
-      ])
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(callsByStep.has('verify-repair-1')).toBe(true);
-  });
-
-  it('repairs a failing deterministic gate in a DAG workflow', async () => {
-    const { run, callsByStep } = await runReliabilityWorkflow(
-      baseConfig('reliable-dag', 'dag', [
-        { name: 'backend', agent: 'fixer', task: 'Prepare backend evidence.' },
-        { name: 'frontend', agent: 'fixer', task: 'Prepare frontend evidence.' },
-        {
-          name: 'integrated-validation',
-          type: 'deterministic',
-          command: CHECK_MARKER,
-          dependsOn: ['backend', 'frontend'],
-          captureOutput: true,
-        },
-      ])
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(callsByStep.has('integrated-validation-repair-1')).toBe(true);
-  });
-
-  it('keeps fan-out siblings isolated while repairing the failed branch gate', async () => {
-    const { run, callsByStep } = await runReliabilityWorkflow(
-      baseConfig('reliable-fan-out', 'fan-out', [
-        {
-          name: 'branch-a-validation',
-          type: 'deterministic',
-          command: CHECK_MARKER,
-          captureOutput: true,
-        },
-        {
-          name: 'branch-b-validation',
-          type: 'deterministic',
-          command: 'node -e "console.log(\'branch-b-ok\')"',
-          captureOutput: true,
-        },
-        {
-          name: 'merge',
-          agent: 'fixer',
-          task: 'Merge {{steps.branch-a-validation.output}} and {{steps.branch-b-validation.output}}.',
-          dependsOn: ['branch-a-validation', 'branch-b-validation'],
-        },
-      ])
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(callsByStep.has('branch-a-validation-repair-1')).toBe(true);
-    expect(callsByStep.has('branch-b-validation-repair-1')).toBe(false);
-  });
-
-  it('repairs child workflow INVALID_ARTIFACT output before master final validation', async () => {
-    const { run, callsByStep } = await runReliabilityWorkflow(
-      baseConfig('reliable-master-child', 'hierarchical', [
-        {
-          name: 'run-child-workflow',
-          agent: 'fixer',
-          task: 'Run child workflow and return RICKY_MASTER_CHILD_RUN_VERIFIED.',
-          verification: {
-            type: 'output_contains',
-            value: 'RICKY_MASTER_CHILD_RUN_VERIFIED',
-          },
-        },
-        {
-          name: 'master-final-validation',
-          type: 'deterministic',
-          command: CHECK_MARKER,
-          dependsOn: ['run-child-workflow'],
-          captureOutput: true,
-        },
-      ])
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(callsByStep.has('run-child-workflow-repair-1')).toBe(true);
-    expect(callsByStep.has('master-final-validation-repair-1')).toBe(false);
-  });
-
-  it('repairs a deterministic-only workflow with a configured repair agent', async () => {
-    const { run, callsByStep } = await runReliabilityWorkflow(
-      baseConfig('reliable-deterministic-only', 'pipeline', [
-        {
-          name: 'verify-only',
-          type: 'deterministic',
-          command: CHECK_MARKER,
-          captureOutput: true,
-        },
-      ])
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(callsByStep.has('verify-only-repair-1')).toBe(true);
-  });
-
-  it('repairs agent artifact retries and then passes deterministic validation', async () => {
-    const { run, callsByStep } = await runReliabilityWorkflow(
-      baseConfig('reliable-agent-plus-gates', 'pipeline', [
-        {
-          name: 'invalid-artifact-author',
-          agent: 'fixer',
-          task: 'Produce structured artifact metadata.',
-          verification: {
-            type: 'output_contains',
-            value: 'RICKY_MASTER_CHILD_RUN_VERIFIED',
-          },
-        },
-        {
-          name: 'verify-artifact',
-          type: 'deterministic',
-          command: CHECK_MARKER,
-          dependsOn: ['invalid-artifact-author'],
-          captureOutput: true,
-        },
-      ])
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(callsByStep.has('invalid-artifact-author-repair-1')).toBe(true);
-    expect(callsByStep.has('verify-artifact-repair-1')).toBe(false);
-  });
-
-  it('repairs validation inside a git worktree-backed workflow', async () => {
-    const cwd = makeWorkspace();
-    execSync('git init -q', { cwd });
-    execSync('git config user.email test@example.com', { cwd });
-    execSync('git config user.name "Relay Test"', { cwd });
-    execSync('git add marker.txt && git commit -q -m init', { cwd });
-
-    const { run, callsByStep } = await runReliabilityWorkflow(
-      baseConfig('reliable-worktree', 'pipeline', [
-        {
-          name: 'make-worktree',
-          type: 'worktree',
-          branch: 'reliability-worktree-test',
-          path: 'child-worktree',
-        },
-        {
-          name: 'verify-in-worktree',
-          type: 'deterministic',
-          command: CHECK_MARKER,
-          cwd: 'child-worktree',
-          dependsOn: ['make-worktree'],
-          captureOutput: true,
-        },
-      ]),
-      cwd
-    );
-
-    expect(run.status, run.error).toBe('completed');
-    expect(callsByStep.has('verify-in-worktree-repair-1')).toBe(true);
-  });
-});
diff --git a/packages/sdk/src/workflows/api-executor.ts b/packages/sdk/src/workflows/api-executor.ts
deleted file mode 100644
index 63dceb42f..000000000
--- a/packages/sdk/src/workflows/api-executor.ts
+++ /dev/null
@@ -1,158 +0,0 @@
-/**
- * API Executor — calls LLM provider APIs directly via fetch().
- * Used when agent cli is 'api'. No sandbox, no CLI, no PTY.
- */
-
-type Provider = 'anthropic' | 'openai' | 'google';
-
-function detectProvider(model: string): Provider {
-  if (model.startsWith('claude')) return 'anthropic';
-  if (model.startsWith('gpt') || model.startsWith('o1') || model.startsWith('o3') || model.startsWith('o4'))
-    return 'openai';
-  if (model.startsWith('gemini')) return 'google';
-  return 'anthropic';
-}
-
-function getApiKey(provider: Provider, envSecrets?: Record<string, string>): string {
-  const envMap: Record<Provider, string[]> = {
-    anthropic: ['ANTHROPIC_API_KEY'],
-    openai: ['OPENAI_API_KEY'],
-    google: ['GOOGLE_API_KEY', 'GEMINI_API_KEY'],
-  };
-  for (const key of envMap[provider]) {
-    const value = envSecrets?.[key] ?? process.env[key];
-    if (value) return value;
-  }
-  throw new Error(`No API key for "${provider}". Set ${envMap[provider].join(' or ')}.`);
-}
-
-interface ApiResponse {
-  content: string;
-  model: string;
-  usage?: { inputTokens: number; outputTokens: number };
-}
-
-async function callAnthropic(
-  apiKey: string,
-  model: string,
-  task: string,
-  maxTokens: number,
-  systemPrompt?: string
-): Promise<ApiResponse> {
-  const res = await fetch('https://api.anthropic.com/v1/messages', {
-    method: 'POST',
-    headers: { 'content-type': 'application/json', 'x-api-key': apiKey, 'anthropic-version': '2023-06-01' },
-    body: JSON.stringify({
-      model,
-      max_tokens: maxTokens,
-      ...(systemPrompt ? { system: systemPrompt } : {}),
-      messages: [{ role: 'user', content: task }],
-    }),
-  });
-  if (!res.ok) throw new Error(`Anthropic API error (${res.status}): ${await res.text()}`);
-  const data = (await res.json()) as {
-    content: Array<{ type: string; text?: string }>;
-    model: string;
-    usage?: { input_tokens: number; output_tokens: number };
-  };
-  return {
-    content: data.content
-      .filter((c) => c.type === 'text')
-      .map((c) => c.text ?? '')
-      .join(''),
-    model: data.model,
-    usage: data.usage
-      ? { inputTokens: data.usage.input_tokens, outputTokens: data.usage.output_tokens }
-      : undefined,
-  };
-}
-
-async function callOpenAI(
-  apiKey: string,
-  model: string,
-  task: string,
-  maxTokens: number,
-  systemPrompt?: string
-): Promise<ApiResponse> {
-  const messages: Array<{ role: string; content: string }> = [];
-  if (systemPrompt) messages.push({ role: 'system', content: systemPrompt });
-  messages.push({ role: 'user', content: task });
-  const res = await fetch('https://api.openai.com/v1/chat/completions', {
-    method: 'POST',
-    headers: { 'content-type': 'application/json', authorization: `Bearer ${apiKey}` },
-    body: JSON.stringify({ model, max_tokens: maxTokens, messages }),
-  });
-  if (!res.ok) throw new Error(`OpenAI API error (${res.status}): ${await res.text()}`);
-  const data = (await res.json()) as {
-    choices: Array<{ message: { content: string } }>;
-    model: string;
-    usage?: { prompt_tokens: number; completion_tokens: number };
-  };
-  return {
-    content: data.choices[0]?.message?.content ?? '',
-    model: data.model,
-    usage: data.usage
-      ? { inputTokens: data.usage.prompt_tokens, outputTokens: data.usage.completion_tokens }
-      : undefined,
-  };
-}
-
-async function callGoogle(
-  apiKey: string,
-  model: string,
-  task: string,
-  maxTokens: number,
-  systemPrompt?: string
-): Promise<ApiResponse> {
-  const res = await fetch(
-    `https://generativelanguage.googleapis.com/v1beta/models/${model}:generateContent`,
-    {
-      method: 'POST',
-      headers: { 'content-type': 'application/json', 'x-goog-api-key': apiKey },
-      body: JSON.stringify({
-        ...(systemPrompt ? { systemInstruction: { parts: [{ text: systemPrompt }] } } : {}),
-        contents: [{ parts: [{ text: task }] }],
-        generationConfig: { maxOutputTokens: maxTokens },
-      }),
-    }
-  );
-  if (!res.ok) throw new Error(`Google API error (${res.status}): ${await res.text()}`);
-  const data = (await res.json()) as {
-    candidates: Array<{ content: { parts: Array<{ text: string }> } }>;
-    usageMetadata?: { promptTokenCount: number; candidatesTokenCount: number };
-  };
-  return {
-    content: data.candidates[0]?.content?.parts?.map((p) => p.text).join('') ?? '',
-    model,
-    usage: data.usageMetadata
-      ? {
-          inputTokens: data.usageMetadata.promptTokenCount,
-          outputTokens: data.usageMetadata.candidatesTokenCount,
-        }
-      : undefined,
-  };
-}
-
-const PROVIDER_CALLERS = { anthropic: callAnthropic, openai: callOpenAI, google: callGoogle } as const;
-
-export interface ApiExecutorOptions {
-  envSecrets?: Record<string, string>;
-  defaultModel?: string;
-  defaultMaxTokens?: number;
-  skills?: string;
-}
-
-export async function executeApiStep(
-  model: string,
-  task: string,
-  options: ApiExecutorOptions = {}
-): Promise<string> {
-  const resolvedModel = model || options.defaultModel || 'claude-sonnet-4-20250514';
-  const maxTokens = options.defaultMaxTokens ?? 4096;
-  const provider = detectProvider(resolvedModel);
-  const apiKey = getApiKey(provider, options.envSecrets);
-  const response = await PROVIDER_CALLERS[provider](apiKey, resolvedModel, task, maxTokens, options.skills);
-  return response.content;
-}
-
-export { detectProvider, getApiKey };
diff --git a/packages/sdk/src/workflows/barrier.ts b/packages/sdk/src/workflows/barrier.ts
deleted file mode 100644
index eb9d764d8..000000000
--- a/packages/sdk/src/workflows/barrier.ts
+++ /dev/null
@@ -1,239 +0,0 @@
-/**
- * Barrier Manager — synchronization barriers with all/any/majority semantics.
- *
- * Barriers gate downstream workflow steps until a set of upstream agents
- * or steps have resolved. Supports three resolution modes:
- *
- * - **all**      — every agent in `waitFor` must resolve (default)
- * - **any**      — at least one agent resolves
- * - **majority** — more than half of `waitFor` must resolve
- */
-
-import { randomBytes } from 'node:crypto';
-import { EventEmitter } from 'node:events';
-import type { DbClient } from './coordinator.js';
-
-// ── Types ───────────────────────────────────────────────────────────────────
-
-export type BarrierMode = 'all' | 'any' | 'majority';
-
-export interface BarrierDefinition {
-  name: string;
-  waitFor: string[];
-  mode?: BarrierMode;
-  timeoutMs?: number;
-}
-
-export interface BarrierRow {
-  id: string;
-  runId: string;
-  barrierName: string;
-  waitFor: string[];
-  resolved: string[];
-  isSatisfied: boolean;
-  timeoutMs: number | null;
-  createdAt: string;
-  updatedAt: string;
-}
-
-export interface BarrierManagerEvents {
-  'barrier:created': (barrier: BarrierRow) => void;
-  'barrier:resolved': (barrierName: string, agent: string) => void;
-  'barrier:satisfied': (barrier: BarrierRow) => void;
-  'barrier:timeout': (barrier: BarrierRow) => void;
-}
-
-// ── Manager ─────────────────────────────────────────────────────────────────
-
-export class BarrierManager extends EventEmitter {
-  private db: DbClient;
-  /** In-memory mode tracking (not persisted — set once at creation). */
-  private modes = new Map<string, BarrierMode>();
-  private timeoutTimers = new Map<string, ReturnType<typeof setTimeout>>();
-
-  constructor(db: DbClient) {
-    super();
-    this.db = db;
-  }
-
-  // ── Create ──────────────────────────────────────────────────────────────
-
-  /**
-   * Create a barrier for a workflow run.
-   */
-  async createBarrier(runId: string, definition: BarrierDefinition): Promise<BarrierRow> {
-    const id = `bar_${Date.now()}_${randomBytes(4).toString('hex')}`;
-    const now = new Date().toISOString();
-    const mode = definition.mode ?? 'all';
-
-    const { rows } = await this.db.query<BarrierRow>(
-      `INSERT INTO workflow_barriers (id, run_id, barrier_name, wait_for, resolved, is_satisfied, timeout_ms, created_at, updated_at)
-       VALUES ($1, $2, $3, $4, '[]'::jsonb, FALSE, $5, $6, $6)
-       RETURNING *`,
-      [id, runId, definition.name, JSON.stringify(definition.waitFor), definition.timeoutMs ?? null, now]
-    );
-
-    const barrier = rows[0];
-    const key = `${runId}:${definition.name}`;
-    this.modes.set(key, mode);
-
-    if (definition.timeoutMs) {
-      this.scheduleTimeout(barrier, definition.timeoutMs);
-    }
-
-    this.emit('barrier:created', barrier);
-    return barrier;
-  }
-
-  /**
-   * Bulk-create barriers from a list of definitions (e.g. from coordination config).
-   */
-  async createBarriers(runId: string, definitions: BarrierDefinition[]): Promise<BarrierRow[]> {
-    const results: BarrierRow[] = [];
-    for (const def of definitions) {
-      results.push(await this.createBarrier(runId, def));
-    }
-    return results;
-  }
-
-  // ── Resolve ─────────────────────────────────────────────────────────────
-
-  /**
-   * Mark an agent/step as resolved for a barrier. Returns whether the
-   * barrier is now fully satisfied.
-   */
-  async resolve(
-    runId: string,
-    barrierName: string,
-    agent: string
-  ): Promise<{ satisfied: boolean; barrier: BarrierRow }> {
-    const now = new Date().toISOString();
-
-    // Atomic: append agent to resolved array if not already present.
-    const { rows } = await this.db.query<BarrierRow>(
-      `UPDATE workflow_barriers
-       SET resolved = CASE
-             WHEN resolved @> $3::jsonb THEN resolved
-             ELSE resolved || $3::jsonb
-           END,
-           updated_at = $4
-       WHERE run_id = $1 AND barrier_name = $2 AND is_satisfied = FALSE
-       RETURNING *`,
-      [runId, barrierName, JSON.stringify(agent), now]
-    );
-
-    if (rows.length === 0) {
-      // Barrier may already be satisfied or not exist.
-      const existing = await this.getBarrier(runId, barrierName);
-      if (!existing) throw new Error(`Barrier ${barrierName} not found for run ${runId}`);
-      return { satisfied: existing.isSatisfied, barrier: existing };
-    }
-
-    const barrier = rows[0];
-    this.emit('barrier:resolved', barrierName, agent);
-
-    const key = `${runId}:${barrierName}`;
-    const mode = this.modes.get(key) ?? 'all';
-
-    if (this.checkSatisfied(barrier, mode)) {
-      return this.markSatisfied(barrier);
-    }
-
-    return { satisfied: false, barrier };
-  }
-
-  // ── Queries ─────────────────────────────────────────────────────────────
-
-  async getBarrier(runId: string, barrierName: string): Promise<BarrierRow | null> {
-    const { rows } = await this.db.query<BarrierRow>(
-      `SELECT * FROM workflow_barriers WHERE run_id = $1 AND barrier_name = $2`,
-      [runId, barrierName]
-    );
-    return rows[0] ?? null;
-  }
-
-  async getBarriers(runId: string): Promise<BarrierRow[]> {
-    const { rows } = await this.db.query<BarrierRow>(
-      `SELECT * FROM workflow_barriers WHERE run_id = $1 ORDER BY created_at ASC`,
-      [runId]
-    );
-    return rows;
-  }
-
-  async getUnsatisfiedBarriers(runId: string): Promise<BarrierRow[]> {
-    const { rows } = await this.db.query<BarrierRow>(
-      `SELECT * FROM workflow_barriers WHERE run_id = $1 AND is_satisfied = FALSE ORDER BY created_at ASC`,
-      [runId]
-    );
-    return rows;
-  }
-
-  /**
-   * Check if a named barrier is satisfied (useful for gating downstream work).
-   */
-  async isSatisfied(runId: string, barrierName: string): Promise<boolean> {
-    const barrier = await this.getBarrier(runId, barrierName);
-    return barrier?.isSatisfied ?? false;
-  }
-
-  // ── Cleanup ─────────────────────────────────────────────────────────────
-
-  cleanup(): void {
-    for (const timer of this.timeoutTimers.values()) clearTimeout(timer);
-    this.timeoutTimers.clear();
-    this.modes.clear();
-  }
-
-  // ── Private ─────────────────────────────────────────────────────────────
-
-  private checkSatisfied(barrier: BarrierRow, mode: BarrierMode): boolean {
-    const waitFor: string[] = Array.isArray(barrier.waitFor) ? barrier.waitFor : [];
-    const resolved: string[] = Array.isArray(barrier.resolved) ? barrier.resolved : [];
-
-    switch (mode) {
-      case 'all':
-        return waitFor.every((w) => resolved.includes(w));
-      case 'any':
-        return resolved.length > 0;
-      case 'majority':
-        return resolved.length > waitFor.length / 2;
-    }
-  }
-
-  private async markSatisfied(barrier: BarrierRow): Promise<{ satisfied: boolean; barrier: BarrierRow }> {
-    const now = new Date().toISOString();
-    const { rows } = await this.db.query<BarrierRow>(
-      `UPDATE workflow_barriers SET is_satisfied = TRUE, updated_at = $2
-       WHERE id = $1
-       RETURNING *`,
-      [barrier.id, now]
-    );
-
-    const updated = rows[0];
-    const key = `${barrier.runId}:${barrier.barrierName}`;
-    this.clearTimeout(key);
-    this.emit('barrier:satisfied', updated);
-
-    return { satisfied: true, barrier: updated };
-  }
-
-  private scheduleTimeout(barrier: BarrierRow, timeoutMs: number): void {
-    const key = `${barrier.runId}:${barrier.barrierName}`;
-    const timer = setTimeout(async () => {
-      const current = await this.getBarrier(barrier.runId, barrier.barrierName);
-      if (current && !current.isSatisfied) {
-        this.emit('barrier:timeout', current);
-      }
-    }, timeoutMs);
-    timer.unref();
-    this.timeoutTimers.set(key, timer);
-  }
-
-  private clearTimeout(key: string): void {
-    const timer = this.timeoutTimers.get(key);
-    if (timer) {
-      globalThis.clearTimeout(timer);
-      this.timeoutTimers.delete(key);
-    }
-  }
-}
diff --git a/packages/sdk/src/workflows/budget-tracker.ts b/packages/sdk/src/workflows/budget-tracker.ts
deleted file mode 100644
index f1ea8f76c..000000000
--- a/packages/sdk/src/workflows/budget-tracker.ts
+++ /dev/null
@@ -1,274 +0,0 @@
-export interface BudgetTrackerStepConfig {
-  stepName: string;
-  agentName: string;
-  maxTokens?: number;
-}
-
-export interface BudgetTrackerOptions {
-  perAgent?: number;
-  perWorkflow?: number;
-  workflowBudget?: number;
-  steps?: BudgetTrackerStepConfig[];
-}
-
-export interface TokenUsage {
-  input: number;
-  output: number;
-  cacheRead: number;
-  total: number;
-}
-
-export interface BudgetAvailability {
-  allowed: boolean;
-  reason?: string;
-}
-
-export interface OverBudgetResult {
-  over: boolean;
-  reason?: string;
-}
-
-export interface BudgetStatus {
-  agentLimitExceeded: boolean;
-  workflowBudgetExceeded: boolean;
-  workflowBudgetExhausted: boolean;
-}
-
-export interface StepBudgetStatus {
-  used?: number;
-  limit?: number;
-  over: boolean;
-}
-
-export interface WorkflowBudgetStatus {
-  used: number;
-  limit?: number;
-  exhausted: boolean;
-}
-
-export interface RunSummaryBudgetData {
-  steps: Map<string, StepBudgetStatus>;
-  workflow?: WorkflowBudgetStatus;
-}
-
-function emptyUsage(): TokenUsage {
-  return { input: 0, output: 0, cacheRead: 0, total: 0 };
-}
-
-function toUsage(value: number | Partial<Omit<TokenUsage, 'total'>>): TokenUsage {
-  if (typeof value === 'number') {
-    const input = Number.isFinite(value) ? Math.max(0, Math.round(value)) : 0;
-    return { input, output: 0, cacheRead: 0, total: input };
-  }
-
-  const input = Number.isFinite(value.input) ? Math.max(0, Math.round(value.input ?? 0)) : 0;
-  const output = Number.isFinite(value.output) ? Math.max(0, Math.round(value.output ?? 0)) : 0;
-  const cacheRead = Number.isFinite(value.cacheRead) ? Math.max(0, Math.round(value.cacheRead ?? 0)) : 0;
-  return {
-    input,
-    output,
-    cacheRead,
-    total: input + output,
-  };
-}
-
-function addUsage(left: TokenUsage, right: TokenUsage): TokenUsage {
-  const input = left.input + right.input;
-  const output = left.output + right.output;
-  const cacheRead = left.cacheRead + right.cacheRead;
-  return {
-    input,
-    output,
-    cacheRead,
-    total: input + output,
-  };
-}
-
-export class BudgetExceededError extends Error {
-  readonly stepName: string;
-  readonly budgetType: 'agent' | 'workflow';
-  readonly limit: number;
-  readonly actual: number;
-  readonly used: number;
-
-  constructor(stepName: string, budgetType: 'agent' | 'workflow', limit: number, actual: number) {
-    const qualifier = budgetType === 'workflow' ? 'workflow budget exhausted' : 'agent budget exceeded';
-    super(`Step "${stepName}" cannot continue: ${qualifier} (${actual}/${limit})`);
-    this.name = 'BudgetExceededError';
-    this.stepName = stepName;
-    this.budgetType = budgetType;
-    this.limit = limit;
-    this.actual = actual;
-    this.used = actual;
-  }
-}
-
-export class BudgetTracker {
-  private readonly defaultAgentBudget?: number;
-  private readonly workflowBudget?: number;
-  private readonly stepLimits = new Map<string, number | undefined>();
-  private readonly stepUsage = new Map<string, TokenUsage>();
-  private totalUsage: TokenUsage = emptyUsage();
-  private workflowBudgetExhausted = false;
-
-  constructor(options: BudgetTrackerOptions) {
-    this.defaultAgentBudget = options.perAgent;
-    this.workflowBudget = options.workflowBudget ?? options.perWorkflow;
-
-    for (const step of options.steps ?? []) {
-      this.stepLimits.set(step.stepName, step.maxTokens);
-    }
-  }
-
-  recordUsage(stepName: string, usage: number | Partial<Omit<TokenUsage, 'total'>>): void {
-    const normalized = toUsage(usage);
-    const current = this.stepUsage.get(stepName) ?? emptyUsage();
-    const next = addUsage(current, normalized);
-    this.stepUsage.set(stepName, next);
-    this.totalUsage = addUsage(this.totalUsage, normalized);
-
-    if (this.workflowBudget !== undefined && this.totalUsage.total >= this.workflowBudget) {
-      this.workflowBudgetExhausted = true;
-    }
-  }
-
-  getStepUsage(stepName: string): TokenUsage {
-    return this.stepUsage.get(stepName) ?? emptyUsage();
-  }
-
-  getTotalUsage(): TokenUsage {
-    return this.totalUsage;
-  }
-
-  getRemainingBudget(): { agent?: number; workflow?: number } {
-    return {
-      agent:
-        this.defaultAgentBudget !== undefined
-          ? Math.max(0, this.defaultAgentBudget - this.totalUsage.total)
-          : undefined,
-      workflow:
-        this.workflowBudget !== undefined
-          ? Math.max(0, this.workflowBudget - this.totalUsage.total)
-          : undefined,
-    };
-  }
-
-  checkCanSpawn(stepName: string): BudgetAvailability {
-    if (this.workflowBudget !== undefined && this.totalUsage.total >= this.workflowBudget) {
-      return {
-        allowed: false,
-        reason: `Cannot spawn ${stepName}: workflow budget exceeded (${this.totalUsage.total}/${this.workflowBudget})`,
-      };
-    }
-
-    if (this.workflowBudget !== undefined) {
-      const remainingWorkflowBudget = this.workflowBudget - this.totalUsage.total;
-      const stepLimit = this.getStepLimit(stepName);
-      const minimumHeadroom =
-        stepLimit !== undefined
-          ? Math.min(stepLimit, this.workflowBudget)
-          : this.defaultAgentBudget !== undefined
-            ? Math.ceil(this.defaultAgentBudget * 0.1)
-            : Math.ceil(this.workflowBudget * 0.1);
-
-      if (remainingWorkflowBudget <= minimumHeadroom) {
-        return {
-          allowed: false,
-          reason:
-            stepLimit !== undefined
-              ? `Cannot spawn ${stepName}: remaining workflow budget ${remainingWorkflowBudget} is below step budget ${stepLimit}`
-              : this.defaultAgentBudget !== undefined
-                ? `Cannot spawn ${stepName}: remaining workflow budget ${remainingWorkflowBudget} ` +
-                  `is below 10% of per-agent budget ${this.defaultAgentBudget}`
-                : `Cannot spawn ${stepName}: remaining workflow budget ${remainingWorkflowBudget} ` +
-                  `is below 10% headroom threshold for workflow budget ${this.workflowBudget}`,
-        };
-      }
-    }
-
-    return { allowed: true };
-  }
-
-  isOverBudget(stepName: string): OverBudgetResult {
-    const stepUsage = this.getStepUsage(stepName);
-    const stepLimit = this.getStepLimit(stepName);
-    if (stepLimit !== undefined && stepUsage.total > stepLimit) {
-      return {
-        over: true,
-        reason: `Step "${stepName}" exceeded per-agent budget (${stepUsage.total}/${stepLimit})`,
-      };
-    }
-
-    if (this.workflowBudget !== undefined && this.totalUsage.total > this.workflowBudget) {
-      return {
-        over: true,
-        reason: `Workflow exceeded total budget (${this.totalUsage.total}/${this.workflowBudget})`,
-      };
-    }
-
-    return { over: false };
-  }
-
-  getBudgetStatus(stepName: string): BudgetStatus {
-    const stepUsage = this.getStepUsage(stepName);
-    const stepLimit = this.getStepLimit(stepName);
-    return {
-      agentLimitExceeded: stepLimit !== undefined && stepUsage.total > stepLimit,
-      workflowBudgetExceeded:
-        this.workflowBudget !== undefined && this.totalUsage.total > this.workflowBudget,
-      workflowBudgetExhausted:
-        this.workflowBudget !== undefined &&
-        (this.workflowBudgetExhausted || this.totalUsage.total >= this.workflowBudget),
-    };
-  }
-
-  getStepBudgetStatus(stepName: string): StepBudgetStatus | undefined {
-    const usage = this.stepUsage.get(stepName);
-    const hasExplicitLimit = this.stepLimits.has(stepName);
-    const limit = this.getStepLimit(stepName);
-
-    if (!usage && !hasExplicitLimit && limit === undefined) {
-      return undefined;
-    }
-
-    return {
-      used: usage?.total,
-      limit,
-      over: limit !== undefined && (usage?.total ?? 0) > limit,
-    };
-  }
-
-  getRunSummaryBudgetData(): RunSummaryBudgetData | undefined {
-    const steps = new Map<string, StepBudgetStatus>();
-    const stepNames = new Set<string>([...this.stepLimits.keys(), ...this.stepUsage.keys()]);
-
-    for (const stepName of stepNames) {
-      const status = this.getStepBudgetStatus(stepName);
-      if (status) {
-        steps.set(stepName, status);
-      }
-    }
-
-    const workflow =
-      this.workflowBudget !== undefined || this.totalUsage.total > 0
-        ? {
-            used: this.totalUsage.total,
-            limit: this.workflowBudget,
-            exhausted:
-              this.workflowBudget !== undefined &&
-              (this.workflowBudgetExhausted || this.totalUsage.total >= this.workflowBudget),
-          }
-        : undefined;
-
-    if (steps.size === 0 && !workflow) {
-      return undefined;
-    }
-
-    return { steps, workflow };
-  }
-
-  private getStepLimit(stepName: string): number | undefined {
-    const limit = this.stepLimits.get(stepName);
-    return limit ?? this.defaultAgentBudget;
-  }
-}
diff --git a/packages/sdk/src/workflows/builder.ts b/packages/sdk/src/workflows/builder.ts
deleted file mode 100644
index f2eb1f8f7..000000000
--- a/packages/sdk/src/workflows/builder.ts
+++ /dev/null
@@ -1,594 +0,0 @@
-import path from 'node:path';
-import { stringify as stringifyYaml } from 'yaml';
-
-import type { AgentRelayOptions } from '../relay.js';
-import type {
-  AgentCli,
-  AgentDefinition,
-  AgentPreset,
-  Barrier,
-  CoordinationConfig,
-  DryRunReport,
-  ErrorHandlingConfig,
-  IdleNudgeConfig,
-  PathDefinition,
-  RelayYamlConfig,
-  StateConfig,
-  SwarmPattern,
-  TrajectoryConfig,
-  VerificationCheck,
-  WorkflowDefinition,
-  WorkflowExecuteOptions,
-  WorkflowRunRow,
-  WorkflowStep,
-} from './types.js';
-import { JsonFileWorkflowDb } from './file-db.js';
-import { WorkflowRunner, type WorkflowEventListener } from './runner.js';
-import type { RunnerStepExecutor } from './types.js';
-import { formatDryRunReport } from './dry-run-format.js';
-import { createDefaultEventLogger, type LogLevel } from './default-logger.js';
-import { runInCloud, type CloudRunOptions } from './cloud-runner.js';
-import type { VariableContext } from './template-resolver.js';
-
-// ── Option types for the builder API ────────────────────────────────────────
-
-export interface AgentOptions {
-  cli: AgentCli;
-  role?: string;
-  task?: string;
-  channels?: string[];
-  model?: string;
-  maxTokens?: number;
-  timeoutMs?: number;
-  retries?: number;
-  /**
-   * Seconds of silence on the agent's PTY before the runtime marks it idle and
-   * tears it down. Default: 30s. Set to `0` to disable idle detection entirely.
-   *
-   * When to override (per-agent):
-   *   - You expect long quiet stretches by design — a long-running reviewer
-   *     waiting for downstream verdicts, a grader watching a file that updates
-   *     every few minutes, or a `@-mention` recipient whose triggering event
-   *     may arrive >30s after spawn. Setting `0` (or a generous N) prevents
-   *     the runtime from killing the agent before the awaited event arrives.
-   *
-   * When NOT to override:
-   *   - One-shot worker steps. The default is right; idle-as-complete is what
-   *     makes `OWNER_DECISION: COMPLETE` + clean exit fast.
-   *
-   * See the `writing-agent-relay-workflows` skill ("Idle detection beats
-   * 'wait for X' prompts") for the trade-offs around long-running interactive
-   * agents and the Per-turn interactive spawn alternative.
-   */
-  idleThresholdSecs?: number;
-  /** When false, the agent runs as a non-interactive subprocess (no PTY, no relay messaging).
-   *  Default: true. */
-  interactive?: boolean;
-  /** Agent preset: 'lead' (interactive PTY), 'worker' | 'reviewer' | 'analyst' (non-interactive subprocess). */
-  preset?: AgentPreset;
-  /** Skills to make available to the agent (for API-mode agents). */
-  skills?: string;
-}
-
-/** Options for agent steps (default). */
-export interface AgentStepOptions {
-  agent: string;
-  task: string;
-  cwd?: string;
-  dependsOn?: string[];
-  verification?: VerificationCheck;
-  timeoutMs?: number;
-  retries?: number;
-}
-
-/** Options for deterministic (shell command) steps. */
-export interface DeterministicStepOptions {
-  type: 'deterministic';
-  command: string;
-  cwd?: string;
-  /** Capture stdout as step output for downstream steps. Default: true. */
-  captureOutput?: boolean;
-  /** Fail if command exit code is non-zero. Default: true. */
-  failOnError?: boolean;
-  dependsOn?: string[];
-  verification?: VerificationCheck;
-  timeoutMs?: number;
-}
-
-/** Options for worktree steps (create/checkout git worktrees). */
-export interface WorktreeStepOptions {
-  type: 'worktree';
-  branch: string;
-  baseBranch?: string;
-  path?: string;
-  createBranch?: boolean;
-  dependsOn?: string[];
-  timeoutMs?: number;
-}
-
-export type StepOptions = AgentStepOptions | DeterministicStepOptions | WorktreeStepOptions;
-
-export interface ErrorOptions {
-  maxRetries?: number;
-  retryDelayMs?: number;
-  notifyChannel?: string;
-  repairAgent?: string;
-  repairRetries?: number;
-}
-
-export type ReliabilityOptions = ErrorOptions;
-
-export interface WorkflowRunOptions {
-  /** Run a specific workflow by name (default: first). */
-  workflow?: string;
-  /** Template variable substitutions. */
-  vars?: VariableContext;
-  /** Working directory (default: process.cwd()). */
-  cwd?: string;
-  /** AgentRelay options (all optional). */
-  relay?: AgentRelayOptions;
-  /** Progress callback. */
-  onEvent?: WorkflowEventListener;
-  /** Validate and print execution plan without spawning agents. */
-  dryRun?: boolean;
-  /** External step executor (e.g. Daytona sandbox backend). */
-  executor?: RunnerStepExecutor;
-  /** Start from a specific step, skipping all predecessors. */
-  startFrom?: string;
-  /** Previous run ID whose cached outputs are used with startFrom. */
-  previousRunId?: string;
-  /** Console log verbosity: "verbose" | "normal" (default) | "quiet" | false (silent). */
-  logLevel?: LogLevel;
-  /** Renderer: "listr" for listr2 UI, "default" for console logger, false to disable. */
-  renderer?: 'listr' | 'default' | false;
-  /** Run the workflow in the cloud instead of locally. */
-  cloud?: boolean;
-  /** Cloud API base URL (or set CLOUD_API_URL env var). */
-  cloudApiUrl?: string;
-  /** Cloud API authentication token (or set CLOUD_API_TOKEN env var). */
-  cloudApiToken?: string;
-  /** Environment secrets to forward to cloud agents. */
-  envSecrets?: Record<string, string>;
-  /** Polling interval in ms for cloud run status checks. */
-  cloudPollIntervalMs?: number;
-  /** Callback invoked when the cloud run status changes. */
-  onCloudStatusChange?: (status: string, runId: string) => void;
-}
-
-// ── WorkflowBuilder ─────────────────────────────────────────────────────────
-
-/**
- * Fluent builder for constructing workflow configurations programmatically.
- *
- * @example
- * ```typescript
- * import { workflow } from "@agent-relay/sdk/workflows";
- *
- * const result = await workflow("my-workflow")
- *   .pattern("dag")
- *   .agent("worker", { cli: "claude", role: "Backend engineer" })
- *   .step("build", { agent: "worker", task: "Build the project" })
- *   .step("test", { agent: "worker", task: "Run tests", dependsOn: ["build"] })
- *   .run();
- * ```
- */
-export class WorkflowBuilder {
-  private _name: string;
-  private _description?: string;
-  private _pattern: SwarmPattern = 'dag';
-  private _maxConcurrency?: number;
-  private _timeoutMs?: number;
-  private _channel?: string;
-  private _idleNudge?: IdleNudgeConfig;
-  private _paths?: PathDefinition[];
-  private _agents: AgentDefinition[] = [];
-  private _steps: WorkflowStep[] = [];
-  private _errorHandling?: ErrorHandlingConfig;
-  private _coordination?: CoordinationConfig;
-  private _state?: StateConfig;
-  private _trajectories?: TrajectoryConfig | false;
-  private _startFrom?: string;
-  private _previousRunId?: string;
-
-  constructor(name: string) {
-    this._name = name;
-  }
-
-  /** Set workflow description. */
-  description(desc: string): this {
-    this._description = desc;
-    return this;
-  }
-
-  /** Set swarm pattern (default: "dag"). */
-  pattern(p: SwarmPattern): this {
-    this._pattern = p;
-    return this;
-  }
-
-  /** Set maximum concurrent agents. */
-  maxConcurrency(n: number): this {
-    this._maxConcurrency = n;
-    return this;
-  }
-
-  /** Set global timeout in milliseconds. */
-  timeout(ms: number): this {
-    this._timeoutMs = ms;
-    return this;
-  }
-
-  /** Set the relay channel for agent communication. */
-  channel(ch: string): this {
-    const CHANNEL_RE = /^[a-z0-9][a-z0-9-]*$/;
-    if (!CHANNEL_RE.test(ch)) {
-      throw new Error(
-        `Invalid channel name "${ch}". Channel names must be lowercase alphanumeric and hyphens, starting with a letter or number. ` +
-          `Fix: use .toLowerCase().replace(/[^a-z0-9-]/g, '-').replace(/-+/g, '-').replace(/^-|-$/g, '')`
-      );
-    }
-    this._channel = ch;
-    return this;
-  }
-
-  /** Configure idle agent detection and nudging for interactive agents. */
-  idleNudge(config: IdleNudgeConfig): this {
-    this._idleNudge = config;
-    return this;
-  }
-
-  /** Set workflow coordination settings (barriers, voting threshold, consensus strategy). */
-  coordination(config: CoordinationConfig): this {
-    this._coordination = config;
-    return this;
-  }
-
-  /** Configure shared workflow state backend settings. */
-  state(config: StateConfig): this {
-    this._state = config;
-    return this;
-  }
-
-  /** Configure trajectory recording, or pass `false` to disable it. */
-  trajectories(config: TrajectoryConfig | false): this {
-    this._trajectories = config;
-    return this;
-  }
-
-  /** Start execution from a specific step, skipping all predecessor steps. */
-  startFrom(stepName: string): this {
-    this._startFrom = stepName;
-    return this;
-  }
-
-  /** Set the previous run ID whose cached step outputs should be used with startFrom. */
-  previousRunId(id: string): this {
-    this._previousRunId = id;
-    return this;
-  }
-
-  /**
-   * Declare named paths to additional directories the workflow needs.
-   *
-   * For multi-repo cloud workflows (relay#774, cloud#302), each entry is
-   * tarballed by the CLI at submit time and mounted at
-   * `/home/daytona/workspace/{name}/` in the sandbox. Locally, the runner
-   * resolves `path` relative to the workflow file's parent directory and
-   * agents reference each entry by its declared `name`.
-   *
-   * Calling this is a no-op for the runtime — the runner doesn't need
-   * `paths` to execute steps. The CLI and the cloud bootstrap consume
-   * it. Declaring via the builder keeps single-source-of-truth for tools
-   * that walk the built config (e.g. dashboards, dry-run reports).
-   */
-  paths(paths: PathDefinition[]): this {
-    if (!Array.isArray(paths)) {
-      throw new Error('.paths() expects an array of PathDefinition objects');
-    }
-    const seen = new Set<string>();
-    for (const p of paths) {
-      if (!p || typeof p.name !== 'string' || typeof p.path !== 'string') {
-        throw new Error('.paths() entries must each have string `name` and `path` fields');
-      }
-      if (seen.has(p.name)) {
-        throw new Error(`.paths() got duplicate entry name "${p.name}"`);
-      }
-      seen.add(p.name);
-    }
-    this._paths = paths.map((p) => ({ ...p }));
-    return this;
-  }
-
-  /** Add an agent definition. */
-  agent(name: string, options: AgentOptions): this {
-    const def: AgentDefinition = {
-      name,
-      cli: options.cli,
-    };
-
-    if (options.role !== undefined) def.role = options.role;
-    if (options.task !== undefined) def.task = options.task;
-    if (options.channels !== undefined) def.channels = options.channels;
-    if (options.preset !== undefined) def.preset = options.preset;
-    if (options.interactive !== undefined) def.interactive = options.interactive;
-    if (options.skills !== undefined) def.skills = options.skills;
-
-    if (
-      options.model !== undefined ||
-      options.maxTokens !== undefined ||
-      options.timeoutMs !== undefined ||
-      options.retries !== undefined ||
-      options.idleThresholdSecs !== undefined
-    ) {
-      def.constraints = {};
-      if (options.model !== undefined) def.constraints.model = options.model;
-      if (options.maxTokens !== undefined) def.constraints.maxTokens = options.maxTokens;
-      if (options.timeoutMs !== undefined) def.constraints.timeoutMs = options.timeoutMs;
-      if (options.retries !== undefined) def.constraints.retries = options.retries;
-      if (options.idleThresholdSecs !== undefined)
-        def.constraints.idleThresholdSecs = options.idleThresholdSecs;
-    }
-
-    this._agents.push(def);
-    return this;
-  }
-
-  /** Add a workflow step (agent or deterministic). */
-  step(name: string, options: StepOptions): this {
-    const step: WorkflowStep = { name };
-
-    if ('type' in options && options.type === 'deterministic') {
-      if (!options.command) {
-        throw new Error('deterministic steps must have a command');
-      }
-      if ('agent' in options || 'task' in options) {
-        throw new Error('deterministic steps must not have agent or task');
-      }
-      step.type = 'deterministic';
-      step.command = options.command;
-      if (options.cwd !== undefined) step.cwd = options.cwd;
-      if (options.captureOutput !== undefined) step.captureOutput = options.captureOutput;
-      if (options.failOnError !== undefined) step.failOnError = options.failOnError;
-      if (options.dependsOn !== undefined) step.dependsOn = options.dependsOn;
-      if (options.verification !== undefined) step.verification = options.verification;
-      if (options.timeoutMs !== undefined) step.timeoutMs = options.timeoutMs;
-    } else if ('type' in options && options.type === 'worktree') {
-      if ('agent' in options || 'task' in options) {
-        throw new Error('worktree steps must not have agent or task');
-      }
-      step.type = 'worktree';
-      step.branch = options.branch;
-      if (options.baseBranch !== undefined) step.baseBranch = options.baseBranch;
-      if (options.path !== undefined) step.path = options.path;
-      if (options.createBranch !== undefined) step.createBranch = options.createBranch;
-      if (options.dependsOn !== undefined) step.dependsOn = options.dependsOn;
-      if (options.timeoutMs !== undefined) step.timeoutMs = options.timeoutMs;
-    } else {
-      // Agent step
-      const agentOpts = options as AgentStepOptions;
-      if (!agentOpts.agent || !agentOpts.task) {
-        throw new Error('Agent steps must have both agent and task');
-      }
-      step.agent = agentOpts.agent;
-      step.task = agentOpts.task;
-      if (agentOpts.cwd !== undefined) step.cwd = agentOpts.cwd;
-      if (agentOpts.dependsOn !== undefined) step.dependsOn = agentOpts.dependsOn;
-      if (agentOpts.verification !== undefined) step.verification = agentOpts.verification;
-      if (agentOpts.timeoutMs !== undefined) step.timeoutMs = agentOpts.timeoutMs;
-      if (agentOpts.retries !== undefined) step.retries = agentOpts.retries;
-    }
-
-    this._steps.push(step);
-    return this;
-  }
-
-  /** Set error handling strategy. */
-  onError(strategy: 'fail-fast' | 'continue' | 'retry', options?: ErrorOptions): this {
-    this._errorHandling = { strategy };
-    if (options?.maxRetries !== undefined) this._errorHandling.maxRetries = options.maxRetries;
-    if (options?.retryDelayMs !== undefined) this._errorHandling.retryDelayMs = options.retryDelayMs;
-    if (options?.notifyChannel !== undefined) this._errorHandling.notifyChannel = options.notifyChannel;
-    if (options?.repairAgent !== undefined) this._errorHandling.repairAgent = options.repairAgent;
-    if (options?.repairRetries !== undefined) this._errorHandling.repairRetries = options.repairRetries;
-    return this;
-  }
-
-  /**
-   * Opt into the product reliability contract: repairable workflow failures get
-   * routed through an agent and retried before the workflow is allowed to fail.
-   */
-  repairable(options: ReliabilityOptions = {}): this {
-    return this.onError('retry', {
-      maxRetries: options.maxRetries ?? options.repairRetries ?? 2,
-      retryDelayMs: options.retryDelayMs ?? 1000,
-      notifyChannel: options.notifyChannel,
-      repairAgent: options.repairAgent,
-      repairRetries: options.repairRetries ?? options.maxRetries ?? 2,
-    });
-  }
-
-  /** Alias for `.repairable()` for workflow authors who think in product terms. */
-  reliable(options: ReliabilityOptions = {}): this {
-    return this.repairable(options);
-  }
-
-  private validateBuilderState(): void {
-    const hasAgentSteps = this._steps.some((s) => s.type !== 'deterministic' && s.type !== 'worktree');
-    if (hasAgentSteps && this._agents.length === 0) {
-      throw new Error('Workflow must have at least one agent when using agent steps');
-    }
-    if (this._steps.length === 0) {
-      throw new Error('Workflow must have at least one step');
-    }
-
-    const agentNames = new Set(this._agents.map((agent) => agent.name));
-    for (const step of this._steps) {
-      const diagnosticAgent = step.verification?.diagnosticAgent;
-      if (!diagnosticAgent) continue;
-
-      if (!agentNames.has(diagnosticAgent)) {
-        throw new Error(`Step "${step.name}" references unknown diagnosticAgent "${diagnosticAgent}"`);
-      }
-
-      if (step.retries === undefined || step.retries === 0) {
-        console.warn(
-          `Step "${step.name}": diagnosticAgent configured but no retries — diagnostic will never run`
-        );
-      }
-    }
-  }
-
-  /** Build and return the RelayYamlConfig object. */
-  toConfig(): RelayYamlConfig {
-    this.validateBuilderState();
-
-    const wfDef: WorkflowDefinition = {
-      name: `${this._name}-workflow`,
-      steps: [...this._steps],
-    };
-
-    const config: RelayYamlConfig = {
-      version: '1.0',
-      name: this._name,
-      swarm: {
-        pattern: this._pattern,
-      },
-      agents: [...this._agents],
-      workflows: [wfDef],
-    };
-
-    if (this._description !== undefined) config.description = this._description;
-    if (this._paths !== undefined && this._paths.length > 0) {
-      config.paths = this._paths.map((p) => ({ ...p }));
-    }
-    if (this._maxConcurrency !== undefined) config.swarm.maxConcurrency = this._maxConcurrency;
-    if (this._timeoutMs !== undefined) config.swarm.timeoutMs = this._timeoutMs;
-    if (this._channel !== undefined) config.swarm.channel = this._channel;
-    if (this._idleNudge !== undefined) config.swarm.idleNudge = this._idleNudge;
-    config.errorHandling = this._errorHandling ?? {
-      strategy: 'retry',
-      maxRetries: 2,
-      retryDelayMs: 1000,
-      repairRetries: 2,
-    };
-    if (this._coordination !== undefined) config.coordination = this._coordination;
-    if (this._state !== undefined) config.state = this._state;
-    if (this._trajectories !== undefined) config.trajectories = this._trajectories;
-
-    return config;
-  }
-
-  /** Serialize the config to a YAML string. */
-  toYaml(): string {
-    return stringifyYaml(this.toConfig());
-  }
-
-  /** Build the config and execute it with the WorkflowRunner. */
-  async run(options: WorkflowRunOptions & { dryRun: true }): Promise<DryRunReport>;
-  async run(options?: WorkflowRunOptions): Promise<WorkflowRunRow>;
-  async run(options: WorkflowRunOptions = {}): Promise<WorkflowRunRow | DryRunReport> {
-    const config = this.toConfig();
-    const runnerCwd = options.cwd ?? process.cwd();
-    const dbPath = path.join(runnerCwd, '.agent-relay', 'workflow-runs.jsonl');
-    const db = new JsonFileWorkflowDb(dbPath);
-
-    const runner = new WorkflowRunner({
-      cwd: options.cwd,
-      relay: options.relay,
-      executor: options.executor,
-      envSecrets: options.envSecrets,
-      db,
-    });
-
-    // Auto-detect DRY_RUN env var so existing scripts get dry-run for free
-    const isDryRun = options.dryRun ?? !!process.env.DRY_RUN;
-
-    if (isDryRun) {
-      const report = runner.dryRun(config, options.workflow, options.vars);
-      console.log(formatDryRunReport(report));
-      return report;
-    }
-
-    // Cloud execution path — submit to remote API and poll for completion
-    if (options.cloud) {
-      const cloudApiUrl = options.cloudApiUrl ?? process.env.CLOUD_API_URL;
-      const cloudApiToken = options.cloudApiToken ?? process.env.CLOUD_API_TOKEN;
-      if (!cloudApiUrl) throw new Error('cloud: true requires cloudApiUrl or CLOUD_API_URL env var');
-      if (!cloudApiToken) throw new Error('cloud: true requires cloudApiToken or CLOUD_API_TOKEN env var');
-      return runInCloud(config, {
-        cloudApiUrl,
-        cloudApiToken,
-        envSecrets: options.envSecrets,
-        pollIntervalMs: options.cloudPollIntervalMs,
-        timeoutMs: this._timeoutMs,
-        onStatusChange: options.onCloudStatusChange,
-      });
-    }
-
-    // Wire up default console logger unless explicitly disabled
-    // renderer: "listr" owns the terminal — skip console logger to avoid garbled output
-    // renderer: false implies no output at all
-    const logLevel =
-      options.renderer === 'listr' || options.renderer === false ? false : (options.logLevel ?? 'normal');
-    if (logLevel !== false) {
-      runner.on(createDefaultEventLogger(logLevel));
-    }
-
-    // Wire up user-provided event handler (additive — does not replace the default logger)
-    if (options.onEvent) {
-      runner.on(options.onEvent);
-    }
-
-    // Auto-detect RESUME_RUN_ID env var for resuming failed runs
-    const resumeRunId = process.env.RESUME_RUN_ID;
-
-    const startFrom = this._startFrom ?? options.startFrom ?? process.env.START_FROM;
-    const previousRunId = this._previousRunId ?? options.previousRunId ?? process.env.PREVIOUS_RUN_ID;
-    const executeOptions: WorkflowExecuteOptions | undefined = startFrom
-      ? { startFrom, previousRunId }
-      : undefined;
-
-    // If listr renderer requested, wire it up and run concurrently
-    // Must be set up BEFORE the resume check so resume runs also get event output
-    if (options.renderer === 'listr') {
-      const { createWorkflowRenderer } = await import('./listr-renderer.js');
-      const renderer = createWorkflowRenderer();
-      runner.on(renderer.onEvent);
-
-      const runPromise = resumeRunId
-        ? runner.resume(resumeRunId, options.vars, config)
-        : runner.execute(config, options.workflow, options.vars, executeOptions);
-
-      try {
-        const [result] = await Promise.all([runPromise, renderer.start()]);
-        return result;
-      } finally {
-        renderer.unmount();
-      }
-    }
-
-    if (resumeRunId) {
-      return runner.resume(resumeRunId, options.vars, config);
-    }
-
-    return runner.execute(config, options.workflow, options.vars, executeOptions);
-  }
-}
-
-// ── Entry point ─────────────────────────────────────────────────────────────
-
-/**
- * Create a new workflow builder.
- *
- * @example
- * ```typescript
- * const result = await workflow("my-task")
- *   .pattern("fan-out")
- *   .agent("worker", { cli: "claude" })
- *   .step("do-work", { agent: "worker", task: "Build the feature" })
- *   .run();
- * ```
- */
-export function workflow(name: string): WorkflowBuilder {
-  return new WorkflowBuilder(name);
-}
diff --git a/packages/sdk/src/workflows/builtin-templates/bug-fix.yaml b/packages/sdk/src/workflows/builtin-templates/bug-fix.yaml
deleted file mode 100644
index 7396636fa..000000000
--- a/packages/sdk/src/workflows/builtin-templates/bug-fix.yaml
+++ /dev/null
@@ -1,139 +0,0 @@
-version: '1.0'
-name: bug-fix
-description: 'Blueprint-style bug investigation and remediation with validation gates.'
-swarm:
-  pattern: hub-spoke
-  maxConcurrency: 2
-  timeoutMs: 2700000
-  channel: swarm-bug-fix
-  idleNudge:
-    nudgeAfterMs: 120000
-    escalateAfterMs: 120000
-    maxNudges: 1
-agents:
-  - name: lead
-    cli: claude
-    role: 'Coordinates debugging and release decisions'
-    permissions: { access: full }
-  - name: investigator
-    cli: codex
-    role: 'Reproduces and scopes the defect'
-    permissions: { access: readonly }
-    interactive: false
-  - name: fixer
-    cli: codex
-    role: 'Implements and tests the fix'
-    permissions: { access: readwrite }
-    interactive: false
-  - name: verifier
-    cli: claude
-    role: 'Validates risk, regressions, and completion'
-    permissions: { access: readonly }
-workflows:
-  - name: bug-remediation
-    description: 'Investigate root cause, patch safely, and verify no regressions.'
-    onError: retry
-    preflight:
-      - command: git status --porcelain
-        failIf: non-empty
-        description: 'Ensure working directory is clean'
-      - command: npm test 2>/dev/null || echo "baseline"
-        description: 'Capture baseline test state'
-    steps:
-      # Agent: Investigate root cause
-      - name: investigate
-        type: agent
-        agent: investigator
-        task: |
-          Reproduce the issue, identify root cause, and provide a fix strategy:
-          {{task}}
-        verification:
-          type: output_contains
-          value: ROOT_CAUSE_IDENTIFIED
-
-      # Deterministic: Create fix branch
-      - name: create-branch
-        type: deterministic
-        dependsOn: [investigate]
-        command: git checkout -b fix/{{branch-name}}
-
-      # Agent: Implement the fix
-      - name: patch
-        type: agent
-        agent: fixer
-        dependsOn: [create-branch]
-        task: |
-          Implement the fix based on the investigation report:
-          {{steps.investigate.output}}
-        retries: 2
-        verification:
-          type: output_contains
-          value: PATCH_APPLIED
-
-      # Deterministic: Run tests
-      - name: test
-        type: deterministic
-        dependsOn: [patch]
-        command: npm test
-
-      # Agent: Fix test failures if any (with iteration limit)
-      - name: fix-if-broken
-        type: agent
-        agent: fixer
-        dependsOn: [test]
-        task: |
-          Review test results. If tests failed, fix them. If all passed, output TESTS_PASSED.
-          Test output: {{steps.test.output}}
-        maxIterations: 2
-        verification:
-          type: output_contains
-          value: TESTS_PASSED
-
-      # Deterministic: Commit
-      - name: commit
-        type: deterministic
-        dependsOn: [fix-if-broken]
-        command: 'git add -A && git commit -m "fix: {{steps.investigate.output | first-line}}"'
-
-      # Agent: Verify no regressions
-      - name: regression-check
-        type: agent
-        agent: verifier
-        dependsOn: [commit]
-        task: |
-          Validate the patch for correctness and regression risk:
-          {{steps.patch.output}}
-        verification:
-          type: output_contains
-          value: VERIFICATION_COMPLETE
-
-      # Deterministic: Push to remote
-      - name: push
-        type: deterministic
-        dependsOn: [regression-check]
-        command: git push origin fix/{{branch-name}}
-
-      # Agent: Closeout
-      - name: closeout
-        type: agent
-        agent: lead
-        dependsOn: [push]
-        task: |
-          Prepare final incident summary, residual risk, and deployment notes.
-        verification:
-          type: output_contains
-          value: DONE
-coordination:
-  barriers:
-    - name: fix-ready
-      waitFor: [investigate, patch, regression-check]
-      timeoutMs: 600000
-state:
-  backend: memory
-  ttlMs: 43200000
-  namespace: bug-fix
-errorHandling:
-  strategy: retry
-  maxRetries: 3
-  retryDelayMs: 3000
-  notifyChannel: swarm-bug-fix
diff --git a/packages/sdk/src/workflows/builtin-templates/code-review.yaml b/packages/sdk/src/workflows/builtin-templates/code-review.yaml
deleted file mode 100644
index f606f786e..000000000
--- a/packages/sdk/src/workflows/builtin-templates/code-review.yaml
+++ /dev/null
@@ -1,137 +0,0 @@
-version: '1.0'
-name: code-review
-description: 'Blueprint-style parallel code review with deterministic diff capture.'
-swarm:
-  pattern: fan-out
-  maxConcurrency: 4
-  timeoutMs: 2400000
-  channel: swarm-code-review
-  idleNudge:
-    nudgeAfterMs: 120000
-    escalateAfterMs: 120000
-    maxNudges: 1
-agents:
-  - name: lead
-    cli: claude
-    role: 'Aggregates review output and final recommendations'
-    permissions: { access: full }
-  - name: reviewer-architecture
-    cli: codex
-    role: 'Assesses architecture and maintainability'
-    permissions: { access: readonly }
-    interactive: false
-  - name: reviewer-correctness
-    cli: claude
-    role: 'Assesses correctness and testing'
-    permissions: { access: readonly }
-    interactive: false
-  - name: reviewer-security
-    cli: gemini
-    role: 'Assesses security posture and abuse resistance'
-    permissions: { access: readonly }
-    interactive: false
-workflows:
-  - name: parallel-review
-    description: 'Run focused reviews in parallel and synthesize final guidance.'
-    onError: fail
-    preflight:
-      - command: git diff --stat HEAD~1 2>/dev/null || git diff --stat 2>/dev/null || echo "No diff available"
-        description: 'Check there are changes to review'
-    steps:
-      # Deterministic: Capture diff for review
-      - name: capture-diff
-        type: deterministic
-        command: git diff HEAD~1 2>/dev/null || git diff 2>/dev/null || echo "No changes"
-        captureOutput: true
-
-      # Deterministic: Capture file list
-      - name: capture-files
-        type: deterministic
-        dependsOn: [capture-diff]
-        command: git diff --name-only HEAD~1 2>/dev/null || git diff --name-only 2>/dev/null || echo "No files"
-
-      # Agent: Prepare context
-      - name: prepare-context
-        type: agent
-        agent: lead
-        dependsOn: [capture-diff, capture-files]
-        task: |
-          Summarize change intent, impacted modules, and review priorities:
-          {{task}}
-
-          Changed files: {{steps.capture-files.output}}
-        verification:
-          type: output_contains
-          value: REVIEW_CONTEXT_READY
-
-      # Agent: Architecture review (parallel)
-      - name: architecture-pass
-        type: agent
-        agent: reviewer-architecture
-        dependsOn: [prepare-context]
-        task: |
-          Review architecture, coupling, and long-term maintainability:
-          {{steps.prepare-context.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-        verification:
-          type: output_contains
-          value: ARCH_REVIEW_COMPLETE
-
-      # Agent: Correctness review (parallel)
-      - name: correctness-pass
-        type: agent
-        agent: reviewer-correctness
-        dependsOn: [prepare-context]
-        task: |
-          Review behavior, tests, and likely regression paths:
-          {{steps.prepare-context.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-        verification:
-          type: output_contains
-          value: CORRECTNESS_REVIEW_COMPLETE
-
-      # Agent: Security review (parallel)
-      - name: security-pass
-        type: agent
-        agent: reviewer-security
-        dependsOn: [prepare-context]
-        task: |
-          Review attack surface, secret handling, and input validation:
-          {{steps.prepare-context.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-        verification:
-          type: output_contains
-          value: SECURITY_REVIEW_COMPLETE
-
-      # Agent: Consolidate findings
-      - name: consolidate
-        type: agent
-        agent: lead
-        dependsOn: [architecture-pass, correctness-pass, security-pass]
-        task: |
-          Produce merged findings, severity levels, and final recommendation.
-          Architecture review: {{steps.architecture-pass.output}}
-          Correctness review: {{steps.correctness-pass.output}}
-          Security review: {{steps.security-pass.output}}
-        verification:
-          type: output_contains
-          value: DONE
-coordination:
-  barriers:
-    - name: reviews-complete
-      waitFor: [architecture-pass, correctness-pass, security-pass]
-      timeoutMs: 900000
-  consensusStrategy: majority
-state:
-  backend: memory
-  ttlMs: 21600000
-  namespace: code-review
-errorHandling:
-  strategy: fail-fast
-  notifyChannel: swarm-code-review
diff --git a/packages/sdk/src/workflows/builtin-templates/competitive.yaml b/packages/sdk/src/workflows/builtin-templates/competitive.yaml
deleted file mode 100644
index ab8c41583..000000000
--- a/packages/sdk/src/workflows/builtin-templates/competitive.yaml
+++ /dev/null
@@ -1,107 +0,0 @@
-version: '1.0'
-name: competitive
-description: 'Multiple agents independently implement solutions, then compare and select the best approach.'
-swarm:
-  pattern: competitive
-  maxConcurrency: 4
-  timeoutMs: 5400000
-  channel: swarm-competitive
-agents:
-  - name: lead
-    cli: claude
-    role: 'Defines spec, judges implementations, and selects winner'
-    permissions: { access: readwrite }
-  - name: team-alpha
-    cli: claude
-    role: 'Independent implementation team A'
-    permissions: { access: readwrite }
-  - name: team-beta
-    cli: codex
-    role: 'Independent implementation team B'
-    permissions: { access: readwrite }
-  - name: team-gamma
-    cli: gemini
-    role: 'Independent implementation team C'
-    permissions: { access: readwrite }
-workflows:
-  - name: competitive-build
-    description: 'Independent parallel implementations followed by comparison and selection.'
-    onError: fail
-    steps:
-      - name: define-spec
-        agent: lead
-        task: |
-          Define clear requirements, acceptance criteria, and evaluation rubric:
-          {{task}}
-        verification:
-          type: output_contains
-          value: SPEC_COMPLETE
-      - name: implement-alpha
-        agent: team-alpha
-        dependsOn: [define-spec]
-        task: |
-          Implement solution independently based on spec:
-          {{steps.define-spec.output}}
-
-          Do not coordinate with other teams. Focus on your best approach.
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-      - name: implement-beta
-        agent: team-beta
-        dependsOn: [define-spec]
-        task: |
-          Implement solution independently based on spec:
-          {{steps.define-spec.output}}
-
-          Do not coordinate with other teams. Focus on your best approach.
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-      - name: implement-gamma
-        agent: team-gamma
-        dependsOn: [define-spec]
-        task: |
-          Implement solution independently based on spec:
-          {{steps.define-spec.output}}
-
-          Do not coordinate with other teams. Focus on your best approach.
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-      - name: compare-solutions
-        agent: lead
-        dependsOn: [implement-alpha, implement-beta, implement-gamma]
-        task: |
-          Compare all implementations against the evaluation rubric.
-
-          Team Alpha: {{steps.implement-alpha.output}}
-          Team Beta: {{steps.implement-beta.output}}
-          Team Gamma: {{steps.implement-gamma.output}}
-
-          Analyze trade-offs, strengths, and weaknesses of each approach.
-        verification:
-          type: output_contains
-          value: COMPARISON_COMPLETE
-      - name: select-winner
-        agent: lead
-        dependsOn: [compare-solutions]
-        task: |
-          Select the winning implementation or synthesize the best elements.
-          Provide rationale and integration plan.
-        verification:
-          type: output_contains
-          value: DONE
-coordination:
-  barriers:
-    - name: implementations-complete
-      waitFor: [implement-alpha, implement-beta, implement-gamma]
-      timeoutMs: 3600000
-  consensusStrategy: majority
-state:
-  backend: memory
-  ttlMs: 21600000
-  namespace: competitive
-errorHandling:
-  strategy: continue
-  notifyChannel: swarm-competitive
diff --git a/packages/sdk/src/workflows/builtin-templates/documentation.yaml b/packages/sdk/src/workflows/builtin-templates/documentation.yaml
deleted file mode 100644
index a67306a86..000000000
--- a/packages/sdk/src/workflows/builtin-templates/documentation.yaml
+++ /dev/null
@@ -1,128 +0,0 @@
-version: '1.0'
-name: documentation
-description: 'Blueprint-style documentation workflow with deterministic file operations.'
-swarm:
-  pattern: handoff
-  maxConcurrency: 1
-  timeoutMs: 3000000
-  channel: swarm-documentation
-  idleNudge:
-    nudgeAfterMs: 120000
-    escalateAfterMs: 120000
-    maxNudges: 1
-agents:
-  - name: lead
-    cli: claude
-    role: 'Owns final editorial sign-off'
-  - name: researcher
-    cli: codex
-    role: 'Collects technical context and source details'
-    interactive: false
-  - name: writer
-    cli: codex
-    role: 'Drafts user-facing documentation'
-    permissions:
-      access: readwrite
-      files:
-        write: ['docs/**', '*.md', 'web/content/**']
-    interactive: false
-  - name: editor
-    cli: claude
-    role: 'Edits for accuracy, clarity, and structure'
-    permissions:
-      access: readwrite
-      files:
-        write: ['docs/**', '*.md', 'web/content/**']
-workflows:
-  - name: docs-production
-    description: 'Gather context, draft docs, edit, and publish summary.'
-    onError: skip
-    preflight:
-      - command: git status --porcelain
-        failIf: non-empty
-        description: 'Ensure working directory is clean'
-    steps:
-      # Deterministic: List existing docs
-      - name: list-docs
-        type: deterministic
-        command: find . -name "*.md" -o -name "*.mdx" 2>/dev/null | head -50 || echo "No docs found"
-
-      # Agent: Gather context
-      - name: gather-context
-        type: agent
-        agent: researcher
-        dependsOn: [list-docs]
-        task: |
-          Collect source context and required updates:
-          {{task}}
-
-          Existing documentation files:
-          {{steps.list-docs.output}}
-        verification:
-          type: output_contains
-          value: CONTEXT_COMPLETE
-
-      # Deterministic: Create docs branch
-      - name: create-branch
-        type: deterministic
-        dependsOn: [gather-context]
-        command: git checkout -b docs/{{branch-name}}
-
-      # Agent: Draft documentation
-      - name: draft
-        type: agent
-        agent: writer
-        dependsOn: [create-branch]
-        task: |
-          Draft documentation updates based on gathered context:
-          {{steps.gather-context.output}}
-        verification:
-          type: output_contains
-          value: DRAFT_COMPLETE
-
-      # Agent: Edit draft
-      - name: edit
-        type: agent
-        agent: editor
-        dependsOn: [draft]
-        task: |
-          Edit the draft for technical accuracy and readability:
-          {{steps.draft.output}}
-        verification:
-          type: output_contains
-          value: EDIT_COMPLETE
-
-      # Deterministic: Commit docs
-      - name: commit
-        type: deterministic
-        dependsOn: [edit]
-        command: 'git add -A && git commit -m "docs: {{steps.gather-context.output | first-line}}"'
-
-      # Deterministic: Push
-      - name: push
-        type: deterministic
-        dependsOn: [commit]
-        command: git push origin docs/{{branch-name}}
-
-      # Agent: Publish summary
-      - name: publish-summary
-        type: agent
-        agent: lead
-        dependsOn: [push]
-        task: |
-          Publish a final summary of documentation changes and open items.
-        verification:
-          type: output_contains
-          value: DONE
-coordination:
-  barriers:
-    - name: docs-ready
-      waitFor: [gather-context, draft, edit]
-      timeoutMs: 600000
-state:
-  backend: memory
-  ttlMs: 259200000
-  namespace: documentation
-errorHandling:
-  strategy: continue
-  notifyChannel: swarm-documentation
diff --git a/packages/sdk/src/workflows/builtin-templates/feature-dev.yaml b/packages/sdk/src/workflows/builtin-templates/feature-dev.yaml
deleted file mode 100644
index 83d6dd72e..000000000
--- a/packages/sdk/src/workflows/builtin-templates/feature-dev.yaml
+++ /dev/null
@@ -1,146 +0,0 @@
-version: '1.0'
-name: feature-dev
-description: 'Blueprint-style feature development with deterministic quality gates.'
-swarm:
-  pattern: hub-spoke
-  maxConcurrency: 2
-  timeoutMs: 3600000
-  channel: swarm-feature-dev
-  idleNudge:
-    nudgeAfterMs: 120000
-    escalateAfterMs: 120000
-    maxNudges: 1
-agents:
-  - name: lead
-    cli: claude
-    role: 'Lead engineer coordinating delivery'
-    permissions: { access: full }
-  - name: planner
-    cli: codex
-    role: 'Plans implementation and acceptance criteria'
-    permissions: { access: readonly }
-    interactive: false
-  - name: developer
-    cli: codex
-    role: 'Implements planned changes'
-    permissions: { access: readwrite }
-    interactive: false
-  - name: reviewer
-    cli: claude
-    role: 'Reviews code quality and release risk'
-    permissions: { access: readonly }
-workflows:
-  - name: feature-delivery
-    description: 'Plan, implement, review, and finalize a feature request with quality gates.'
-    onError: retry
-    preflight:
-      - command: git status --porcelain
-        failIf: non-empty
-        description: 'Ensure working directory is clean'
-      - command: npm run type-check 2>/dev/null || echo "skip"
-        description: 'Run type checking if available'
-    steps:
-      # Agent: Planning
-      - name: plan
-        type: agent
-        agent: planner
-        task: |
-          Analyze the feature request and produce a concrete implementation plan:
-          {{task}}
-        retries: 1
-        verification:
-          type: output_contains
-          value: PLAN_COMPLETE
-
-      # Deterministic: Create feature branch
-      - name: create-branch
-        type: deterministic
-        dependsOn: [plan]
-        command: git checkout -b feature/{{branch-name}}
-
-      # Agent: Implementation
-      - name: implement
-        type: agent
-        agent: developer
-        dependsOn: [create-branch]
-        task: |
-          Implement the approved plan:
-          {{steps.plan.output}}
-        retries: 1
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-
-      # Deterministic: Lint
-      - name: lint
-        type: deterministic
-        dependsOn: [implement]
-        command: npm run lint:fix 2>/dev/null || npm run lint 2>/dev/null || echo "No lint configured"
-
-      # Deterministic: Run tests
-      - name: test
-        type: deterministic
-        dependsOn: [lint]
-        command: npm test 2>/dev/null || echo "No tests configured"
-
-      # Agent: Fix any failures (with iteration limit)
-      - name: fix-failures
-        type: agent
-        agent: developer
-        dependsOn: [test]
-        task: |
-          Review test results and fix any failures. If all tests passed, output TESTS_PASSED.
-          Test output: {{steps.test.output}}
-        maxIterations: 2
-        verification:
-          type: output_contains
-          value: TESTS_PASSED
-
-      # Deterministic: Stage and commit
-      - name: commit
-        type: deterministic
-        dependsOn: [fix-failures]
-        command: 'git add -A && git commit -m "feat: {{steps.plan.output | first-line}}"'
-
-      # Agent: Code review
-      - name: review
-        type: agent
-        agent: reviewer
-        dependsOn: [commit]
-        task: |
-          Review implementation quality, correctness, and test coverage:
-          {{steps.implement.output}}
-        verification:
-          type: output_contains
-          value: REVIEW_COMPLETE
-
-      # Deterministic: Push to remote
-      - name: push
-        type: deterministic
-        dependsOn: [review]
-        command: git push origin feature/{{branch-name}}
-
-      # Agent: Finalize
-      - name: finalize
-        type: agent
-        agent: lead
-        dependsOn: [push]
-        task: |
-          Summarize decisions and ship readiness for the feature.
-        verification:
-          type: output_contains
-          value: DONE
-coordination:
-  barriers:
-    - name: delivery-ready
-      waitFor: [plan, implement, review]
-      timeoutMs: 900000
-state:
-  backend: memory
-  ttlMs: 86400000
-  namespace: feature-dev
-errorHandling:
-  strategy: retry
-  maxRetries: 2
-  retryDelayMs: 5000
-  notifyChannel: swarm-feature-dev
diff --git a/packages/sdk/src/workflows/builtin-templates/refactor.yaml b/packages/sdk/src/workflows/builtin-templates/refactor.yaml
deleted file mode 100644
index c7ca5e713..000000000
--- a/packages/sdk/src/workflows/builtin-templates/refactor.yaml
+++ /dev/null
@@ -1,145 +0,0 @@
-version: '1.0'
-name: refactor
-description: 'Blueprint-style refactor workflow with deterministic quality gates.'
-swarm:
-  pattern: hierarchical
-  maxConcurrency: 2
-  timeoutMs: 4500000
-  channel: swarm-refactor
-  idleNudge:
-    nudgeAfterMs: 120000
-    escalateAfterMs: 120000
-    maxNudges: 1
-agents:
-  - name: lead
-    cli: claude
-    role: 'Owns scope, sequencing, and acceptance'
-    permissions: { access: full }
-  - name: architect
-    cli: codex
-    role: 'Designs target architecture and migration plan'
-    permissions: { access: readwrite }
-    interactive: false
-  - name: refactorer
-    cli: codex
-    role: 'Executes scoped refactor changes'
-    permissions: { access: readwrite }
-    interactive: false
-  - name: tester
-    cli: claude
-    role: 'Validates behavior parity and risk'
-    permissions: { access: readonly }
-workflows:
-  - name: refactor-execution
-    description: 'Analyze current system, design approach, refactor, and validate.'
-    onError: retry
-    preflight:
-      - command: git status --porcelain
-        failIf: non-empty
-        description: 'Ensure working directory is clean'
-      - command: npm test 2>/dev/null || echo "baseline"
-        description: 'Capture baseline test results'
-    steps:
-      # Agent: Analyze current design
-      - name: analyze
-        type: agent
-        agent: architect
-        task: |
-          Analyze current design and identify refactor opportunities:
-          {{task}}
-        verification:
-          type: output_contains
-          value: ANALYSIS_COMPLETE
-
-      # Agent: Design refactor plan
-      - name: design
-        type: agent
-        agent: architect
-        dependsOn: [analyze]
-        task: |
-          Provide incremental refactor plan with rollback notes:
-          {{steps.analyze.output}}
-        verification:
-          type: output_contains
-          value: PLAN_COMPLETE
-
-      # Deterministic: Create refactor branch
-      - name: create-branch
-        type: deterministic
-        dependsOn: [design]
-        command: git checkout -b refactor/{{branch-name}}
-
-      # Agent: Execute refactor
-      - name: refactor-code
-        type: agent
-        agent: refactorer
-        dependsOn: [create-branch]
-        task: |
-          Execute the refactor plan while preserving behavior:
-          {{steps.design.output}}
-        retries: 2
-        verification:
-          type: output_contains
-          value: REFACTOR_COMPLETE
-
-      # Deterministic: Run linting
-      - name: lint
-        type: deterministic
-        dependsOn: [refactor-code]
-        command: npm run lint:fix 2>/dev/null || npm run lint 2>/dev/null || echo "No lint configured"
-
-      # Deterministic: Run tests
-      - name: test
-        type: deterministic
-        dependsOn: [lint]
-        command: npm test
-
-      # Agent: Validate behavior parity
-      - name: validate
-        type: agent
-        agent: tester
-        dependsOn: [test]
-        task: |
-          Validate no regressions and ensure tests/quality checks pass:
-          {{steps.refactor-code.output}}
-          Test results: {{steps.test.output}}
-        verification:
-          type: output_contains
-          value: VALIDATION_COMPLETE
-
-      # Deterministic: Commit
-      - name: commit
-        type: deterministic
-        dependsOn: [validate]
-        command: 'git add -A && git commit -m "refactor: {{steps.design.output | first-line}}"'
-
-      # Deterministic: Push
-      - name: push
-        type: deterministic
-        dependsOn: [commit]
-        command: git push origin refactor/{{branch-name}}
-
-      # Agent: Handoff
-      - name: handoff
-        type: agent
-        agent: lead
-        dependsOn: [push]
-        task: |
-          Produce final refactor summary and open follow-up items.
-        verification:
-          type: output_contains
-          value: DONE
-coordination:
-  barriers:
-    - name: refactor-ready
-      waitFor: [analyze, design, refactor-code, validate]
-      timeoutMs: 900000
-state:
-  backend: memory
-  ttlMs: 604800000
-  namespace: refactor
-errorHandling:
-  strategy: retry
-  maxRetries: 2
-  retryDelayMs: 5000
-  notifyChannel: swarm-refactor
diff --git a/packages/sdk/src/workflows/builtin-templates/review-loop.yaml b/packages/sdk/src/workflows/builtin-templates/review-loop.yaml
deleted file mode 100644
index 6a8ef35ef..000000000
--- a/packages/sdk/src/workflows/builtin-templates/review-loop.yaml
+++ /dev/null
@@ -1,227 +0,0 @@
-version: '1.0'
-name: review-loop
-description: 'Implement a task with automated multi-perspective code review loop. Inspired by claude-review-loop pattern.'
-swarm:
-  pattern: review-loop
-  maxConcurrency: 4
-  timeoutMs: 3600000
-  channel: swarm-review-loop
-  idleNudge:
-    nudgeAfterMs: 180000
-    escalateAfterMs: 180000
-    maxNudges: 2
-agents:
-  - name: implementer
-    cli: claude
-    role: 'Senior developer implementing the task and addressing review feedback'
-    permissions: { access: full }
-  - name: reviewer-diff
-    cli: codex
-    role: 'Code quality reviewer focusing on git diff, tests, and potential bugs'
-    permissions: { access: readonly }
-    interactive: false
-  - name: reviewer-architecture
-    cli: claude
-    role: 'Architecture and design reviewer assessing structure and maintainability'
-    permissions: { access: readonly }
-    interactive: false
-  - name: reviewer-security
-    cli: codex
-    role: 'Security reviewer checking for OWASP Top 10 vulnerabilities'
-    permissions: { access: readonly }
-    interactive: false
-workflows:
-  - name: review-loop-workflow
-    description: 'Implement task, run parallel reviews, consolidate feedback, and address issues.'
-    onError: fail
-    steps:
-      # Phase 1: Implementation
-      - name: implement
-        type: agent
-        agent: implementer
-        task: |
-          Implement the following task:
-          {{task}}
-
-          When complete, output: IMPLEMENTATION COMPLETE
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION COMPLETE
-
-      # Deterministic: Capture diff for review
-      - name: capture-diff
-        type: deterministic
-        dependsOn: [implement]
-        command: git diff HEAD~1 2>/dev/null || git diff 2>/dev/null || echo "No changes"
-        captureOutput: true
-
-      # Deterministic: Capture file list
-      - name: capture-files
-        type: deterministic
-        dependsOn: [capture-diff]
-        command: git diff --name-only HEAD~1 2>/dev/null || git diff --name-only 2>/dev/null || echo "No files"
-        captureOutput: true
-
-      # Phase 2: Parallel Reviews (fan-out)
-      - name: review-diff
-        type: agent
-        agent: reviewer-diff
-        dependsOn: [capture-files]
-        task: |
-          Review the git diff for code quality issues:
-
-          Focus areas:
-          - Code readability and clarity
-          - Test coverage (are new features tested?)
-          - Potential bugs or edge cases
-          - Error handling completeness
-
-          Changed files: {{steps.capture-files.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-
-          Output format:
-          - If all looks good: REVIEW:PASS
-          - If issues found: REVIEW:ISSUES followed by numbered list of issues
-        verification:
-          type: output_contains
-          value: 'REVIEW:'
-
-      - name: review-architecture
-        type: agent
-        agent: reviewer-architecture
-        dependsOn: [capture-files]
-        task: |
-          Review the architecture and design:
-
-          Focus areas:
-          - Design patterns and best practices
-          - Separation of concerns
-          - Code organization and maintainability
-          - API design (if applicable)
-
-          Changed files: {{steps.capture-files.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-
-          Output format:
-          - If all looks good: REVIEW:PASS
-          - If issues found: REVIEW:ISSUES followed by numbered list of issues
-        verification:
-          type: output_contains
-          value: 'REVIEW:'
-
-      - name: review-security
-        type: agent
-        agent: reviewer-security
-        dependsOn: [capture-files]
-        task: |
-          Security review for OWASP Top 10 vulnerabilities:
-
-          Focus areas:
-          - Injection vulnerabilities (SQL, command, XSS)
-          - Authentication and authorization issues
-          - Sensitive data exposure
-          - Security misconfiguration
-          - Input validation
-
-          Changed files: {{steps.capture-files.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-
-          Output format:
-          - If secure: REVIEW:PASS
-          - If vulnerabilities found: REVIEW:ISSUES followed by numbered list with severity
-        verification:
-          type: output_contains
-          value: 'REVIEW:'
-
-      # Phase 3: Consolidate reviews
-      - name: consolidate
-        type: agent
-        agent: implementer
-        dependsOn: [review-diff, review-architecture, review-security]
-        task: |
-          Review all feedback from the code reviewers and consolidate findings:
-
-          ## Diff Review
-          {{steps.review-diff.output}}
-
-          ## Architecture Review
-          {{steps.review-architecture.output}}
-
-          ## Security Review
-          {{steps.review-security.output}}
-
-          Tasks:
-          1. Analyze each review's findings
-          2. Identify which issues are valid and should be addressed
-          3. Note any conflicting feedback
-          4. Create a prioritized action plan
-
-          Output: CONSOLIDATED with summary of issues to address (or NO_ISSUES if all reviews passed)
-        verification:
-          type: output_contains
-          value: CONSOLIDATED
-
-      # Phase 4: Address feedback (the loop)
-      - name: address-feedback
-        type: agent
-        agent: implementer
-        dependsOn: [consolidate]
-        task: |
-          Address the consolidated review feedback:
-
-          {{steps.consolidate.output}}
-
-          For each valid issue:
-          1. Make the necessary code changes
-          2. Explain what was fixed and why
-
-          If there were no issues to address, confirm the implementation is complete.
-
-          Output: ADDRESSED followed by summary of changes made (or NO_CHANGES_NEEDED)
-        verification:
-          type: output_contains
-          value: ADDRESSED
-        retries: 2
-        maxIterations: 3
-
-      # Final step: Completion summary
-      - name: complete
-        type: agent
-        agent: implementer
-        dependsOn: [address-feedback]
-        task: |
-          Provide a final summary of the completed work:
-
-          Original task: {{task}}
-
-          Include:
-          1. What was implemented
-          2. Key decisions made
-          3. Review feedback that was addressed
-          4. Any remaining considerations or follow-up items
-
-          Output: DONE
-        verification:
-          type: output_contains
-          value: DONE
-
-coordination:
-  barriers:
-    - name: reviews-complete
-      waitFor: [review-diff, review-architecture, review-security]
-      timeoutMs: 900000
-  consensusStrategy: majority
-state:
-  backend: memory
-  ttlMs: 21600000
-  namespace: review-loop
-errorHandling:
-  strategy: continue
-  maxRetries: 2
-  notifyChannel: swarm-review-loop
diff --git a/packages/sdk/src/workflows/builtin-templates/security-audit.yaml b/packages/sdk/src/workflows/builtin-templates/security-audit.yaml
deleted file mode 100644
index 4c2acd226..000000000
--- a/packages/sdk/src/workflows/builtin-templates/security-audit.yaml
+++ /dev/null
@@ -1,139 +0,0 @@
-version: '1.0'
-name: security-audit
-description: 'Blueprint-style security assessment with deterministic scanning and agent triage.'
-swarm:
-  pattern: pipeline
-  maxConcurrency: 1
-  timeoutMs: 5400000
-  channel: swarm-security-audit
-  idleNudge:
-    nudgeAfterMs: 120000
-    escalateAfterMs: 120000
-    maxNudges: 1
-agents:
-  - name: lead
-    cli: claude
-    role: 'Owns final risk sign-off and recommendations'
-    permissions: { access: full }
-  - name: analyst
-    cli: claude
-    role: 'Prioritizes findings and recommends mitigations'
-    permissions:
-      access: readonly
-      files:
-        deny: ['.env', 'secrets/**', '*.pem', '*.key']
-  - name: remediator
-    cli: codex
-    role: 'Implements approved remediations'
-    permissions: { access: readwrite }
-    interactive: false
-  - name: verifier
-    cli: gemini
-    role: 'Verifies fixes and residual exposure'
-    permissions:
-      access: readonly
-      files:
-        deny: ['.env', 'secrets/**', '*.pem', '*.key']
-workflows:
-  - name: audit-pipeline
-    description: 'Scan, triage, remediate, verify, and report security posture.'
-    onError: fail
-    preflight:
-      - command: npm audit --json 2>/dev/null | head -100 || echo "{}"
-        description: 'Run npm audit preflight check'
-      - command: git diff --check 2>/dev/null || echo "clean"
-        description: 'Check for whitespace errors'
-    steps:
-      # Deterministic: Run npm audit
-      - name: scan-npm
-        type: deterministic
-        command: npm audit --json 2>/dev/null || echo '{"vulnerabilities":{}}'
-        captureOutput: true
-
-      # Deterministic: Run additional security scans if available
-      - name: scan-extra
-        type: deterministic
-        dependsOn: [scan-npm]
-        command: |
-          if command -v semgrep &> /dev/null; then
-            semgrep --config auto --json . 2>/dev/null || echo '{"results":[]}'
-          else
-            echo '{"results":[],"note":"semgrep not installed"}'
-          fi
-
-      # Agent: Triage findings
-      - name: triage
-        type: agent
-        agent: analyst
-        dependsOn: [scan-npm, scan-extra]
-        task: |
-          Prioritize security findings by severity and exploitability:
-
-          NPM Audit: {{steps.scan-npm.output}}
-          Additional Scans: {{steps.scan-extra.output}}
-
-          Task context: {{task}}
-        verification:
-          type: output_contains
-          value: TRIAGE_COMPLETE
-
-      # Agent: Implement remediations
-      - name: remediate
-        type: agent
-        agent: remediator
-        dependsOn: [triage]
-        task: |
-          Implement mitigations for approved findings:
-          {{steps.triage.output}}
-        retries: 1
-        verification:
-          type: output_contains
-          value: REMEDIATION_COMPLETE
-
-      # Deterministic: Re-run tests
-      - name: test
-        type: deterministic
-        dependsOn: [remediate]
-        command: npm test 2>/dev/null || echo "No tests configured"
-
-      # Agent: Verify fixes
-      - name: verify
-        type: agent
-        agent: verifier
-        dependsOn: [test]
-        task: |
-          Re-test security posture and confirm mitigations hold:
-          {{steps.remediate.output}}
-          Test results: {{steps.test.output}}
-        verification:
-          type: output_contains
-          value: VERIFICATION_COMPLETE
-
-      # Deterministic: Commit security fixes
-      - name: commit
-        type: deterministic
-        dependsOn: [verify]
-        command: 'git add -A && git commit -m "security: address vulnerabilities from audit" 2>/dev/null || echo "No changes to commit"'
-
-      # Agent: Final report
-      - name: report
-        type: agent
-        agent: lead
-        dependsOn: [commit]
-        task: |
-          Produce final audit report with residual risk and next actions.
-        verification:
-          type: output_contains
-          value: DONE
-coordination:
-  barriers:
-    - name: audit-complete
-      waitFor: [scan-npm, triage, remediate, verify]
-      timeoutMs: 1200000
-state:
-  backend: memory
-  ttlMs: 86400000
-  namespace: security-audit
-errorHandling:
-  strategy: fail-fast
-  notifyChannel: swarm-security-audit
diff --git a/packages/sdk/src/workflows/channel-messenger.ts b/packages/sdk/src/workflows/channel-messenger.ts
deleted file mode 100644
index d5a9a14f3..000000000
--- a/packages/sdk/src/workflows/channel-messenger.ts
+++ /dev/null
@@ -1,335 +0,0 @@
-import { stripAnsi as stripAnsiFn } from '../pty.js';
-import type { StepOutcome } from './trajectory.js';
-import type { AgentDefinition, WorkflowStepRow } from './types.js';
-
-type StepStateLike = {
-  row: Pick<WorkflowStepRow, 'agentName' | 'status'>;
-};
-
-export interface ChannelRelayLike {
-  send(to: string, text: string): Promise<unknown>;
-}
-
-export interface ChannelMessengerOptions {
-  postFn?: (text: string) => void;
-}
-
-export async function sendToChannel(
-  relay: ChannelRelayLike,
-  channel: string,
-  message: string
-): Promise<void> {
-  await relay.send(channel, message);
-}
-
-export function truncateMessage(message: string, maxLength: number): string {
-  if (maxLength <= 0) return '';
-  return message.length > maxLength ? message.slice(-maxLength) : message;
-}
-
-export function formatStepOutput(stepName: string, output: string, maxLength = 2000): string {
-  const scrubbed = scrubForChannel(output);
-  if (scrubbed.length === 0) {
-    return `**[${stepName}]** Step completed — output written to disk`;
-  }
-
-  const preview = truncateMessage(scrubbed, maxLength);
-  return `**[${stepName}] Output:**\n\`\`\`\n${preview}\n\`\`\``;
-}
-
-export function formatError(stepName: string, error: unknown): string {
-  const raw = error instanceof Error ? error.message : String(error);
-  // Strip absolute paths that could leak internal directory structure
-  const message = raw.replace(/(?:\/[\w.-]+){3,}/g, '[path]');
-  return `**[${stepName}]** Failed: ${message}`;
-}
-
-// Common secret patterns to redact from channel output.
-const SECRET_PATTERNS = [
-  /(?:api[_-]?key|apikey|secret[_-]?key|access[_-]?token|auth[_-]?token|bearer)\s*[:=]\s*\S+/gi,
-  /(?:sk|pk|rk|ak)[-_][a-zA-Z0-9]{20,}/g,
-  /ghp_[a-zA-Z0-9]{36,}/g,
-  /gho_[a-zA-Z0-9]{36,}/g,
-  /github_pat_[a-zA-Z0-9_]{22,}/g,
-  /xox[bpors]-[a-zA-Z0-9-]+/g,
-  /-----BEGIN\s+(?:RSA\s+)?PRIVATE\s+KEY-----[\s\S]*?-----END/g,
-];
-
-// Unicode spinner / ornament characters used by Claude TUI animations.
-// Includes block-element chars (▗▖▘▝) used in the Claude Code header bar.
-const SPINNER =
-  '\\u2756\\u2738\\u2739\\u273a\\u273b\\u273c\\u273d\\u2731\\u2732\\u2733\\u2734\\u2735\\u2736\\u2737\\u2743\\u2745\\u2746\\u25d6\\u25d7\\u25d8\\u25d9\\u2022\\u25cf\\u25cb\\u25a0\\u25a1\\u25b6\\u25c0\\u23f5\\u23f6\\u23f7\\u23f8\\u23f9\\u25e2\\u25e3\\u25e4\\u25e5\\u2597\\u2596\\u2598\\u259d\\u2bc8\\u2bc7\\u2bc5\\u2bc6\\u00b7' +
-  '\\u2590\\u258c\\u2588\\u2584\\u2580\\u259a\\u259e' +
-  '\\u2b21\\u2b22';
-
-// Pre-compiled regex constants — hoisted to module level to avoid recompilation per call.
-const SPINNER_RE = new RegExp(`[${SPINNER}]`, 'gu');
-const SPINNER_CLASS_RE = new RegExp(`^[\\s${SPINNER}]*$`, 'u');
-const BOX_DRAWING_ONLY_RE = /^[\s\u2500-\u257f\u2580-\u259f\u25a0-\u25ff\-_=~]{3,}$/u;
-const BROKER_LOG_RE = /^\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}\.\d+Z\s+(?:INFO|WARN|ERROR|DEBUG)\s/u;
-const CLAUDE_HEADER_RE =
-  /^(?:[\s\u2580-\u259f✢*·▗▖▘▝]+\s*)?(?:Claude\s+Code(?:\s+v?[\d.]+)?|(?:Sonnet|Haiku|Opus)\s*[\d.]+|claude-(?:sonnet|haiku|opus)-[\w.-]+|Running\s+on\s+claude)/iu;
-const DIR_BREADCRUMB_RE = /^\s*~[\\/]/u;
-const UI_HINT_RE =
-  /\b(?:Press\s*up\s*to\s*edit|tab\s*to\s*queue|bypass\s*permissions|esc\s*to\s*interrupt|paste\s*again\s*to\s*expand|shift\s*[+]?\s*tab\s*to\s*cycle|running\s+stop\s+hook|fan\s+out\s+subagents)/iu;
-const VIM_MODE_RE =
-  /^[-\s]*--?(?:INSERT|NORMAL|VISUAL|REPLACE)--?[-\s]*$|--?(?:INSERT|NORMAL|VISUAL|REPLACE)--/u;
-const CLAUDE_FOOTER_RE =
-  /(?:Opus|Sonnet|Haiku)\s*\d[\d.]*\s*\(?(?:1M\s*context|context)?\)?\s*ctx\s*:\s*\d+%/iu;
-const THINKING_LINE_RE = new RegExp(`^[\\s${SPINNER}]*\\s*\\w[\\w\\s]*\\u2026\\s*$`, 'u');
-const THINKING_STATUS_RE =
-  /\b(?:thinking\s+(?:with\s+\w+\s+effort|more\s+with|harder)|↓\s*\d+\s*tokens?\b|↑\s*\d+\s*tokens?\b|crunched\s+for\s+\d|sautéed\s+for\s+\d|befuddl|flibbertigib|gitifying|flowing\s*…)/iu;
-const CURSOR_ONLY_RE = /^[\s❯⎿›»◀▶←→↑↓⟨⟩⟪⟫·]+$/u;
-const CURSOR_AGENT_RE =
-  /^(?:Cursor Agent|[\s⬡⬢]*Generating[.\s]|\[Pasted text|Auto-run all|Add a follow-up|ctrl\+c to stop|shift\+tab|Auto$|\/\s*commands|@\s*files|!\s*shell|follow-ups?\s|The user ha)/iu;
-const SLASH_COMMAND_RE = /^\/\w+\s*$/u;
-const MCP_JSON_KV_RE =
-  /^\s*"(?:type|method|params|result|id|jsonrpc|tool|name|arguments|content|role|metadata)"\s*:/u;
-const MEANINGFUL_CONTENT_RE = /[a-zA-Z0-9]/u;
-const MALFORMED_PTY_FRAME_RUN_RE = /(?:(?:qW0|q[A-Za-z]?0|[lmjkx]q{2,}|q{2,}[lmjkx]?)[\s|/_=\-~]*){4,}/giu;
-const MALFORMED_PTY_FRAME_ONLY_RE = /^[\s|/_=\-~lmjkxqtwuvn0W]{12,}$/iu;
-
-export function scrubSecrets(text: string): string {
-  let result = text;
-  for (const pattern of SECRET_PATTERNS) {
-    result = result.replace(pattern, '[REDACTED]');
-  }
-  return result;
-}
-
-function stripMalformedPtyFrameGarbage(line: string): string {
-  const strippedRuns = line.replace(MALFORMED_PTY_FRAME_RUN_RE, ' ');
-  const compact = strippedRuns.replace(SPINNER_RE, '').replace(/\s+/g, '');
-  if (compact.length >= 12 && MALFORMED_PTY_FRAME_ONLY_RE.test(compact)) {
-    return '';
-  }
-  return strippedRuns;
-}
-
-export function scrubForChannel(text: string): string {
-  // Strip system-reminder blocks (closed or unclosed) iteratively to avoid
-  // polynomial backtracking (ReDoS) with [\s\S]*? on adversarial input.
-  let withoutSystemReminders = text;
-  const openTag = '<system-reminder>';
-  const closeTag = '</system-reminder>';
-  let idx: number;
-  while ((idx = withoutSystemReminders.toLowerCase().indexOf(openTag)) !== -1) {
-    const closeIdx = withoutSystemReminders.toLowerCase().indexOf(closeTag, idx + openTag.length);
-    if (closeIdx !== -1) {
-      withoutSystemReminders =
-        withoutSystemReminders.slice(0, idx) + withoutSystemReminders.slice(closeIdx + closeTag.length);
-    } else {
-      // Unclosed tag — strip everything from the opening tag onward
-      withoutSystemReminders = withoutSystemReminders.slice(0, idx);
-      break;
-    }
-  }
-
-  // Normalize CRLF and bare \r before stripping ANSI — PTY output often
-  // contains \r\r\n which leaves stray \r after stripping that confuse line splitting.
-  const normalized = withoutSystemReminders.replace(/\r\n/g, '\n').replace(/\r/g, '\n');
-  const ansiStripped = stripAnsiFn(normalized);
-
-  // Redact secrets before further processing
-  const secretsRedacted = scrubSecrets(ansiStripped);
-
-  const countJsonDepth = (line: string): number => {
-    let depth = 0;
-    for (const ch of line) {
-      if (ch === '{' || ch === '[') depth += 1;
-      if (ch === '}' || ch === ']') depth -= 1;
-    }
-    return depth;
-  };
-
-  const lines = secretsRedacted.split('\n');
-  const meaningful: string[] = [];
-  let jsonDepth = 0;
-
-  for (const line of lines) {
-    const cleanedLine = stripMalformedPtyFrameGarbage(line);
-    const trimmed = cleanedLine.trim();
-
-    if (jsonDepth > 0) {
-      jsonDepth += countJsonDepth(cleanedLine);
-      if (jsonDepth <= 0) jsonDepth = 0;
-      continue;
-    }
-
-    if (trimmed.length === 0) continue;
-
-    if (trimmed.startsWith('{') || /^\[\s*\{/.test(trimmed)) {
-      jsonDepth = Math.max(countJsonDepth(cleanedLine), 0);
-      continue;
-    }
-
-    if (MCP_JSON_KV_RE.test(cleanedLine)) continue;
-    if (SPINNER_CLASS_RE.test(trimmed)) continue;
-    if (BOX_DRAWING_ONLY_RE.test(trimmed)) continue;
-    if (BROKER_LOG_RE.test(trimmed)) continue;
-    if (CLAUDE_HEADER_RE.test(trimmed)) continue;
-    if (DIR_BREADCRUMB_RE.test(trimmed)) continue;
-    if (UI_HINT_RE.test(trimmed)) continue;
-    if (VIM_MODE_RE.test(trimmed)) continue;
-    if (CLAUDE_FOOTER_RE.test(trimmed)) continue;
-    if (THINKING_LINE_RE.test(trimmed)) continue;
-    if (THINKING_STATUS_RE.test(trimmed)) continue;
-    if (CURSOR_ONLY_RE.test(trimmed)) continue;
-    if (CURSOR_AGENT_RE.test(trimmed)) continue;
-    if (SLASH_COMMAND_RE.test(trimmed)) continue;
-    if (!MEANINGFUL_CONTENT_RE.test(trimmed)) continue;
-
-    const alphanum = trimmed.replace(SPINNER_RE, '').replace(/\s+/g, '');
-    if (alphanum.replace(/[^a-zA-Z0-9]/g, '').length <= 3) continue;
-
-    meaningful.push(cleanedLine);
-  }
-
-  return meaningful
-    .join('\n')
-    .replace(/\n{3,}/g, '\n\n')
-    .trim();
-}
-
-export class ChannelMessenger {
-  private readonly postFn?: (text: string) => void;
-
-  constructor(options: ChannelMessengerOptions = {}) {
-    this.postFn = options.postFn;
-  }
-
-  buildNonInteractiveAwareness(
-    agentMap: Map<string, AgentDefinition>,
-    stepStates: Map<string, StepStateLike>
-  ): string | undefined {
-    const nonInteractive = [...agentMap.values()].filter((agent) => agent.interactive === false);
-    if (nonInteractive.length === 0) return undefined;
-
-    const agentToSteps = new Map<string, string[]>();
-    for (const [stepName, state] of stepStates) {
-      const agentName = state.row.agentName;
-      if (!agentName) continue;
-      if (!agentToSteps.has(agentName)) agentToSteps.set(agentName, []);
-      agentToSteps.get(agentName)!.push(stepName);
-    }
-
-    const lines = nonInteractive.map((agent) => {
-      const stepRefs = (agentToSteps.get(agent.name) ?? []).map((stepName) => `{{steps.${stepName}.output}}`);
-      return (
-        `- ${agent.name} (${agent.cli}) — will return output when complete` +
-        (stepRefs.length > 0 ? `. Access via: ${stepRefs.join(', ')}` : '')
-      );
-    });
-
-    return (
-      '\n\n---\n' +
-      'Note: The following agents are non-interactive workers and cannot receive messages:\n' +
-      lines.join('\n') +
-      '\n' +
-      'Do NOT attempt to message these agents. Use the {{steps.<name>.output}} references above to access their results.'
-    );
-  }
-
-  buildRelayRegistrationNote(cli: string, agentName: string): string {
-    if (cli === 'claude') return '';
-    return (
-      '---\n' +
-      'RELAY SETUP — do this FIRST before any other relay tool:\n' +
-      `1. Call: register_agent(name="${agentName}")\n` +
-      '   This authenticates you in the Relaycast workspace.\n' +
-      '   ALL relay tools (mcp__relaycast__send_dm, mcp__relaycast__check_inbox, mcp__relaycast__post_message, etc.) require\n' +
-      '   registration first — they will fail with "Not registered" otherwise.\n' +
-      `2. Your agent name is "${agentName}" — use this exact name when registering.`
-    );
-  }
-
-  buildDelegationGuidance(cli: string, timeoutMs?: number): string {
-    const timeoutNote = timeoutMs
-      ? `You have approximately ${Math.round(timeoutMs / 60000)} minutes before this step times out. ` +
-        'Plan accordingly — delegate early if the work is substantial.\n\n'
-      : '';
-    const subAgentOption =
-      cli === 'claude'
-        ? 'Option 2 — Use built-in sub-agents (Task tool) for research or scoped work:\n' +
-          '  - Good for exploring code, reading files, or making targeted changes\n' +
-          '  - Can run multiple sub-agents in parallel\n\n'
-        : '';
-
-    return (
-      '---\n' +
-      'AUTONOMOUS DELEGATION — READ THIS BEFORE STARTING:\n' +
-      timeoutNote +
-      'Before diving in, assess whether this task is too large or complex for a single agent. ' +
-      'If it involves multiple independent subtasks, touches many files, or could take a long time, ' +
-      'you should break it down and delegate to helper agents to avoid timeouts.\n\n' +
-      'Option 1 — Spawn relay agents (for real parallel coding work):\n' +
-      '  - mcp__relaycast__add_agent(name="helper-1", cli="claude", task="Specific subtask description")\n' +
-      '  - Coordinate via mcp__relaycast__send_dm(to="helper-1", text="...")\n' +
-      '  - Check on them with mcp__relaycast__check_inbox()\n' +
-      '  - Clean up when done: mcp__relaycast__remove_agent(name="helper-1")\n\n' +
-      subAgentOption +
-      'Guidelines:\n' +
-      '- You are the lead — delegate but stay in control, track progress, integrate results\n' +
-      '- Give each helper a clear, self-contained task with enough context to work independently\n' +
-      "- For simple or quick work, just do it yourself — don't over-delegate\n" +
-      '- Always release spawned relay agents when their work is complete\n' +
-      '- When spawning non-claude agents (codex, gemini, etc.), prepend to their task:\n' +
-      '  "RELAY SETUP: First call register_agent(name=\'<exact-agent-name>\') before any other relay tool."'
-    );
-  }
-
-  postCompletionReport(
-    workflowName: string,
-    outcomes: StepOutcome[],
-    summary: string,
-    confidence: number
-  ): void {
-    const completed = outcomes.filter((outcome) => outcome.status === 'completed');
-    const skipped = outcomes.filter((outcome) => outcome.status === 'skipped');
-    const retried = outcomes.filter((outcome) => outcome.attempts > 1);
-
-    const lines: string[] = [
-      `## Workflow **${workflowName}** — Complete`,
-      '',
-      summary,
-      `Confidence: ${Math.round(confidence * 100)}%`,
-      '',
-      '### Steps',
-      ...completed.map(
-        (outcome) =>
-          `- **${outcome.name}** (${outcome.agent}) — passed${outcome.verificationPassed ? ' (verified)' : ''}${outcome.attempts > 1 ? ` after ${outcome.attempts} attempts` : ''}`
-      ),
-      ...skipped.map((outcome) => `- **${outcome.name}** — skipped`),
-    ];
-
-    if (retried.length > 0) {
-      lines.push('', '### Retries');
-      for (const outcome of retried) {
-        lines.push(`- ${outcome.name}: ${outcome.attempts} attempts`);
-      }
-    }
-
-    this.postFn?.(lines.join('\n'));
-  }
-
-  postFailureReport(workflowName: string, outcomes: StepOutcome[], errorMsg: string): void {
-    const completed = outcomes.filter((outcome) => outcome.status === 'completed');
-    const failed = outcomes.filter((outcome) => outcome.status === 'failed');
-    const skipped = outcomes.filter((outcome) => outcome.status === 'skipped');
-
-    const lines: string[] = [
-      `## Workflow **${workflowName}** — Failed`,
-      '',
-      `${completed.length}/${outcomes.length} steps passed. Error: ${errorMsg}`,
-      '',
-      '### Steps',
-      ...completed.map((outcome) => `- **${outcome.name}** (${outcome.agent}) — passed`),
-      ...failed.map(
-        (outcome) => `- **${outcome.name}** (${outcome.agent}) — FAILED: ${outcome.error ?? 'unknown'}`
-      ),
-      ...skipped.map((outcome) => `- **${outcome.name}** — skipped`),
-    ];
-
-    this.postFn?.(lines.join('\n'));
-  }
-}
diff --git a/packages/sdk/src/workflows/cli-session-collector.ts b/packages/sdk/src/workflows/cli-session-collector.ts
deleted file mode 100644
index 2e7deaf3f..000000000
--- a/packages/sdk/src/workflows/cli-session-collector.ts
+++ /dev/null
@@ -1,58 +0,0 @@
-import type { AgentCli } from './types.js';
-import { ClaudeCodeCollector } from './collectors/claude.js';
-import { CodexCollector } from './collectors/codex.js';
-import { OpenCodeCollector } from './collectors/opencode.js';
-
-export interface CliSessionReport {
-  cli: AgentCli;
-  sessionId: string | null;
-  model: string | null;
-  provider: string | null;
-  durationMs: number | null;
-  cost: number | null;
-  tokens: {
-    input: number;
-    output: number;
-    cacheRead: number;
-  } | null;
-  turns: number;
-  toolCalls: { name: string; count: number }[];
-  errors: { turn: number; text: string }[];
-  finalStatus: 'completed' | 'failed' | 'unknown';
-  summary: string | null;
-  raw?: object;
-}
-
-export interface CliSessionQuery {
-  cli: AgentCli;
-  cwd: string;
-  startedAt: number;
-  completedAt: number;
-}
-
-export interface CliSessionCollector {
-  canCollect(): boolean;
-  collect(query: CliSessionQuery): Promise<CliSessionReport | null>;
-}
-
-export function createCollector(cli: AgentCli): CliSessionCollector | null {
-  switch (cli) {
-    case 'opencode':
-      return new OpenCodeCollector();
-    case 'claude':
-      return new ClaudeCodeCollector();
-    case 'codex':
-      return new CodexCollector();
-    default:
-      return null;
-  }
-}
-
-export async function collectCliSession(query: CliSessionQuery): Promise<CliSessionReport | null> {
-  const collector = createCollector(query.cli);
-  if (!collector || !collector.canCollect()) {
-    return null;
-  }
-
-  return collector.collect(query);
-}
diff --git a/packages/sdk/src/workflows/cli.ts b/packages/sdk/src/workflows/cli.ts
deleted file mode 100644
index 3c2b550b0..000000000
--- a/packages/sdk/src/workflows/cli.ts
+++ /dev/null
@@ -1,481 +0,0 @@
-#!/usr/bin/env node
-
-/**
- * CLI entry point for running relay.yaml workflows.
- *
- * Usage:
- *   relay-workflow <yaml-path> [--workflow <name>]
- *   relay-workflow --resume <run-id>
- *   npx @agent-relay/sdk run <yaml-path> [--workflow <name>]
- */
-
-import path from 'node:path';
-import chalk from 'chalk';
-
-import type { WorkflowEvent } from './runner.js';
-import { WorkflowRunner } from './runner.js';
-import { JsonFileWorkflowDb } from './file-db.js';
-
-function printUsage(): void {
-  console.log(
-    `
-Usage: relay-workflow <yaml-path> [options]
-       relay-workflow --resume <run-id>
-
-Run a relay.yaml workflow file.
-
-Arguments:
-  <yaml-path>              Path to the relay.yaml workflow file
-
-Options:
-  --workflow <name>        Run a specific workflow by name (default: first)
-  --resume <run-id>        Resume a failed or interrupted run by its run ID
-  --start-from <step>      Start from a specific step, skipping predecessors
-  --previous-run-id <id>   Use cached outputs from a specific prior run (with --start-from)
-  --validate               Validate workflow YAML for common issues without running
-  --help                   Show this help message
-
-Examples:
-  relay-workflow workflows/daytona-migration.yaml
-  relay-workflow workflows/feature-dev.yaml --workflow build-and-test
-  relay-workflow --resume f409ce1d1788710bcc6abb55
-`.trim()
-  );
-}
-
-type RunnerConfig = Awaited<ReturnType<WorkflowRunner['parseYamlFile']>>;
-
-type RunnerResult = Awaited<ReturnType<WorkflowRunner['execute']>>;
-
-type ExecuteOptions = {
-  startFrom: string;
-  previousRunId?: string;
-};
-
-/** Flags that consume the next argument as their value. Single source of truth for CLI parsing. */
-const FLAGS_WITH_VALUES = new Set(['--resume', '--workflow', '--start-from', '--previous-run-id']);
-
-function getYamlPathArg(args: string[]): string | undefined {
-  for (let i = 0; i < args.length; i += 1) {
-    const arg = args[i];
-    if (arg.startsWith('--')) {
-      if (FLAGS_WITH_VALUES.has(arg)) i += 1;
-      continue;
-    }
-    return arg;
-  }
-  return undefined;
-}
-
-interface RenderableTask {
-  output?: string;
-  title: string;
-}
-
-interface StepHandle {
-  resolve: () => void;
-  reject: (error: Error) => void;
-  setOutput: (text: string) => void;
-  markSkipped: () => void;
-}
-
-// Filter [broker] and [workflow HH:MM] noise while listr owns the terminal,
-// but let the observer URL and channel name through.
-function installOutputFilter(): () => void {
-  const orig = console.log.bind(console);
-  console.log = (...args: unknown[]) => {
-    const str = String(args[0] ?? '');
-    if (str.includes('Observer:') || str.includes('agentrelay.com') || str.includes('Channel: wf-')) {
-      orig(...args);
-      return;
-    }
-    if (/\[broker\]/.test(str) || /\[workflow\s+\d{2}:\d{2}\]/.test(str)) return;
-    orig(...args);
-  };
-  return () => {
-    console.log = orig;
-  };
-}
-
-async function runWithListr(
-  runner: WorkflowRunner,
-  config: RunnerConfig,
-  workflowName: string | undefined,
-  executeOptions: ExecuteOptions | undefined
-): Promise<RunnerResult> {
-  const stepHandles = new Map<string, StepHandle>();
-  const restoreConsole = installOutputFilter();
-
-  let resolveWorkflow!: () => void;
-  let rejectWorkflow!: (error: Error) => void;
-  const workflowDone = new Promise<void>((resolve, reject) => {
-    resolveWorkflow = resolve;
-    rejectWorkflow = reject;
-  });
-  workflowDone.catch(() => {});
-
-  let setHeader: (text: string) => void = () => {};
-
-  const { Listr } = await import('listr2');
-  // eslint-disable-next-line @typescript-eslint/no-explicit-any
-  const listr = new (Listr as any)(
-    [
-      {
-        title: chalk.dim('Workflow starting...'),
-        task: async (_ctx: unknown, task: any): Promise<void> => {
-          setHeader = (text: string): void => {
-            task.title = text;
-          };
-          await workflowDone;
-        },
-      },
-    ],
-    {
-      concurrent: true,
-      renderer: process.stdout.isTTY ? 'default' : 'verbose',
-      rendererOptions: {
-        collapseErrors: false,
-        showErrorMessage: true,
-      },
-    }
-  );
-
-  runner.on((event: WorkflowEvent) => {
-    switch (event.type) {
-      case 'run:started': {
-        setHeader(chalk.dim(`[workflow] run ${event.runId.slice(0, 8)}...`));
-        break;
-      }
-
-      case 'step:started': {
-        let resolveStep!: () => void;
-        let rejectStep!: (error: Error) => void;
-        let taskRef: RenderableTask | null = null;
-        let skipped = false;
-
-        const done = new Promise<void>((resolve, reject) => {
-          resolveStep = resolve;
-          rejectStep = reject;
-        });
-        done.catch(() => {});
-
-        stepHandles.set(event.stepName, {
-          resolve: resolveStep,
-          reject: rejectStep,
-          setOutput: (text: string) => {
-            if (taskRef) {
-              taskRef.output = text;
-            }
-          },
-          markSkipped: () => {
-            skipped = true;
-            if (taskRef) {
-              taskRef.title = chalk.dim(`${event.stepName} (skipped)`);
-            }
-          },
-        });
-
-        listr.add({
-          title: chalk.white(event.stepName),
-          task: async (_ctx: unknown, task: any): Promise<void> => {
-            taskRef = task as RenderableTask;
-            if (skipped) {
-              taskRef.title = chalk.dim(`${event.stepName} (skipped)`);
-            }
-            await done;
-          },
-          rendererOptions: {
-            persistentOutput: true,
-          },
-        });
-        break;
-      }
-
-      case 'step:owner-assigned': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.setOutput(
-            chalk.dim(`> Owner: ${event.ownerName}`) +
-              (event.specialistName ? chalk.dim(` - specialist: ${event.specialistName}`) : '')
-          );
-        }
-        break;
-      }
-
-      case 'step:retrying': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.setOutput(chalk.yellow(`Retrying (attempt ${event.attempt})`));
-        }
-        break;
-      }
-
-      case 'step:nudged': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.setOutput(chalk.dim(`> Nudge #${event.nudgeCount}`));
-        }
-        break;
-      }
-
-      case 'step:force-released': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.setOutput(chalk.yellow('> Force-released'));
-        }
-        break;
-      }
-
-      case 'step:review-completed': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.setOutput(chalk.dim(`> Review: ${event.decision} by ${event.reviewerName}`));
-        }
-        break;
-      }
-
-      case 'step:owner-timeout': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.setOutput(chalk.red(`> Owner ${event.ownerName} timed out`));
-        }
-        break;
-      }
-
-      case 'step:agent-report': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          const model = event.report.model ? `:${event.report.model}` : '';
-          handle.setOutput(chalk.dim(`> Report collected (${event.report.cli}${model})`));
-        }
-        break;
-      }
-
-      case 'step:completed': {
-        stepHandles.get(event.stepName)?.resolve();
-        break;
-      }
-
-      case 'step:skipped': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.markSkipped();
-          handle.resolve();
-        } else {
-          // Step was skipped without ever being started (downstream of a failure).
-          // Add an already-resolved task so it shows in the listr output.
-          listr.add({
-            title: chalk.dim(`${event.stepName} (skipped)`),
-            task: async (): Promise<void> => {},
-            rendererOptions: { persistentOutput: true },
-          });
-        }
-        break;
-      }
-
-      case 'step:failed': {
-        stepHandles.get(event.stepName)?.reject(new Error(event.error ?? 'Step failed'));
-        break;
-      }
-
-      case 'run:completed': {
-        setHeader(chalk.green('Workflow completed'));
-        resolveWorkflow();
-        break;
-      }
-
-      case 'run:failed': {
-        setHeader(chalk.red(`Workflow failed: ${event.error}`));
-        rejectWorkflow(new Error(event.error ?? 'Workflow failed'));
-        break;
-      }
-
-      case 'run:cancelled': {
-        setHeader(chalk.yellow('Workflow cancelled'));
-        resolveWorkflow();
-        break;
-      }
-
-      case 'broker:event':
-        break;
-
-      default: {
-        const _exhaustive: never = event;
-        void _exhaustive;
-      }
-    }
-  });
-
-  const [result] = await Promise.all([
-    runner.execute(config, workflowName, undefined, executeOptions),
-    listr.run().catch(() => {
-      // Step failures are already represented in runner result.
-    }),
-  ]);
-
-  restoreConsole();
-  return result;
-}
-
-async function main(): Promise<void> {
-  const args = process.argv.slice(2);
-  const yamlPath = getYamlPathArg(args);
-
-  if (args.length === 0 || args.includes('--help')) {
-    printUsage();
-    process.exit(args.includes('--help') ? 0 : 1);
-  }
-
-  // Use a file-backed DB so runs survive process restarts and --resume works.
-  const dbPath = path.join(process.cwd(), '.agent-relay', 'workflow-runs.jsonl');
-  const fileDb = new JsonFileWorkflowDb(dbPath);
-  if (!fileDb.isWritable()) {
-    console.warn(
-      `[workflow] warning: cannot write to ${dbPath} — run state will not be persisted (--resume unavailable)`
-    );
-  }
-
-  const runner = new WorkflowRunner({ db: fileDb });
-  let shuttingDown = false;
-  const shutdown = async (signal: string): Promise<void> => {
-    if (shuttingDown) return;
-    shuttingDown = true;
-    console.log(`\n[workflow] ${signal} received — shutting down broker...`);
-    await runner.relay?.shutdown().catch(() => undefined);
-    process.exit(130);
-  };
-  process.on('SIGINT', () => void shutdown('SIGINT'));
-  process.on('SIGTERM', () => void shutdown('SIGTERM'));
-
-  // ── Resume mode ────────────────────────────────────────────────────────────
-  const resumeIdx = args.indexOf('--resume');
-  if (resumeIdx !== -1) {
-    const runId = args[resumeIdx + 1];
-    if (!runId) {
-      console.error(chalk.red('Error: --resume requires a run ID'));
-      process.exit(1);
-    }
-
-    console.log(chalk.dim(`Resuming run ${runId}...`));
-    runner.on((event: WorkflowEvent) => {
-      const ts = new Date().toISOString().slice(11, 19);
-      switch (event.type) {
-        case 'step:started':
-          console.log(chalk.dim(`[${ts}]`), chalk.white(event.stepName), chalk.dim('started'));
-          break;
-        case 'step:completed':
-          console.log(chalk.dim(`[${ts}]`), chalk.green('✔'), event.stepName);
-          break;
-        case 'step:failed':
-          console.log(chalk.dim(`[${ts}]`), chalk.red('✗'), event.stepName, chalk.red(event.error ?? ''));
-          break;
-        case 'step:skipped':
-          console.log(chalk.dim(`[${ts}]`), chalk.dim('⊘'), chalk.dim(event.stepName));
-          break;
-        default:
-          break;
-      }
-    });
-    let result: RunnerResult;
-    try {
-      const resumeConfig = yamlPath ? await runner.parseYamlFile(yamlPath) : undefined;
-      if (resumeConfig) {
-        console.warn(
-          chalk.yellow(
-            '[workflow] warning: resuming with current config from disk — ' +
-              'if the workflow YAML changed since the original run, behaviour may differ'
-          )
-        );
-      }
-      result = await runner.resume(runId, undefined, resumeConfig);
-    } catch (err) {
-      const message = err instanceof Error ? err.message : String(err);
-      const isRunNotFound = message.startsWith(`Run "${runId}" not found`);
-      if (isRunNotFound) {
-        if (fileDb.hasStepOutputs(runId)) {
-          console.error(
-            chalk.red(
-              `Error: ${message}. Step outputs exist for this run, but persisted run state is missing from ${dbPath}. ` +
-                `Use --start-from with --previous-run-id ${runId} to recover from the cached step outputs instead.`
-            )
-          );
-        } else {
-          console.error(chalk.red(`Error: ${message}`));
-        }
-      } else {
-        console.error(chalk.red(`Error: ${message}`));
-      }
-      process.exit(1);
-    }
-
-    if (result.status === 'completed') {
-      console.log(chalk.green('\nWorkflow completed successfully.'));
-      process.exit(0);
-    } else {
-      console.error(chalk.red(`\nWorkflow ${result.status}${result.error ? `: ${result.error}` : ''}`));
-      process.exit(1);
-    }
-    return;
-  }
-
-  // ── Normal / validate / dry-run mode ──────────────────────────────────────
-  let workflowName: string | undefined;
-
-  const workflowIdx = args.indexOf('--workflow');
-  if (workflowIdx !== -1 && args[workflowIdx + 1]) {
-    workflowName = args[workflowIdx + 1];
-  }
-
-  let startFromStep: string | undefined;
-  const startFromIdx = args.indexOf('--start-from');
-  if (startFromIdx !== -1 && args[startFromIdx + 1]) {
-    startFromStep = args[startFromIdx + 1];
-  }
-
-  let previousRunId: string | undefined;
-  const prevRunIdx = args.indexOf('--previous-run-id');
-  if (prevRunIdx !== -1 && args[prevRunIdx + 1]) {
-    previousRunId = args[prevRunIdx + 1];
-  }
-
-  if (!yamlPath) {
-    console.error(chalk.red('Error: workflow YAML path is required'));
-    printUsage();
-    process.exit(1);
-  }
-
-  const isValidate = args.includes('--validate');
-  const isDryRun = !!process.env.DRY_RUN;
-
-  const config = await runner.parseYamlFile(yamlPath);
-
-  if (isValidate) {
-    const { validateWorkflow, formatValidationReport } = await import('./validator.js');
-    const issues = validateWorkflow(config);
-    console.log(formatValidationReport(issues, yamlPath));
-    process.exit(issues.some((issue) => issue.severity === 'error') ? 1 : 0);
-  }
-
-  if (isDryRun) {
-    const { formatDryRunReport } = await import('./dry-run-format.js');
-    const report = runner.dryRun(config, workflowName);
-    console.log(formatDryRunReport(report));
-    process.exit(report.valid ? 0 : 1);
-  }
-
-  const executeOptions = startFromStep ? { startFrom: startFromStep, previousRunId } : undefined;
-  const result = await runWithListr(runner, config, workflowName, executeOptions);
-
-  if (result.status === 'completed') {
-    console.log(chalk.green('\nWorkflow completed successfully.'));
-    process.exit(0);
-  } else {
-    console.error(chalk.red(`\nWorkflow ${result.status}${result.error ? `: ${result.error}` : ''}`));
-    process.exit(1);
-  }
-}
-
-main().catch((err: Error) => {
-  console.error(chalk.red(`Error: ${err.message}`));
-  process.exit(1);
-});
diff --git a/packages/sdk/src/workflows/cloud-runner.ts b/packages/sdk/src/workflows/cloud-runner.ts
deleted file mode 100644
index de653f3f1..000000000
--- a/packages/sdk/src/workflows/cloud-runner.ts
+++ /dev/null
@@ -1,74 +0,0 @@
-/**
- * Cloud workflow runner — submits workflows to AgentWorkforce cloud API
- * and polls for completion.
- */
-import type { RelayYamlConfig, WorkflowRunRow, WorkflowRunStatus } from './types.js';
-
-export interface CloudRunOptions {
-  cloudApiUrl: string;
-  cloudApiToken: string;
-  envSecrets?: Record<string, string>;
-  pollIntervalMs?: number;
-  timeoutMs?: number;
-  onStatusChange?: (status: WorkflowRunStatus, runId: string) => void;
-}
-
-export async function runInCloud(config: RelayYamlConfig, options: CloudRunOptions): Promise<WorkflowRunRow> {
-  const { cloudApiUrl, cloudApiToken, envSecrets, pollIntervalMs = 3000, timeoutMs = 1800000 } = options;
-  const baseUrl = cloudApiUrl.replace(/\/$/, '');
-
-  const { stringify: stringifyYaml } = await import('yaml');
-  const yamlStr = stringifyYaml(config);
-
-  const submitRes = await fetch(`${baseUrl}/api/v1/workflows/run`, {
-    method: 'POST',
-    headers: { 'Content-Type': 'application/json', Authorization: `Bearer ${cloudApiToken}` },
-    body: JSON.stringify({
-      workflow: yamlStr,
-      fileType: 'yaml' as const,
-      ...(envSecrets ? { envSecrets } : {}),
-    }),
-  });
-  if (!submitRes.ok) throw new Error(`Cloud submit failed (${submitRes.status}): ${await submitRes.text()}`);
-
-  const { runId } = (await submitRes.json()) as { runId: string; sandboxId: string; status: string };
-  const deadline = Date.now() + timeoutMs;
-  let lastStatus: WorkflowRunStatus = 'pending';
-
-  while (Date.now() < deadline) {
-    await new Promise((r) => setTimeout(r, pollIntervalMs));
-    const statusRes = await fetch(`${baseUrl}/api/v1/workflows/runs/${runId}`, {
-      headers: { Authorization: `Bearer ${cloudApiToken}` },
-    });
-    if (!statusRes.ok) continue;
-
-    const data = (await statusRes.json()) as {
-      runId: string;
-      status: WorkflowRunStatus;
-      error?: string;
-      createdAt?: string;
-      updatedAt?: string;
-    };
-    if (data.status !== lastStatus) {
-      lastStatus = data.status;
-      options.onStatusChange?.(lastStatus, runId);
-    }
-
-    if (data.status === 'completed' || data.status === 'failed') {
-      return {
-        id: runId,
-        workspaceId: '',
-        workflowName: config.name ?? 'cloud-workflow',
-        pattern: (config.swarm?.pattern as any) ?? 'dag',
-        status: data.status,
-        config,
-        startedAt: data.createdAt ?? new Date().toISOString(),
-        completedAt: data.updatedAt ?? new Date().toISOString(),
-        error: data.error,
-        createdAt: data.createdAt ?? new Date().toISOString(),
-        updatedAt: data.updatedAt ?? new Date().toISOString(),
-      };
-    }
-  }
-  throw new Error(`Cloud workflow timed out after ${timeoutMs}ms (runId: ${runId})`);
-}
diff --git a/packages/sdk/src/workflows/cloud-schedules.ts b/packages/sdk/src/workflows/cloud-schedules.ts
deleted file mode 100644
index 49b8ae0b4..000000000
--- a/packages/sdk/src/workflows/cloud-schedules.ts
+++ /dev/null
@@ -1,3 +0,0 @@
-export { listWorkflowSchedules, scheduleWorkflow } from '@agent-relay/cloud';
-
-export type { ScheduleWorkflowOptions, WorkflowSchedule } from '@agent-relay/cloud';
diff --git a/packages/sdk/src/workflows/collectors/claude.ts b/packages/sdk/src/workflows/collectors/claude.ts
deleted file mode 100644
index 950c0c986..000000000
--- a/packages/sdk/src/workflows/collectors/claude.ts
+++ /dev/null
@@ -1,410 +0,0 @@
-import { createReadStream, existsSync, statSync } from 'node:fs';
-import { access } from 'node:fs/promises';
-import { homedir } from 'node:os';
-import path from 'node:path';
-import { createInterface } from 'node:readline';
-
-import type { CliSessionCollector, CliSessionQuery, CliSessionReport } from '../cli-session-collector.js';
-
-const CLAUDE_HOME = path.join(homedir(), '.claude');
-const HISTORY_PATH = path.join(CLAUDE_HOME, 'history.jsonl');
-const PROJECTS_PATH = path.join(CLAUDE_HOME, 'projects');
-const HISTORY_LOOKBACK_MS = 5_000;
-
-type JsonRecord = Record<string, unknown>;
-
-interface ClaudeHistoryEntry {
-  display?: string;
-  timestamp: number;
-  project: string;
-  sessionId: string;
-}
-
-export class ClaudeCodeCollector implements CliSessionCollector {
-  canCollect(): boolean {
-    return isReadableFile(HISTORY_PATH) && isReadableDirectory(PROJECTS_PATH);
-  }
-
-  async collect(query: CliSessionQuery): Promise<CliSessionReport | null> {
-    const historyEntry = await findMatchingHistoryEntry(query);
-    if (!historyEntry) {
-      return null;
-    }
-
-    const sessionPath = path.join(
-      PROJECTS_PATH,
-      encodeProjectPath(historyEntry.project),
-      `${historyEntry.sessionId}.jsonl`
-    );
-    if (!(await isReadableFileAsync(sessionPath))) {
-      return null;
-    }
-
-    return parseSessionLog(sessionPath, query, historyEntry.sessionId);
-  }
-}
-
-async function findMatchingHistoryEntry(query: CliSessionQuery): Promise<ClaudeHistoryEntry | null> {
-  const history = createInterface({
-    input: createReadStream(HISTORY_PATH, { encoding: 'utf8' }),
-    crlfDelay: Infinity,
-  });
-  let match: ClaudeHistoryEntry | null = null;
-
-  try {
-    for await (const line of history) {
-      const parsed = safeParseRecord(line);
-      if (!parsed) {
-        continue;
-      }
-
-      const entry = toHistoryEntry(parsed);
-      if (!entry) {
-        continue;
-      }
-
-      if (entry.project !== query.cwd) {
-        continue;
-      }
-
-      if (entry.timestamp < query.startedAt - HISTORY_LOOKBACK_MS || entry.timestamp > query.completedAt) {
-        continue;
-      }
-
-      match = entry;
-    }
-  } finally {
-    history.close();
-  }
-
-  return match;
-}
-
-async function parseSessionLog(
-  sessionPath: string,
-  query: CliSessionQuery,
-  sessionId: string
-): Promise<CliSessionReport | null> {
-  const session = createInterface({
-    input: createReadStream(sessionPath, { encoding: 'utf8' }),
-    crlfDelay: Infinity,
-  });
-
-  const rawLines: JsonRecord[] = [];
-  const toolCalls = new Map<string, number>();
-  const errors: { turn: number; text: string }[] = [];
-  const tokens = { input: 0, output: 0, cacheRead: 0 };
-  let turns = 0;
-  let summary: string | null = null;
-  let model: string | null = null;
-  let provider: string | null = null;
-  let finalStatus: CliSessionReport['finalStatus'] = 'unknown';
-
-  try {
-    for await (const line of session) {
-      const parsed = safeParseRecord(line);
-      if (!parsed) {
-        continue;
-      }
-
-      rawLines.push(parsed);
-
-      const entryType = getString(parsed.type);
-      if (entryType === 'user') {
-        turns += 1;
-        continue;
-      }
-
-      if (entryType === 'assistant') {
-        const usage = extractUsage(parsed);
-        if (usage) {
-          tokens.input += usage.input;
-          tokens.output += usage.output;
-          tokens.cacheRead += usage.cacheRead;
-        }
-
-        model ??= extractModel(parsed);
-        provider ??= extractProvider(parsed);
-
-        const assistantText = extractText(parsed);
-        if (assistantText) {
-          summary = assistantText;
-          if (finalStatus !== 'failed') {
-            finalStatus = 'completed';
-          }
-        }
-        continue;
-      }
-
-      if (entryType === 'tool_use') {
-        const toolName = extractToolName(parsed);
-        if (toolName) {
-          toolCalls.set(toolName, (toolCalls.get(toolName) ?? 0) + 1);
-        }
-        continue;
-      }
-
-      if (entryType === 'tool_result') {
-        const errorText = extractErrorText(parsed);
-        if (errorText) {
-          errors.push({ turn: Math.max(turns, 1), text: errorText });
-          finalStatus = 'failed';
-        }
-      }
-    }
-  } finally {
-    session.close();
-  }
-
-  if (rawLines.length === 0) {
-    return null;
-  }
-
-  return {
-    cli: 'claude',
-    sessionId,
-    model,
-    provider,
-    durationMs: Math.max(query.completedAt - query.startedAt, 0),
-    cost: null,
-    tokens: tokens.input || tokens.output || tokens.cacheRead ? tokens : null,
-    turns,
-    toolCalls: Array.from(toolCalls, ([name, count]) => ({ name, count })),
-    errors,
-    finalStatus,
-    summary,
-    raw: {
-      historyPath: HISTORY_PATH,
-      sessionPath,
-      lines: rawLines,
-    },
-  };
-}
-
-function toHistoryEntry(record: JsonRecord): ClaudeHistoryEntry | null {
-  const timestamp = getNumber(record.timestamp);
-  const project = getString(record.project);
-  const sessionId = getString(record.sessionId);
-  if (timestamp === null || !project || !sessionId) {
-    return null;
-  }
-
-  return {
-    display: getString(record.display) ?? undefined,
-    timestamp,
-    project,
-    sessionId,
-  };
-}
-
-function encodeProjectPath(projectPath: string): string {
-  return projectPath.replace(/\//g, '--').replace(/^-+/, '');
-}
-
-function extractUsage(record: JsonRecord): { input: number; output: number; cacheRead: number } | null {
-  const usage = findNestedRecord(record, [
-    'usage',
-    'message.usage',
-    'metadata.usage',
-    'message.metadata.usage',
-  ]);
-  if (!usage) {
-    return null;
-  }
-
-  return {
-    input: firstNumber(usage, ['input_tokens', 'inputTokens']) ?? 0,
-    output: firstNumber(usage, ['output_tokens', 'outputTokens']) ?? 0,
-    cacheRead:
-      firstNumber(usage, ['cache_read_input_tokens', 'cacheReadInputTokens', 'cache_read_tokens']) ?? 0,
-  };
-}
-
-function extractModel(record: JsonRecord): string | null {
-  return (
-    getString(record.model) ??
-    getString(record.modelId) ??
-    getString(findNestedValue(record, ['message.model', 'message.modelId', 'metadata.model']))
-  );
-}
-
-function extractProvider(record: JsonRecord): string | null {
-  return (
-    getString(record.provider) ??
-    getString(record.providerId) ??
-    getString(findNestedValue(record, ['message.provider', 'message.providerId', 'metadata.provider'])) ??
-    'anthropic'
-  );
-}
-
-function extractToolName(record: JsonRecord): string | null {
-  return (
-    getString(record.name) ??
-    getString(record.tool_name) ??
-    getString(findNestedValue(record, ['tool.name', 'content.name']))
-  );
-}
-
-function extractErrorText(record: JsonRecord): string | null {
-  const candidates = [
-    getString(record.error),
-    getString(findNestedValue(record, ['content.error', 'result.error', 'data.error', 'payload.error'])),
-    extractText(record),
-  ];
-
-  for (const candidate of candidates) {
-    const normalized = normalizeError(candidate);
-    if (normalized) {
-      return normalized;
-    }
-  }
-
-  return null;
-}
-
-function extractText(value: unknown): string | null {
-  if (typeof value === 'string') {
-    return value.trim() || null;
-  }
-
-  if (!value || typeof value !== 'object') {
-    return null;
-  }
-
-  if (Array.isArray(value)) {
-    const texts = value.map((entry) => extractText(entry)).filter((entry): entry is string => Boolean(entry));
-    return texts.length > 0 ? texts.join('\n').trim() : null;
-  }
-
-  const record = value as JsonRecord;
-
-  if (typeof record.text === 'string' && record.text.trim()) {
-    return record.text.trim();
-  }
-
-  if (typeof record.content === 'string' && record.content.trim()) {
-    return record.content.trim();
-  }
-
-  if (Array.isArray(record.content)) {
-    const texts = record.content
-      .map((entry) => extractText(entry))
-      .filter((entry): entry is string => Boolean(entry));
-    if (texts.length > 0) {
-      return texts.join('\n').trim();
-    }
-  }
-
-  if (record.message && typeof record.message === 'object') {
-    return extractText(record.message);
-  }
-
-  return null;
-}
-
-function normalizeError(text: string | null): string | null {
-  if (!text) {
-    return null;
-  }
-
-  const line = text
-    .split('\n')
-    .map((entry) => entry.trim())
-    .find((entry) => /(?:^error\b|^error:|^command failed\b|^fail\b|exception|traceback)/i.test(entry));
-
-  return line ?? null;
-}
-
-function safeParseRecord(line: string): JsonRecord | null {
-  const trimmed = line.trim();
-  if (!trimmed) {
-    return null;
-  }
-
-  try {
-    const parsed = JSON.parse(trimmed);
-    if (!parsed || typeof parsed !== 'object' || Array.isArray(parsed)) {
-      return null;
-    }
-
-    return parsed as JsonRecord;
-  } catch {
-    return null;
-  }
-}
-
-function findNestedRecord(root: JsonRecord, paths: string[]): JsonRecord | null {
-  for (const candidate of paths) {
-    const value = findNestedValue(root, [candidate]);
-    if (value && typeof value === 'object' && !Array.isArray(value)) {
-      return value as JsonRecord;
-    }
-  }
-
-  return null;
-}
-
-function findNestedValue(root: JsonRecord, paths: string[]): unknown {
-  for (const candidate of paths) {
-    let current: unknown = root;
-    let found = true;
-
-    for (const segment of candidate.split('.')) {
-      if (!current || typeof current !== 'object' || Array.isArray(current) || !(segment in current)) {
-        found = false;
-        break;
-      }
-      current = (current as JsonRecord)[segment];
-    }
-
-    if (found) {
-      return current;
-    }
-  }
-
-  return undefined;
-}
-
-function firstNumber(record: JsonRecord, keys: string[]): number | null {
-  for (const key of keys) {
-    const value = record[key];
-    if (typeof value === 'number' && Number.isFinite(value)) {
-      return value;
-    }
-  }
-
-  return null;
-}
-
-function getString(value: unknown): string | null {
-  return typeof value === 'string' && value.trim() ? value.trim() : null;
-}
-
-function getNumber(value: unknown): number | null {
-  return typeof value === 'number' && Number.isFinite(value) ? value : null;
-}
-
-function isReadableFile(filePath: string): boolean {
-  try {
-    return existsSync(filePath) && statSync(filePath).isFile();
-  } catch {
-    return false;
-  }
-}
-
-function isReadableDirectory(dirPath: string): boolean {
-  try {
-    return existsSync(dirPath) && statSync(dirPath).isDirectory();
-  } catch {
-    return false;
-  }
-}
-
-async function isReadableFileAsync(filePath: string): Promise<boolean> {
-  try {
-    await access(filePath);
-    return true;
-  } catch {
-    return false;
-  }
-}
diff --git a/packages/sdk/src/workflows/collectors/codex.ts b/packages/sdk/src/workflows/collectors/codex.ts
deleted file mode 100644
index 5f0ffc966..000000000
--- a/packages/sdk/src/workflows/collectors/codex.ts
+++ /dev/null
@@ -1,355 +0,0 @@
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import { createRequire } from 'node:module';
-
-import type { CliSessionCollector, CliSessionQuery, CliSessionReport } from '../cli-session-collector.js';
-
-const require = createRequire(import.meta.url);
-const CODEX_HOME = path.join(os.homedir(), '.codex');
-const DEFAULT_HISTORY_PATH = path.join(CODEX_HOME, 'history.jsonl');
-const DEFAULT_STATE_PATH = path.join(CODEX_HOME, 'state_5.sqlite');
-
-type DatabaseInstance = {
-  prepare(sql: string): {
-    all<T>(params?: unknown): T[];
-  };
-  close?: () => void;
-};
-
-type DatabaseConstructor = new (
-  filename: string,
-  options?: { readonly?: boolean; fileMustExist?: boolean }
-) => DatabaseInstance;
-
-interface DatabaseSyncModule {
-  DatabaseSync: new (filename: string, options?: { readOnly?: boolean; open?: boolean }) => DatabaseInstance;
-}
-
-interface CodexCollectorOptions {
-  historyPath?: string;
-  statePath?: string;
-}
-
-interface HistoryEntry {
-  session_id?: string;
-  ts?: number;
-  text?: string;
-}
-
-interface ThreadRow {
-  id: string;
-  cwd: string;
-  model_provider: string;
-  tokens_used: number;
-  created_at: number;
-  updated_at: number;
-  [key: string]: unknown;
-}
-
-interface LogRow {
-  ts?: number;
-  level?: string;
-  message?: string | null;
-  line?: number | null;
-}
-
-function loadBetterSqlite3(): DatabaseConstructor | null {
-  try {
-    return require('better-sqlite3') as DatabaseConstructor;
-  } catch {
-    return null;
-  }
-}
-
-async function openDatabase(dbPath: string): Promise<DatabaseInstance | null> {
-  const BetterSqlite = loadBetterSqlite3();
-  if (BetterSqlite) {
-    try {
-      return new BetterSqlite(dbPath, { readonly: true, fileMustExist: true });
-    } catch {
-      // Fall through to node:sqlite.
-    }
-  }
-
-  try {
-    const sqlite = (await import('node:sqlite')) as DatabaseSyncModule;
-    return new sqlite.DatabaseSync(dbPath, { readOnly: true, open: true });
-  } catch {
-    return null;
-  }
-}
-
-function normalizeTimestamp(value: unknown): number | null {
-  const numeric =
-    typeof value === 'number' && Number.isFinite(value)
-      ? value
-      : typeof value === 'string' && value.trim()
-        ? Number(value)
-        : null;
-  if (numeric === null || !Number.isFinite(numeric)) {
-    return null;
-  }
-
-  return numeric < 10_000_000_000 ? numeric * 1000 : numeric;
-}
-
-function parseJsonLine<T>(line: string): T | null {
-  try {
-    return JSON.parse(line) as T;
-  } catch {
-    return null;
-  }
-}
-
-function parseModelProvider(value: string | null | undefined): {
-  provider: string | null;
-  model: string | null;
-} {
-  if (!value) {
-    return { provider: null, model: null };
-  }
-
-  if (value.includes('/')) {
-    const [provider, ...rest] = value.split('/');
-    return {
-      provider: provider || null,
-      model: rest.join('/') || null,
-    };
-  }
-
-  if (value.includes(':')) {
-    const [provider, ...rest] = value.split(':');
-    return {
-      provider: provider || null,
-      model: rest.join(':') || null,
-    };
-  }
-
-  return {
-    provider: value,
-    model: null,
-  };
-}
-
-function getNumericField(row: ThreadRow, fieldNames: string[]): number | null {
-  for (const fieldName of fieldNames) {
-    const value = row[fieldName];
-    if (typeof value === 'number' && Number.isFinite(value)) {
-      return value;
-    }
-  }
-
-  return null;
-}
-
-function extractTokens(row: ThreadRow): CliSessionReport['tokens'] {
-  const input = getNumericField(row, ['input_tokens', 'prompt_tokens', 'tokens_input']);
-  const output = getNumericField(row, ['output_tokens', 'completion_tokens', 'tokens_output']);
-  const cacheRead = getNumericField(row, ['cache_read_tokens', 'tokens_cache_read', 'cached_input_tokens']);
-
-  if (input !== null || output !== null || cacheRead !== null) {
-    return {
-      input: input ?? 0,
-      output: output ?? 0,
-      cacheRead: cacheRead ?? 0,
-    };
-  }
-
-  return typeof row.tokens_used === 'number'
-    ? {
-        input: row.tokens_used,
-        output: 0,
-        cacheRead: 0,
-      }
-    : null;
-}
-
-export class CodexCollector implements CliSessionCollector {
-  private readonly historyPath: string;
-  private readonly statePath: string;
-
-  constructor(options: CodexCollectorOptions = {}) {
-    this.historyPath = options.historyPath ?? DEFAULT_HISTORY_PATH;
-    this.statePath = options.statePath ?? DEFAULT_STATE_PATH;
-  }
-
-  canCollect(): boolean {
-    return fs.existsSync(this.statePath) || fs.existsSync(this.historyPath);
-  }
-
-  async collect(query: CliSessionQuery): Promise<CliSessionReport | null> {
-    const historyEntries = this.readHistoryEntries();
-    const matchedThread = await this.findMatchingThread(query);
-
-    if (matchedThread) {
-      const errors = await this.readThreadErrors(matchedThread.id);
-      const { provider, model } = parseModelProvider(matchedThread.model_provider);
-      const createdAtMs = normalizeTimestamp(matchedThread.created_at);
-      const updatedAtMs = normalizeTimestamp(matchedThread.updated_at);
-
-      return {
-        cli: 'codex',
-        sessionId: matchedThread.id,
-        model,
-        provider,
-        durationMs:
-          createdAtMs !== null && updatedAtMs !== null && updatedAtMs >= createdAtMs
-            ? updatedAtMs - createdAtMs
-            : Math.max(query.completedAt - query.startedAt, 0),
-        cost: null,
-        tokens: extractTokens(matchedThread),
-        turns: historyEntries.filter((entry) => entry.session_id === matchedThread.id).length,
-        toolCalls: [],
-        errors,
-        finalStatus: errors.length > 0 ? 'failed' : 'unknown',
-        summary: null,
-        raw: {
-          matchedVia: 'threads',
-          thread: matchedThread,
-        },
-      };
-    }
-
-    const historyMatch = this.findMatchingHistoryEntry(query, historyEntries);
-    if (!historyMatch) {
-      return null;
-    }
-
-    return {
-      cli: 'codex',
-      sessionId: historyMatch.session_id ?? null,
-      model: null,
-      provider: null,
-      durationMs: Math.max(query.completedAt - query.startedAt, 0),
-      cost: null,
-      tokens: null,
-      turns: historyMatch.session_id
-        ? historyEntries.filter((entry) => entry.session_id === historyMatch.session_id).length
-        : 0,
-      toolCalls: [],
-      errors: [],
-      finalStatus: 'unknown',
-      summary: null,
-      raw: {
-        matchedVia: 'history',
-        entry: historyMatch,
-      },
-    };
-  }
-
-  private readHistoryEntries(): HistoryEntry[] {
-    if (!fs.existsSync(this.historyPath)) {
-      return [];
-    }
-
-    try {
-      return fs
-        .readFileSync(this.historyPath, 'utf8')
-        .split(/\r?\n/)
-        .map((line) => line.trim())
-        .filter(Boolean)
-        .flatMap((line) => {
-          const parsed = parseJsonLine<HistoryEntry>(line);
-          return parsed ? [parsed] : [];
-        });
-    } catch {
-      return [];
-    }
-  }
-
-  private findMatchingHistoryEntry(query: CliSessionQuery, entries: HistoryEntry[]): HistoryEntry | null {
-    for (let index = entries.length - 1; index >= 0; index -= 1) {
-      const entry = entries[index];
-      const timestamp = normalizeTimestamp(entry.ts);
-      if (timestamp === null) {
-        continue;
-      }
-
-      if (timestamp >= query.startedAt && timestamp <= query.completedAt) {
-        return entry;
-      }
-    }
-
-    return null;
-  }
-
-  private async findMatchingThread(query: CliSessionQuery): Promise<ThreadRow | null> {
-    if (!fs.existsSync(this.statePath)) {
-      return null;
-    }
-
-    const db = await openDatabase(this.statePath);
-    if (!db) {
-      return null;
-    }
-
-    try {
-      const threads = db
-        .prepare(
-          `
-          SELECT *
-          FROM threads
-          WHERE cwd = ?
-          ORDER BY created_at DESC
-          LIMIT 100
-        `
-        )
-        .all<ThreadRow>(query.cwd);
-
-      return (
-        threads.find((thread) => {
-          const createdAt = normalizeTimestamp(thread.created_at);
-          return createdAt !== null && createdAt >= query.startedAt && createdAt <= query.completedAt;
-        }) ?? null
-      );
-    } catch {
-      return null;
-    } finally {
-      db.close?.();
-    }
-  }
-
-  private async readThreadErrors(threadId: string): Promise<CliSessionReport['errors']> {
-    if (!fs.existsSync(this.statePath)) {
-      return [];
-    }
-
-    const db = await openDatabase(this.statePath);
-    if (!db) {
-      return [];
-    }
-
-    try {
-      const rows = db
-        .prepare(
-          `
-          SELECT ts, level, message, line
-          FROM logs
-          WHERE thread_id = ?
-            AND lower(level) = 'error'
-          ORDER BY ts ASC
-        `
-        )
-        .all<LogRow>(threadId);
-
-      return rows
-        .map((row, index) => {
-          const message = typeof row.message === 'string' ? row.message.trim() : '';
-          if (!message) {
-            return null;
-          }
-
-          return {
-            turn: index + 1,
-            text: message,
-          };
-        })
-        .filter((row): row is { turn: number; text: string } => row !== null);
-    } catch {
-      return [];
-    } finally {
-      db.close?.();
-    }
-  }
-}
diff --git a/packages/sdk/src/workflows/collectors/opencode.ts b/packages/sdk/src/workflows/collectors/opencode.ts
deleted file mode 100644
index 4ceb7884b..000000000
--- a/packages/sdk/src/workflows/collectors/opencode.ts
+++ /dev/null
@@ -1,321 +0,0 @@
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import { createRequire } from 'node:module';
-
-import type { CliSessionCollector, CliSessionQuery, CliSessionReport } from '../cli-session-collector.js';
-
-const require = createRequire(import.meta.url);
-const OPENCODE_DB_PATH = path.join(os.homedir(), '.local', 'share', 'opencode', 'opencode.db');
-const MATCH_WINDOW_GRACE_MS = 5_000;
-const ERROR_LINE_PATTERN = /^(Error|error:|Command failed|FAIL)\b/;
-
-type DatabaseInstance = {
-  prepare(sql: string): {
-    get<T>(params?: unknown): T | undefined;
-    all<T>(params?: unknown): T[];
-  };
-  pragma(source: string): unknown;
-  close(): void;
-};
-
-type DatabaseConstructor = new (
-  filename: string,
-  options?: { readonly?: boolean; fileMustExist?: boolean }
-) => DatabaseInstance;
-
-interface SessionRow {
-  id: string;
-  directory: string;
-  time_created: number;
-}
-
-interface MessageRow {
-  id: string;
-  session_id: string;
-  time_created: number;
-  data: string;
-}
-
-interface PartRow {
-  id: string;
-  message_id: string;
-  session_id: string;
-  time_created: number;
-  data: string;
-}
-
-interface OpenCodeMessageData {
-  role?: string;
-  modelID?: string;
-  providerID?: string;
-  cost?: number;
-  finish?: string;
-  tokens?: {
-    input?: number;
-    output?: number;
-    cache?: {
-      read?: number;
-    };
-  };
-}
-
-interface OpenCodePartData {
-  type?: string;
-  text?: string;
-  name?: string;
-}
-
-function loadDatabaseConstructor(): DatabaseConstructor | null {
-  try {
-    return require('better-sqlite3') as DatabaseConstructor;
-  } catch {
-    // fall through
-  }
-
-  // Fall back to Node 22+ native node:sqlite (experimental)
-  try {
-    // eslint-disable-next-line @typescript-eslint/no-require-imports
-    const { DatabaseSync } = require('node:sqlite');
-    return function NativeSqliteWrapper(
-      filename: string,
-      options?: { readonly?: boolean; fileMustExist?: boolean }
-    ) {
-      const db = new DatabaseSync(filename, { open: true, readOnly: options?.readonly ?? false });
-      return {
-        prepare(sql: string) {
-          const stmt = db.prepare(sql);
-          return {
-            get<T>(params?: unknown): T | undefined {
-              return params != null ? (stmt.get(params) as T | undefined) : (stmt.get() as T | undefined);
-            },
-            all<T>(params?: unknown): T[] {
-              return (params != null ? stmt.all(params) : stmt.all()) as T[];
-            },
-          };
-        },
-        pragma(source: string) {
-          db.exec(`PRAGMA ${source}`);
-          return undefined;
-        },
-        close() {
-          db.close();
-        },
-      };
-    } as unknown as DatabaseConstructor;
-  } catch {
-    return null;
-  }
-}
-
-function parseJson<T>(value: string): T | null {
-  try {
-    return JSON.parse(value) as T;
-  } catch {
-    return null;
-  }
-}
-
-function toNumber(value: unknown): number {
-  return typeof value === 'number' && Number.isFinite(value) ? value : 0;
-}
-
-function normalizeStatus(finish: string | undefined, hasErrors: boolean): CliSessionReport['finalStatus'] {
-  if (finish === 'stop' || finish === 'completed') {
-    return 'completed';
-  }
-
-  if (finish === 'error' || finish === 'failed' || hasErrors) {
-    return 'failed';
-  }
-
-  return 'unknown';
-}
-
-function isToolPart(part: OpenCodePartData | null): part is OpenCodePartData {
-  return !!part?.type && part.type.toLowerCase().includes('tool');
-}
-
-export class OpenCodeCollector implements CliSessionCollector {
-  canCollect(): boolean {
-    if (!fs.existsSync(OPENCODE_DB_PATH)) {
-      return false;
-    }
-
-    const Database = loadDatabaseConstructor();
-    if (!Database) {
-      return false;
-    }
-
-    let db: DatabaseInstance | null = null;
-
-    try {
-      db = new Database(OPENCODE_DB_PATH, { readonly: true, fileMustExist: true });
-      db.pragma('query_only = ON');
-      db.prepare('SELECT 1').get();
-      return true;
-    } catch {
-      return false;
-    } finally {
-      db?.close();
-    }
-  }
-
-  async collect(query: CliSessionQuery): Promise<CliSessionReport | null> {
-    const Database = loadDatabaseConstructor();
-    if (!Database) {
-      return null;
-    }
-
-    let db: DatabaseInstance | null = null;
-
-    try {
-      db = new Database(OPENCODE_DB_PATH, { readonly: true, fileMustExist: true });
-      db.pragma('query_only = ON');
-
-      const session = db
-        .prepare(
-          `
-          SELECT id, directory, time_created
-          FROM session
-          WHERE directory = @cwd
-            AND time_created BETWEEN @startedAt AND @completedAt
-          ORDER BY time_created DESC
-          LIMIT 1
-        `
-        )
-        .get<SessionRow>({
-          cwd: query.cwd,
-          startedAt: query.startedAt - MATCH_WINDOW_GRACE_MS,
-          completedAt: query.completedAt,
-        });
-
-      if (!session) {
-        return null;
-      }
-
-      const messages = db
-        .prepare(
-          `
-          SELECT id, session_id, time_created, data
-          FROM message
-          WHERE session_id = ?
-          ORDER BY time_created ASC
-        `
-        )
-        .all<MessageRow>(session.id);
-
-      const parts = db
-        .prepare(
-          `
-          SELECT id, message_id, session_id, time_created, data
-          FROM part
-          WHERE session_id = ?
-          ORDER BY time_created ASC
-        `
-        )
-        .all<PartRow>(session.id);
-
-      const parsedMessages = messages.map((message) => ({
-        ...message,
-        parsed: parseJson<OpenCodeMessageData>(message.data),
-      }));
-      const parsedParts = parts.map((part) => ({
-        ...part,
-        parsed: parseJson<OpenCodePartData>(part.data),
-      }));
-
-      const lastMessageWithMetadata = [...parsedMessages]
-        .reverse()
-        .find((message) => message.parsed?.modelID || message.parsed?.providerID || message.parsed?.finish);
-
-      const tokenTotals = parsedMessages.reduce(
-        (totals, message) => {
-          const tokens = message.parsed?.tokens;
-          totals.input += toNumber(tokens?.input);
-          totals.output += toNumber(tokens?.output);
-          totals.cacheRead += toNumber(tokens?.cache?.read);
-          return totals;
-        },
-        { input: 0, output: 0, cacheRead: 0 }
-      );
-
-      const hasCostData = parsedMessages.some(
-        (message) => typeof message.parsed?.cost === 'number' && Number.isFinite(message.parsed.cost)
-      );
-      const totalCost = parsedMessages.reduce((sum, message) => sum + toNumber(message.parsed?.cost), 0);
-
-      const toolCallCounts = new Map<string, number>();
-      for (const part of parsedParts) {
-        if (!isToolPart(part.parsed)) {
-          continue;
-        }
-
-        const name = part.parsed.name?.trim();
-        if (!name) {
-          continue;
-        }
-
-        toolCallCounts.set(name, (toolCallCounts.get(name) ?? 0) + 1);
-      }
-
-      const errors: CliSessionReport['errors'] = [];
-      for (const [index, part] of parsedParts.entries()) {
-        const text = part.parsed?.type === 'text' ? part.parsed.text : undefined;
-        if (!text) {
-          continue;
-        }
-
-        for (const line of text.split(/\r?\n/)) {
-          const trimmed = line.trim();
-          if (!trimmed || !ERROR_LINE_PATTERN.test(trimmed)) {
-            continue;
-          }
-
-          errors.push({ turn: index + 1, text: trimmed });
-        }
-      }
-
-      const summary =
-        [...parsedParts]
-          .reverse()
-          .find((part) => part.parsed?.type === 'text' && part.parsed.text?.trim())
-          ?.parsed?.text?.trim() ?? null;
-
-      const turns =
-        parsedMessages.filter(
-          (message) => message.parsed?.role === 'assistant' || message.parsed?.role === 'user'
-        ).length || parsedMessages.length;
-
-      return {
-        cli: 'opencode',
-        sessionId: session.id,
-        model: lastMessageWithMetadata?.parsed?.modelID ?? null,
-        provider: lastMessageWithMetadata?.parsed?.providerID ?? null,
-        durationMs:
-          parsedMessages.length > 0
-            ? Math.max(0, parsedMessages[parsedMessages.length - 1].time_created - session.time_created)
-            : null,
-        cost: hasCostData ? totalCost : null,
-        tokens: tokenTotals,
-        turns,
-        toolCalls: [...toolCallCounts.entries()].map(([name, count]) => ({ name, count })),
-        errors,
-        finalStatus: normalizeStatus(lastMessageWithMetadata?.parsed?.finish, errors.length > 0),
-        summary,
-        raw: {
-          session,
-          messages: parsedMessages.map(({ parsed, ...message }) => ({
-            ...message,
-            data: parsed ?? message.data,
-          })),
-          parts: parsedParts.map(({ parsed, ...part }) => ({ ...part, data: parsed ?? part.data })),
-        },
-      };
-    } catch {
-      return null;
-    } finally {
-      db?.close();
-    }
-  }
-}
diff --git a/packages/sdk/src/workflows/coordinator.ts b/packages/sdk/src/workflows/coordinator.ts
deleted file mode 100644
index b04e880dc..000000000
--- a/packages/sdk/src/workflows/coordinator.ts
+++ /dev/null
@@ -1,834 +0,0 @@
-/**
- * Swarm Coordinator — pattern selection, agent topology, and workflow lifecycle.
- *
- * Orchestrates workflow runs: picks the right swarm pattern (or auto-selects),
- * resolves agent topology from the config, and drives the run through its
- * lifecycle states (pending → running → completed / failed / cancelled).
- */
-
-import { randomBytes } from 'node:crypto';
-import { EventEmitter } from 'node:events';
-import type {
-  AgentDefinition,
-  RelayYamlConfig,
-  SwarmPattern,
-  WorkflowRunRow,
-  WorkflowRunStatus,
-  WorkflowStepRow,
-  WorkflowStepStatus,
-} from './types.js';
-
-// ── Database interface ──────────────────────────────────────────────────────
-
-/** Minimal database client contract accepted by all services. */
-export interface DbClient {
-  query<T = Record<string, unknown>>(sql: string, params?: unknown[]): Promise<{ rows: T[] }>;
-}
-
-// ── Topology types ──────────────────────────────────────────────────────────
-
-/** Describes the communication graph for a set of agents. */
-export interface AgentTopology {
-  pattern: SwarmPattern;
-  agents: AgentDefinition[];
-  /** Agent name → names it can send messages to. */
-  edges: Map<string, string[]>;
-  /** Optional hub agent for hub-spoke / hierarchical. */
-  hub?: string;
-  /** Ordered pipeline stages (pipeline pattern only). */
-  pipelineOrder?: string[];
-}
-
-// ── Pattern auto-selection ──────────────────────────────────────────────────
-
-/**
- * Mapping used when auto-selecting a pattern from config heuristics.
- * The coordinator checks the config shape and picks the best match.
- */
-const PATTERN_HEURISTICS: Array<{
-  test: (config: RelayYamlConfig) => boolean;
-  pattern: SwarmPattern;
-}> = [
-  // ── Dependency-based patterns (highest priority) ──────────────────────
-  {
-    test: (c) =>
-      Array.isArray(c.workflows) && c.workflows.some((w) => w.steps.some((s) => s.dependsOn?.length)),
-    pattern: 'dag',
-  },
-  {
-    test: (c) => c.coordination?.consensusStrategy !== undefined,
-    pattern: 'consensus',
-  },
-
-  // ── Specific role-based patterns (check before generic hub patterns) ──
-  {
-    // Map-reduce: requires BOTH mapper AND reducer roles
-    test: (c) => c.agents.some((a) => a.role === 'mapper') && c.agents.some((a) => a.role === 'reducer'),
-    pattern: 'map-reduce',
-  },
-  {
-    // Red-team: requires BOTH attacker/red-team AND defender/blue-team
-    test: (c) =>
-      c.agents.some((a) => a.role === 'attacker' || a.role === 'red-team') &&
-      c.agents.some((a) => a.role === 'defender' || a.role === 'blue-team'),
-    pattern: 'red-team',
-  },
-  {
-    // Reflection: requires critic role (not just reviewer, which is too common)
-    test: (c) => c.agents.some((a) => a.role === 'critic'),
-    pattern: 'reflection',
-  },
-  {
-    // Escalation: has tier-N roles
-    test: (c) => c.agents.some((a) => a.role?.startsWith('tier-')),
-    pattern: 'escalation',
-  },
-  {
-    // Auction: has auctioneer role
-    test: (c) => c.agents.some((a) => a.role === 'auctioneer'),
-    pattern: 'auction',
-  },
-  {
-    // Saga: has saga-orchestrator or compensate-handler roles
-    test: (c) => c.agents.some((a) => a.role === 'saga-orchestrator' || a.role === 'compensate-handler'),
-    pattern: 'saga',
-  },
-  {
-    // Circuit-breaker: has fallback or backup roles
-    test: (c) => c.agents.some((a) => a.role === 'fallback' || a.role === 'backup' || a.role === 'primary'),
-    pattern: 'circuit-breaker',
-  },
-  {
-    // Blackboard: has blackboard or shared-workspace role
-    test: (c) => c.agents.some((a) => a.role === 'blackboard' || a.role === 'shared-workspace'),
-    pattern: 'blackboard',
-  },
-  {
-    // Swarm: has hive-mind or swarm-agent roles
-    test: (c) => c.agents.some((a) => a.role === 'hive-mind' || a.role === 'swarm-agent'),
-    pattern: 'swarm',
-  },
-  {
-    // Verifier: has verifier role
-    test: (c) => c.agents.some((a) => a.role === 'verifier'),
-    pattern: 'verifier',
-  },
-  {
-    // Supervisor: has supervisor role
-    test: (c) => c.agents.some((a) => a.role === 'supervisor'),
-    pattern: 'supervisor',
-  },
-  {
-    // Review-loop: implementer + multiple reviewers (code review with feedback loop)
-    test: (c) => {
-      const hasImplementer = c.agents.some(
-        (a) => a.role?.toLowerCase().includes('implement') || a.name.toLowerCase().includes('implement')
-      );
-      const reviewerCount = c.agents.filter(
-        (a) => a.role?.toLowerCase().includes('reviewer') || a.name.toLowerCase().includes('reviewer')
-      ).length;
-      return hasImplementer && reviewerCount >= 2;
-    },
-    pattern: 'review-loop',
-  },
-
-  // ── Generic hub-based patterns ────────────────────────────────────────
-  {
-    test: (c) => c.agents.length > 3 && c.agents.some((a) => a.role === 'lead'),
-    pattern: 'hierarchical',
-  },
-  {
-    test: (c) => c.agents.some((a) => a.role === 'hub' || a.role === 'coordinator'),
-    pattern: 'hub-spoke',
-  },
-
-  // ── Structural patterns ───────────────────────────────────────────────
-  {
-    test: (c) =>
-      Array.isArray(c.workflows) &&
-      c.workflows.some((w) => {
-        // Filter to only agent steps
-        const names = w.steps.filter((s) => s.agent).map((s) => s.agent!);
-        return new Set(names).size === names.length && names.length > 2;
-      }),
-    pattern: 'pipeline',
-  },
-
-  // ── Default fallback ──────────────────────────────────────────────────
-  {
-    test: () => true,
-    pattern: 'fan-out',
-  },
-];
-
-// ── Coordinator events ──────────────────────────────────────────────────────
-
-export interface SwarmCoordinatorEvents {
-  'run:created': (run: WorkflowRunRow) => void;
-  'run:started': (run: WorkflowRunRow) => void;
-  'run:completed': (run: WorkflowRunRow) => void;
-  'run:failed': (run: WorkflowRunRow) => void;
-  'run:cancelled': (run: WorkflowRunRow) => void;
-  'step:started': (step: WorkflowStepRow) => void;
-  'step:completed': (step: WorkflowStepRow) => void;
-  'step:failed': (step: WorkflowStepRow) => void;
-}
-
-// ── Coordinator ─────────────────────────────────────────────────────────────
-
-export class SwarmCoordinator extends EventEmitter {
-  private db: DbClient;
-
-  constructor(db: DbClient) {
-    super();
-    this.db = db;
-  }
-
-  // ── Pattern selection ───────────────────────────────────────────────────
-
-  /**
-   * Select the swarm pattern to use for a config. If the config already
-   * specifies a pattern, it is returned as-is. Otherwise heuristics apply.
-   */
-  selectPattern(config: RelayYamlConfig): SwarmPattern {
-    if (config.swarm.pattern) {
-      return config.swarm.pattern;
-    }
-    for (const h of PATTERN_HEURISTICS) {
-      if (h.test(config)) return h.pattern;
-    }
-    return 'fan-out';
-  }
-
-  // ── Topology resolution ─────────────────────────────────────────────────
-
-  /**
-   * Build the agent communication topology for a given config and pattern.
-   * Non-interactive agents are excluded from message edges — they only communicate
-   * through step output chaining ({{steps.X.output}}).
-   */
-  resolveTopology(config: RelayYamlConfig, pattern?: SwarmPattern): AgentTopology {
-    const p = pattern ?? this.selectPattern(config);
-    const agents = config.agents;
-    const edges = new Map<string, string[]>();
-
-    // Non-interactive agents have no inbound or outbound message edges
-    const nonInteractiveNames = new Set(agents.filter((a) => a.interactive === false).map((a) => a.name));
-    const names = agents.map((a) => a.name).filter((n) => !nonInteractiveNames.has(n));
-
-    const topology = this.resolveInteractiveTopology(p, config, agents, edges, names);
-
-    // Apply non-interactive filtering to the actual topology edges (not the local
-    // `edges` variable, which may not be the same map — e.g., DAG creates its own).
-    const topologyEdges = topology.edges;
-
-    // Ensure non-interactive agents have empty edge entries (no messaging)
-    for (const name of nonInteractiveNames) {
-      topologyEdges.set(name, []);
-    }
-    // Also filter out non-interactive agents from any edge targets
-    for (const [agent, targets] of topologyEdges) {
-      topologyEdges.set(
-        agent,
-        targets.filter((t) => !nonInteractiveNames.has(t))
-      );
-    }
-
-    return topology;
-  }
-
-  /** Internal: resolve topology edges for interactive agents only. */
-  private resolveInteractiveTopology(
-    p: SwarmPattern,
-    config: RelayYamlConfig,
-    agents: AgentDefinition[],
-    edges: Map<string, string[]>,
-    names: string[]
-  ): AgentTopology {
-    switch (p) {
-      case 'fan-out': {
-        // Hub (first agent or role=lead) fans out to all others; no inter-worker edges.
-        const hub = this.pickHub(agents);
-        const others = names.filter((n) => n !== hub);
-        edges.set(hub, others);
-        for (const o of others) edges.set(o, [hub]);
-        return { pattern: p, agents, edges, hub };
-      }
-
-      case 'pipeline': {
-        // Linear chain following workflow step order or agent list order.
-        const order = this.resolvePipelineOrder(config, names);
-        for (let i = 0; i < order.length; i++) {
-          edges.set(order[i], i < order.length - 1 ? [order[i + 1]] : []);
-        }
-        return { pattern: p, agents, edges, pipelineOrder: order };
-      }
-
-      case 'hub-spoke': {
-        const hub = this.pickHub(agents);
-        const spokes = names.filter((n) => n !== hub);
-        edges.set(hub, spokes);
-        for (const s of spokes) edges.set(s, [hub]);
-        return { pattern: p, agents, edges, hub };
-      }
-
-      case 'consensus':
-      case 'debate':
-      case 'mesh': {
-        // Full mesh — every agent can talk to every other.
-        for (const n of names) {
-          edges.set(
-            n,
-            names.filter((o) => o !== n)
-          );
-        }
-        return { pattern: p, agents, edges };
-      }
-
-      case 'handoff': {
-        // Chain with explicit handoff: each agent passes to the next.
-        const order = this.resolvePipelineOrder(config, names);
-        for (let i = 0; i < order.length; i++) {
-          edges.set(order[i], i < order.length - 1 ? [order[i + 1]] : []);
-        }
-        return { pattern: p, agents, edges, pipelineOrder: order };
-      }
-
-      case 'cascade': {
-        // Primary tries first; on failure, falls through to next.
-        for (let i = 0; i < names.length; i++) {
-          edges.set(names[i], i < names.length - 1 ? [names[i + 1]] : []);
-        }
-        return { pattern: p, agents, edges, pipelineOrder: names };
-      }
-
-      case 'dag': {
-        // Edges derived from workflow step dependencies.
-        const stepEdges = this.resolveDAGEdges(config);
-        for (const n of names) {
-          if (!stepEdges.has(n)) stepEdges.set(n, []);
-        }
-        return { pattern: p, agents, edges: stepEdges };
-      }
-
-      case 'hierarchical': {
-        const hub = this.pickHub(agents);
-        const subordinates = names.filter((n) => n !== hub);
-        edges.set(hub, subordinates);
-        for (const s of subordinates) edges.set(s, [hub]);
-        return { pattern: p, agents, edges, hub };
-      }
-
-      // ── Additional patterns ────────────────────────────────────────────
-
-      case 'map-reduce': {
-        // Mappers fan out from coordinator, all feed into reducer(s)
-        const coordinator = this.pickHub(agents);
-        const mappers = agents.filter((a) => a.role === 'mapper').map((a) => a.name);
-        const reducers = agents.filter((a) => a.role === 'reducer').map((a) => a.name);
-        const others = names.filter(
-          (n) => n !== coordinator && !mappers.includes(n) && !reducers.includes(n)
-        );
-
-        // Coordinator → mappers (excluding self if coordinator is also a mapper)
-        edges.set(coordinator, [...mappers.filter((m) => m !== coordinator), ...others]);
-        // Mappers → reducers (skip coordinator to avoid overwriting its edges)
-        for (const m of mappers) {
-          if (m === coordinator) continue;
-          edges.set(m, reducers.length > 0 ? reducers : [coordinator]);
-        }
-        // Reducers → coordinator
-        for (const r of reducers) edges.set(r, [coordinator]);
-        // Others → coordinator
-        for (const o of others) edges.set(o, [coordinator]);
-
-        return { pattern: p, agents, edges, hub: coordinator };
-      }
-
-      case 'scatter-gather': {
-        // Hub scatters to all workers, gathers responses back
-        const hub = this.pickHub(agents);
-        const workers = names.filter((n) => n !== hub);
-        edges.set(hub, workers);
-        for (const w of workers) edges.set(w, [hub]);
-        return { pattern: p, agents, edges, hub };
-      }
-
-      case 'supervisor': {
-        // Supervisor monitors all workers; workers report to supervisor
-        const supervisor = agents.find((a) => a.role === 'supervisor')?.name ?? this.pickHub(agents);
-        const workers = names.filter((n) => n !== supervisor);
-        edges.set(supervisor, workers);
-        for (const w of workers) edges.set(w, [supervisor]);
-        return { pattern: p, agents, edges, hub: supervisor };
-      }
-
-      case 'reflection': {
-        // Agent produces output, critic reviews and sends feedback
-        // Linear: producer → critic → producer (loop-capable)
-        const critic = agents.find((a) => a.role === 'critic' || a.role === 'reviewer')?.name;
-        const producers = names.filter((n) => n !== critic);
-        if (critic) {
-          for (const prod of producers) {
-            edges.set(prod, [critic]);
-          }
-          edges.set(critic, producers);
-        } else {
-          // Fallback: self-reflection via mesh
-          for (const n of names)
-            edges.set(
-              n,
-              names.filter((o) => o !== n)
-            );
-        }
-        return { pattern: p, agents, edges };
-      }
-
-      case 'red-team': {
-        // Attacker ↔ Defender adversarial communication
-        const attackers = agents
-          .filter((a) => a.role === 'attacker' || a.role === 'red-team')
-          .map((a) => a.name);
-        const defenders = agents
-          .filter((a) => a.role === 'defender' || a.role === 'blue-team')
-          .map((a) => a.name);
-        const judges = names.filter((n) => !attackers.includes(n) && !defenders.includes(n));
-
-        // Attackers → defenders and judges
-        for (const a of attackers) edges.set(a, [...defenders, ...judges]);
-        // Defenders → attackers and judges
-        for (const d of defenders) edges.set(d, [...attackers, ...judges]);
-        // Judges receive from both, can communicate with all
-        for (const j of judges) edges.set(j, [...attackers, ...defenders]);
-
-        return { pattern: p, agents, edges };
-      }
-
-      case 'verifier': {
-        // Producer → Verifier chain; verifier can reject back to producer
-        const verifiers = agents.filter((a) => a.role === 'verifier').map((a) => a.name);
-        const producers = names.filter((n) => !verifiers.includes(n));
-
-        for (const prod of producers) edges.set(prod, verifiers.length > 0 ? verifiers : []);
-        for (const v of verifiers) edges.set(v, producers); // Can send rejections back
-
-        return { pattern: p, agents, edges };
-      }
-
-      case 'auction': {
-        // Auctioneer broadcasts tasks; bidders respond to auctioneer only
-        const auctioneer = agents.find((a) => a.role === 'auctioneer')?.name ?? this.pickHub(agents);
-        const bidders = names.filter((n) => n !== auctioneer);
-        edges.set(auctioneer, bidders);
-        for (const b of bidders) edges.set(b, [auctioneer]);
-        return { pattern: p, agents, edges, hub: auctioneer };
-      }
-
-      case 'escalation': {
-        // Tiered chain: each level can escalate to the next
-        // Uses agent order or tier role numbers
-        const order = this.resolveEscalationOrder(agents);
-        for (let i = 0; i < order.length; i++) {
-          // Each tier can escalate up and report down
-          const canEscalateTo = i < order.length - 1 ? [order[i + 1]] : [];
-          const canReportTo = i > 0 ? [order[i - 1]] : [];
-          edges.set(order[i], [...canEscalateTo, ...canReportTo]);
-        }
-        // Ensure non-tiered agents still have edge entries (prevents undefined)
-        for (const n of names) {
-          if (!edges.has(n)) edges.set(n, []);
-        }
-        return { pattern: p, agents, edges, pipelineOrder: order };
-      }
-
-      case 'saga': {
-        // Orchestrator coordinates saga steps; each step can trigger compensate
-        const orchestrator = agents.find((a) => a.role === 'saga-orchestrator')?.name ?? this.pickHub(agents);
-        const participants = names.filter((n) => n !== orchestrator);
-        // Orchestrator → all participants (for commands)
-        edges.set(orchestrator, participants);
-        // Participants → orchestrator (for completion/failure signals)
-        for (const part of participants) edges.set(part, [orchestrator]);
-        return { pattern: p, agents, edges, hub: orchestrator };
-      }
-
-      case 'circuit-breaker': {
-        // Primary agent with fallback chain
-        const order = names; // First agent is primary, rest are fallbacks
-        for (let i = 0; i < order.length; i++) {
-          // Each can trigger next fallback
-          edges.set(order[i], i < order.length - 1 ? [order[i + 1]] : []);
-        }
-        return { pattern: p, agents, edges, pipelineOrder: order };
-      }
-
-      case 'blackboard': {
-        // All agents can read/write to shared blackboard (full mesh)
-        // Plus optional moderator
-        const moderator = agents.find((a) => a.role === 'moderator')?.name;
-        for (const n of names) {
-          edges.set(
-            n,
-            names.filter((o) => o !== n)
-          );
-        }
-        return { pattern: p, agents, edges, hub: moderator };
-      }
-
-      case 'swarm': {
-        // Emergent swarm: agents communicate with nearest neighbors
-        // For simplicity, partial mesh based on agent index proximity
-        const hiveMind = agents.find((a) => a.role === 'hive-mind')?.name;
-        for (let i = 0; i < names.length; i++) {
-          const neighbors: string[] = [];
-          if (i > 0) neighbors.push(names[i - 1]);
-          if (i < names.length - 1) neighbors.push(names[i + 1]);
-          // Also connect to hive mind if present (avoid duplicates if already adjacent)
-          if (hiveMind && hiveMind !== names[i] && !neighbors.includes(hiveMind)) neighbors.push(hiveMind);
-          edges.set(names[i], neighbors);
-        }
-        return { pattern: p, agents, edges, hub: hiveMind };
-      }
-
-      case 'review-loop': {
-        // Implementer is hub; reviewers can communicate with implementer AND each other
-        // This enables collaborative review where reviewers can discuss findings
-        const implementer =
-          agents.find(
-            (a) => a.role?.toLowerCase().includes('implement') || a.name.toLowerCase().includes('implement')
-          )?.name ?? this.pickHub(agents);
-        const reviewers = agents
-          .filter(
-            (a) =>
-              a.name !== implementer &&
-              (a.role?.toLowerCase().includes('reviewer') || a.name.toLowerCase().includes('reviewer'))
-          )
-          .map((a) => a.name);
-        const others = names.filter((n) => n !== implementer && !reviewers.includes(n));
-
-        // Implementer → all reviewers and others
-        edges.set(implementer, [...reviewers, ...others]);
-        // Reviewers → implementer + other reviewers (collaborative review)
-        for (const r of reviewers) {
-          const otherReviewers = reviewers.filter((or) => or !== r);
-          edges.set(r, [implementer, ...otherReviewers]);
-        }
-        // Others → implementer
-        for (const o of others) edges.set(o, [implementer]);
-
-        return { pattern: p, agents, edges, hub: implementer };
-      }
-
-      default: {
-        // Fallback: full mesh.
-        for (const n of names) {
-          edges.set(
-            n,
-            names.filter((o) => o !== n)
-          );
-        }
-        return { pattern: p, agents, edges };
-      }
-    }
-  }
-
-  // ── Lifecycle: create run ───────────────────────────────────────────────
-
-  async createRun(workspaceId: string, config: RelayYamlConfig): Promise<WorkflowRunRow> {
-    const id = `run_${Date.now()}_${randomBytes(4).toString('hex')}`;
-    const pattern = this.selectPattern(config);
-    const now = new Date().toISOString();
-
-    const { rows } = await this.db.query<WorkflowRunRow>(
-      `INSERT INTO workflow_runs (id, workspace_id, workflow_name, pattern, status, config, started_at, created_at, updated_at)
-       VALUES ($1, $2, $3, $4, 'pending', $5, $6, $6, $6)
-       RETURNING *`,
-      [id, workspaceId, config.name, pattern, JSON.stringify(config), now]
-    );
-
-    const run = rows[0];
-    this.emit('run:created', run);
-    return run;
-  }
-
-  // ── Lifecycle: start run ────────────────────────────────────────────────
-
-  async startRun(runId: string): Promise<WorkflowRunRow> {
-    const now = new Date().toISOString();
-    const { rows } = await this.db.query<WorkflowRunRow>(
-      `UPDATE workflow_runs SET status = 'running', started_at = $2, updated_at = $2
-       WHERE id = $1 AND status = 'pending'
-       RETURNING *`,
-      [runId, now]
-    );
-
-    if (rows.length === 0) {
-      throw new Error(`Run ${runId} not found or not in pending state`);
-    }
-
-    const run = rows[0];
-    this.emit('run:started', run);
-    return run;
-  }
-
-  // ── Lifecycle: complete / fail / cancel ─────────────────────────────────
-
-  async completeRun(runId: string, stateSnapshot?: Record<string, unknown>): Promise<WorkflowRunRow> {
-    return this.transitionRun(runId, 'completed', undefined, stateSnapshot);
-  }
-
-  async failRun(runId: string, error: string): Promise<WorkflowRunRow> {
-    return this.transitionRun(runId, 'failed', error);
-  }
-
-  async cancelRun(runId: string): Promise<WorkflowRunRow> {
-    return this.transitionRun(runId, 'cancelled');
-  }
-
-  // ── Step management ─────────────────────────────────────────────────────
-
-  async createSteps(runId: string, config: RelayYamlConfig): Promise<WorkflowStepRow[]> {
-    const workflows = config.workflows ?? [];
-    const created: WorkflowStepRow[] = [];
-
-    for (const wf of workflows) {
-      for (const step of wf.steps) {
-        const id = `step_${Date.now()}_${randomBytes(4).toString('hex')}`;
-        const now = new Date().toISOString();
-
-        const { rows } = await this.db.query<WorkflowStepRow>(
-          `INSERT INTO workflow_steps (id, run_id, step_name, agent_name, status, task, depends_on, created_at, updated_at)
-           VALUES ($1, $2, $3, $4, 'pending', $5, $6, $7, $7)
-           RETURNING *`,
-          [
-            id,
-            runId,
-            step.name,
-            step.agent ?? null,
-            step.task ?? step.command ?? '',
-            JSON.stringify(step.dependsOn ?? []),
-            now,
-          ]
-        );
-
-        created.push(rows[0]);
-      }
-    }
-
-    return created;
-  }
-
-  async startStep(stepId: string): Promise<WorkflowStepRow> {
-    const now = new Date().toISOString();
-    const { rows } = await this.db.query<WorkflowStepRow>(
-      `UPDATE workflow_steps SET status = 'running', started_at = $2, updated_at = $2
-       WHERE id = $1 AND status = 'pending'
-       RETURNING *`,
-      [stepId, now]
-    );
-
-    if (rows.length === 0) {
-      throw new Error(`Step ${stepId} not found or not in pending state`);
-    }
-
-    const step = rows[0];
-    this.emit('step:started', step);
-    return step;
-  }
-
-  async completeStep(stepId: string, output?: string): Promise<WorkflowStepRow> {
-    const now = new Date().toISOString();
-    const { rows } = await this.db.query<WorkflowStepRow>(
-      `UPDATE workflow_steps SET status = 'completed', output = $2, completed_at = $3, updated_at = $3
-       WHERE id = $1 AND status = 'running'
-       RETURNING *`,
-      [stepId, output ?? null, now]
-    );
-
-    if (rows.length === 0) {
-      throw new Error(`Step ${stepId} not found or not in running state`);
-    }
-
-    const step = rows[0];
-    this.emit('step:completed', step);
-    return step;
-  }
-
-  async failStep(stepId: string, error: string): Promise<WorkflowStepRow> {
-    const now = new Date().toISOString();
-    const { rows } = await this.db.query<WorkflowStepRow>(
-      `UPDATE workflow_steps SET status = 'failed', error = $2, completed_at = $3, updated_at = $3
-       WHERE id = $1 AND status = 'running'
-       RETURNING *`,
-      [stepId, error, now]
-    );
-
-    if (rows.length === 0) {
-      throw new Error(`Step ${stepId} not found or not in running state`);
-    }
-
-    const step = rows[0];
-    this.emit('step:failed', step);
-    return step;
-  }
-
-  async skipStep(stepId: string): Promise<WorkflowStepRow> {
-    const now = new Date().toISOString();
-    const { rows } = await this.db.query<WorkflowStepRow>(
-      `UPDATE workflow_steps SET status = 'skipped', completed_at = $2, updated_at = $2
-       WHERE id = $1
-       RETURNING *`,
-      [stepId, now]
-    );
-
-    if (rows.length === 0) {
-      throw new Error(`Step ${stepId} not found`);
-    }
-
-    return rows[0];
-  }
-
-  // ── Queries ─────────────────────────────────────────────────────────────
-
-  async getRun(runId: string): Promise<WorkflowRunRow | null> {
-    const { rows } = await this.db.query<WorkflowRunRow>(`SELECT * FROM workflow_runs WHERE id = $1`, [
-      runId,
-    ]);
-    return rows[0] ?? null;
-  }
-
-  async getSteps(runId: string): Promise<WorkflowStepRow[]> {
-    const { rows } = await this.db.query<WorkflowStepRow>(
-      `SELECT * FROM workflow_steps WHERE run_id = $1 ORDER BY created_at ASC`,
-      [runId]
-    );
-    return rows;
-  }
-
-  async getReadySteps(runId: string): Promise<WorkflowStepRow[]> {
-    const steps = await this.getSteps(runId);
-    const completedNames = new Set(steps.filter((s) => s.status === 'completed').map((s) => s.stepName));
-
-    return steps.filter((s) => {
-      if (s.status !== 'pending') return false;
-      const deps: string[] = Array.isArray(s.dependsOn) ? s.dependsOn : [];
-      return deps.every((d) => completedNames.has(d));
-    });
-  }
-
-  async getRunsByWorkspace(workspaceId: string, status?: WorkflowRunStatus): Promise<WorkflowRunRow[]> {
-    if (status) {
-      const { rows } = await this.db.query<WorkflowRunRow>(
-        `SELECT * FROM workflow_runs WHERE workspace_id = $1 AND status = $2 ORDER BY created_at DESC`,
-        [workspaceId, status]
-      );
-      return rows;
-    }
-    const { rows } = await this.db.query<WorkflowRunRow>(
-      `SELECT * FROM workflow_runs WHERE workspace_id = $1 ORDER BY created_at DESC`,
-      [workspaceId]
-    );
-    return rows;
-  }
-
-  // ── Private helpers ─────────────────────────────────────────────────────
-
-  private async transitionRun(
-    runId: string,
-    status: WorkflowRunStatus,
-    error?: string,
-    stateSnapshot?: Record<string, unknown>
-  ): Promise<WorkflowRunRow> {
-    const now = new Date().toISOString();
-    const { rows } = await this.db.query<WorkflowRunRow>(
-      `UPDATE workflow_runs
-       SET status = $2, completed_at = $3, error = $4, state_snapshot = $5, updated_at = $3
-       WHERE id = $1
-       RETURNING *`,
-      [runId, status, now, error ?? null, stateSnapshot ? JSON.stringify(stateSnapshot) : null]
-    );
-
-    if (rows.length === 0) {
-      throw new Error(`Run ${runId} not found`);
-    }
-
-    const run = rows[0];
-    const eventName = `run:${status}` as keyof SwarmCoordinatorEvents;
-    this.emit(eventName, run);
-    return run;
-  }
-
-  private pickHub(agents: AgentDefinition[]): string {
-    // Prefer interactive agents as hub — non-interactive agents cannot receive messages
-    const interactiveAgents = agents.filter((a) => a.interactive !== false);
-    const pool = interactiveAgents.length > 0 ? interactiveAgents : agents;
-    const lead = pool.find((a) => a.role === 'lead' || a.role === 'hub' || a.role === 'coordinator');
-    return lead?.name ?? pool[0].name;
-  }
-
-  private resolvePipelineOrder(config: RelayYamlConfig, fallback: string[]): string[] {
-    const workflow = config.workflows?.[0];
-    if (!workflow) return fallback;
-
-    // Use step order — each step's agent in sequence, deduped.
-    const seen = new Set<string>();
-    const order: string[] = [];
-    for (const step of workflow.steps) {
-      // Skip deterministic steps (no agent)
-      if (!step.agent) continue;
-      if (!seen.has(step.agent)) {
-        seen.add(step.agent);
-        order.push(step.agent);
-      }
-    }
-    return order.length > 0 ? order : fallback;
-  }
-
-  private resolveEscalationOrder(agents: AgentDefinition[]): string[] {
-    // Sort by tier role (e.g., "tier-1", "tier-2") or by agent order
-    const tiered = agents.filter((a) => a.role?.startsWith('tier-'));
-    if (tiered.length > 0) {
-      return tiered
-        .sort((a, b) => {
-          const tierA = parseInt(a.role?.replace('tier-', '') ?? '0', 10);
-          const tierB = parseInt(b.role?.replace('tier-', '') ?? '0', 10);
-          return tierA - tierB;
-        })
-        .map((a) => a.name);
-    }
-    // Fallback: use agent order
-    return agents.map((a) => a.name);
-  }
-
-  private resolveDAGEdges(config: RelayYamlConfig): Map<string, string[]> {
-    const edges = new Map<string, string[]>();
-    const workflows = config.workflows ?? [];
-
-    for (const wf of workflows) {
-      // Build step-name → agent-name mapping (skip deterministic steps)
-      const stepAgent = new Map<string, string>();
-      for (const step of wf.steps) {
-        if (step.agent) {
-          stepAgent.set(step.name, step.agent);
-        }
-      }
-
-      for (const step of wf.steps) {
-        // Skip deterministic steps
-        if (!step.agent) continue;
-        if (!step.dependsOn?.length) continue;
-        for (const dep of step.dependsOn) {
-          const fromAgent = stepAgent.get(dep);
-          if (!fromAgent) continue;
-          const existing = edges.get(fromAgent) ?? [];
-          if (!existing.includes(step.agent)) {
-            existing.push(step.agent);
-          }
-          edges.set(fromAgent, existing);
-        }
-      }
-    }
-
-    return edges;
-  }
-}
diff --git a/packages/sdk/src/workflows/custom-steps.ts b/packages/sdk/src/workflows/custom-steps.ts
deleted file mode 100644
index 5ac686513..000000000
--- a/packages/sdk/src/workflows/custom-steps.ts
+++ /dev/null
@@ -1,442 +0,0 @@
-/**
- * Custom Steps Loader
- *
- * Loads and resolves custom step definitions from .relay/steps.yaml
- */
-
-import { existsSync, readFileSync } from 'node:fs';
-import path from 'node:path';
-import { parse as parseYaml } from 'yaml';
-import type { CustomStepsConfig, CustomStepDefinition, CustomStepParam, WorkflowStep } from './types.js';
-
-/** Default location for custom steps configuration. */
-export const CUSTOM_STEPS_FILE = '.relay/steps.yaml';
-
-/** Result of validating custom steps usage in a workflow. */
-export interface CustomStepsValidationResult {
-  valid: boolean;
-  errors: string[];
-  warnings: string[];
-  /** Custom steps that were referenced but not found. */
-  missingSteps: string[];
-  /** Parameters that were required but not provided. */
-  missingParams: Array<{ step: string; use: string; param: string }>;
-  /** Unreferenced variables in step definitions. */
-  unresolvedVariables: Array<{ step: string; variable: string }>;
-}
-
-/**
- * Load custom step definitions from .relay/steps.yaml.
- * Returns an empty map if the file doesn't exist.
- */
-export function loadCustomSteps(cwd: string): Map<string, CustomStepDefinition> {
-  const stepsPath = path.join(cwd, CUSTOM_STEPS_FILE);
-  const steps = new Map<string, CustomStepDefinition>();
-
-  if (!existsSync(stepsPath)) {
-    return steps;
-  }
-
-  try {
-    const content = readFileSync(stepsPath, 'utf-8');
-
-    // Handle empty file
-    if (!content.trim()) {
-      return steps;
-    }
-
-    const config = parseYaml(content) as CustomStepsConfig;
-
-    if (!config || typeof config !== 'object') {
-      throw new CustomStepsParseError(
-        'Invalid file format',
-        'The file must contain a valid YAML object with a "steps" key',
-        stepsPath
-      );
-    }
-
-    if (!config.steps) {
-      throw new CustomStepsParseError(
-        'Missing "steps" key',
-        'Add a "steps" object containing your custom step definitions:\n\n' +
-          'steps:\n' +
-          '  my-step:\n' +
-          '    command: "echo hello"',
-        stepsPath
-      );
-    }
-
-    if (typeof config.steps !== 'object' || Array.isArray(config.steps)) {
-      throw new CustomStepsParseError(
-        'Invalid "steps" format',
-        'The "steps" key must be an object (not an array) mapping step names to definitions',
-        stepsPath
-      );
-    }
-
-    for (const [name, definition] of Object.entries(config.steps)) {
-      validateCustomStepDefinition(name, definition, stepsPath);
-      steps.set(name, definition);
-    }
-
-    return steps;
-  } catch (err) {
-    if (err instanceof CustomStepsParseError) {
-      throw err;
-    }
-    const message = err instanceof Error ? err.message : String(err);
-    throw new CustomStepsParseError('Failed to parse file', message, stepsPath);
-  }
-}
-
-/**
- * Custom error class for parse errors with helpful context.
- */
-export class CustomStepsParseError extends Error {
-  constructor(
-    public readonly issue: string,
-    public readonly suggestion: string,
-    public readonly filePath: string
-  ) {
-    super(`${filePath}: ${issue}\n\n${suggestion}`);
-    this.name = 'CustomStepsParseError';
-  }
-}
-
-/**
- * Custom error class for step resolution errors.
- */
-export class CustomStepResolutionError extends Error {
-  constructor(
-    public readonly stepName: string,
-    public readonly issue: string,
-    public readonly suggestion: string
-  ) {
-    super(`Step "${stepName}": ${issue}\n\n${suggestion}`);
-    this.name = 'CustomStepResolutionError';
-  }
-}
-
-/**
- * Validate a custom step definition with clear error messages.
- */
-function validateCustomStepDefinition(
-  name: string,
-  def: unknown,
-  filePath: string
-): asserts def is CustomStepDefinition {
-  if (!def || typeof def !== 'object') {
-    throw new CustomStepsParseError(
-      `Invalid step "${name}"`,
-      'Each step must be an object with at least a "command" or "branch" field:\n\n' +
-        `steps:\n` +
-        `  ${name}:\n` +
-        `    command: "your-command-here"`,
-      filePath
-    );
-  }
-
-  const stepDef = def as Record<string, unknown>;
-
-  // Validate type if specified
-  if (stepDef.type !== undefined) {
-    if (stepDef.type !== 'deterministic' && stepDef.type !== 'worktree') {
-      throw new CustomStepsParseError(
-        `Invalid type "${stepDef.type}" for step "${name}"`,
-        'Step type must be either "deterministic" or "worktree"',
-        filePath
-      );
-    }
-  }
-
-  // Determine step type (default to deterministic if command is provided)
-  const hasCommand = typeof stepDef.command === 'string';
-  const hasBranch = typeof stepDef.branch === 'string';
-  const explicitType = stepDef.type as string | undefined;
-  const stepType = explicitType ?? (hasCommand ? 'deterministic' : hasBranch ? 'worktree' : undefined);
-
-  if (!stepType) {
-    throw new CustomStepsParseError(
-      `Step "${name}" is missing required fields`,
-      'Deterministic steps need "command", worktree steps need "branch":\n\n' +
-        '# Deterministic step:\n' +
-        `  ${name}:\n` +
-        '    command: "your-command {{param}}"\n\n' +
-        '# Worktree step:\n' +
-        `  ${name}:\n` +
-        '    type: worktree\n' +
-        '    branch: "{{branch-name}}"',
-      filePath
-    );
-  }
-
-  if (stepType === 'deterministic' && !hasCommand) {
-    throw new CustomStepsParseError(
-      `Deterministic step "${name}" is missing "command"`,
-      'Add a command field:\n\n' + `  ${name}:\n` + '    command: "your-shell-command"',
-      filePath
-    );
-  }
-
-  if (stepType === 'worktree' && !hasBranch) {
-    throw new CustomStepsParseError(
-      `Worktree step "${name}" is missing "branch"`,
-      'Add a branch field:\n\n' +
-        `  ${name}:\n` +
-        '    type: worktree\n' +
-        '    branch: "feature/{{branch-name}}"',
-      filePath
-    );
-  }
-
-  // Validate params if present
-  if (stepDef.params !== undefined) {
-    if (!Array.isArray(stepDef.params)) {
-      throw new CustomStepsParseError(
-        `Invalid params for step "${name}"`,
-        'Params must be an array:\n\n' +
-          `  ${name}:\n` +
-          '    params:\n' +
-          '      - name: myParam\n' +
-          '        required: true\n' +
-          '      - name: optionalParam\n' +
-          '        default: "value"',
-        filePath
-      );
-    }
-
-    for (let i = 0; i < stepDef.params.length; i++) {
-      const param = stepDef.params[i] as Record<string, unknown>;
-      if (!param || typeof param !== 'object') {
-        throw new CustomStepsParseError(
-          `Invalid param at index ${i} for step "${name}"`,
-          'Each param must be an object with at least a "name" field',
-          filePath
-        );
-      }
-      if (!param.name || typeof param.name !== 'string') {
-        throw new CustomStepsParseError(
-          `Param at index ${i} for step "${name}" is missing "name"`,
-          'Add a name to the parameter:\n\n' + '    params:\n' + '      - name: myParam',
-          filePath
-        );
-      }
-      if (param.required !== undefined && typeof param.required !== 'boolean') {
-        throw new CustomStepsParseError(
-          `Invalid "required" value for param "${param.name}" in step "${name}"`,
-          'The "required" field must be true or false',
-          filePath
-        );
-      }
-    }
-  }
-}
-
-/**
- * Extract all variable references ({{varName}}) from a string.
- */
-function extractVariables(text: string): string[] {
-  const matches = text.match(/\{\{(\w+)\}\}/g) ?? [];
-  return matches.map((m) => m.slice(2, -2));
-}
-
-/**
- * Validate custom step usage in workflow steps without resolving.
- * Returns validation errors and warnings for dry-run.
- */
-export function validateCustomStepsUsage(
-  steps: WorkflowStep[],
-  customSteps: Map<string, CustomStepDefinition>
-): CustomStepsValidationResult {
-  const errors: string[] = [];
-  const warnings: string[] = [];
-  const missingSteps: string[] = [];
-  const missingParams: Array<{ step: string; use: string; param: string }> = [];
-  const unresolvedVariables: Array<{ step: string; variable: string }> = [];
-
-  for (const step of steps) {
-    if (!step.use) continue;
-
-    const customDef = customSteps.get(step.use);
-    if (!customDef) {
-      missingSteps.push(step.use);
-      errors.push(
-        `Step "${step.name}" uses undefined custom step "${step.use}". ` +
-          `Add it to .relay/steps.yaml or check for typos.`
-      );
-      continue;
-    }
-
-    // Check required parameters
-    const stepAny = step as unknown as Record<string, unknown>;
-    const providedParams = new Set<string>();
-
-    if (customDef.params) {
-      for (const param of customDef.params) {
-        const providedValue = stepAny[param.name];
-        if (providedValue !== undefined) {
-          providedParams.add(param.name);
-        } else if (param.default !== undefined) {
-          providedParams.add(param.name);
-        } else if (param.required) {
-          missingParams.push({ step: step.name, use: step.use, param: param.name });
-          errors.push(
-            `Step "${step.name}" is missing required parameter "${param.name}" for custom step "${step.use}".`
-          );
-        }
-      }
-    }
-
-    // Check for unresolved variables in the resolved command/branch
-    const textToCheck = customDef.command ?? customDef.branch ?? '';
-    const variables = extractVariables(textToCheck);
-    for (const variable of variables) {
-      if (!providedParams.has(variable)) {
-        // Check if it's a known param with a default
-        const paramDef = customDef.params?.find((p) => p.name === variable);
-        if (!paramDef) {
-          unresolvedVariables.push({ step: step.name, variable });
-          warnings.push(
-            `Step "${step.name}": Variable "{{${variable}}}" in custom step "${step.use}" ` +
-              `is not defined as a parameter. It will not be interpolated.`
-          );
-        }
-      }
-    }
-
-    // Check for extra parameters that aren't defined
-    const definedParams = new Set((customDef.params ?? []).map((p) => p.name));
-    const stepKeys = Object.keys(stepAny).filter(
-      (k) => !['name', 'use', 'dependsOn', 'timeoutMs'].includes(k)
-    );
-    for (const key of stepKeys) {
-      if (!definedParams.has(key)) {
-        warnings.push(
-          `Step "${step.name}": Parameter "${key}" is not defined in custom step "${step.use}" and will be ignored.`
-        );
-      }
-    }
-  }
-
-  return {
-    valid: errors.length === 0,
-    errors,
-    warnings,
-    missingSteps,
-    missingParams,
-    unresolvedVariables,
-  };
-}
-
-/**
- * Resolve a workflow step that uses a custom step definition.
- * Returns a new step with the custom definition merged in.
- */
-export function resolveCustomStep(
-  step: WorkflowStep,
-  customSteps: Map<string, CustomStepDefinition>
-): WorkflowStep {
-  if (!step.use) {
-    return step;
-  }
-
-  const customDef = customSteps.get(step.use);
-  if (!customDef) {
-    throw new CustomStepResolutionError(
-      step.name,
-      `Custom step "${step.use}" not found`,
-      `Make sure "${step.use}" is defined in .relay/steps.yaml:\n\n` +
-        'steps:\n' +
-        `  ${step.use}:\n` +
-        '    command: "your-command"'
-    );
-  }
-
-  // Build parameter values from step properties and defaults
-  const paramValues: Record<string, string> = {};
-  const missingRequired: string[] = [];
-
-  if (customDef.params) {
-    // Cast step to access arbitrary parameters (custom step params are passed as extra properties)
-    const stepAny = step as unknown as Record<string, unknown>;
-    for (const param of customDef.params) {
-      // Check if value provided in step
-      const providedValue = stepAny[param.name];
-      if (providedValue !== undefined) {
-        paramValues[param.name] = String(providedValue);
-      } else if (param.default !== undefined) {
-        paramValues[param.name] = param.default;
-      } else if (param.required) {
-        missingRequired.push(param.name);
-      }
-    }
-  }
-
-  if (missingRequired.length > 0) {
-    const paramList = missingRequired.map((p) => `  - ${p}`).join('\n');
-    throw new CustomStepResolutionError(
-      step.name,
-      `Missing required parameter(s) for custom step "${step.use}"`,
-      `Add the following to your step:\n\n` +
-        `- name: ${step.name}\n` +
-        `  use: ${step.use}\n` +
-        missingRequired.map((p) => `  ${p}: <value>`).join('\n')
-    );
-  }
-
-  // Determine step type
-  const stepType = customDef.type ?? (customDef.command ? 'deterministic' : 'worktree');
-
-  // Interpolate parameter values into the definition
-  const interpolate = (value: string | undefined): string | undefined => {
-    if (!value) return value;
-    return value.replace(/\{\{(\w+)\}\}/g, (match, paramName) => {
-      return paramValues[paramName] ?? match;
-    });
-  };
-
-  // Build resolved step
-  const resolvedStep: WorkflowStep = {
-    name: step.name,
-    type: stepType as 'deterministic' | 'worktree',
-    dependsOn: step.dependsOn,
-    timeoutMs: step.timeoutMs ?? customDef.timeoutMs,
-  };
-
-  if (stepType === 'deterministic') {
-    resolvedStep.command = interpolate(customDef.command);
-    resolvedStep.failOnError = customDef.failOnError;
-    resolvedStep.captureOutput = customDef.captureOutput;
-  } else if (stepType === 'worktree') {
-    resolvedStep.branch = interpolate(customDef.branch);
-    resolvedStep.baseBranch = interpolate(customDef.baseBranch);
-    resolvedStep.path = interpolate(customDef.path);
-    resolvedStep.createBranch = customDef.createBranch;
-  }
-
-  return resolvedStep;
-}
-
-/**
- * Resolve all custom steps in a workflow's steps array.
- */
-export function resolveAllCustomSteps(
-  steps: WorkflowStep[],
-  customSteps: Map<string, CustomStepDefinition>
-): WorkflowStep[] {
-  return steps.map((step) => resolveCustomStep(step, customSteps));
-}
-
-/**
- * Check if .relay/steps.yaml exists.
- */
-export function customStepsFileExists(cwd: string): boolean {
-  return existsSync(path.join(cwd, CUSTOM_STEPS_FILE));
-}
-
-/**
- * Get the full path to the custom steps file.
- */
-export function getCustomStepsPath(cwd: string): string {
-  return path.join(cwd, CUSTOM_STEPS_FILE);
-}
diff --git a/packages/sdk/src/workflows/default-logger.ts b/packages/sdk/src/workflows/default-logger.ts
deleted file mode 100644
index 11a3a93e2..000000000
--- a/packages/sdk/src/workflows/default-logger.ts
+++ /dev/null
@@ -1,122 +0,0 @@
-import chalk from 'chalk';
-import type { WorkflowEvent, WorkflowEventListener } from './runner.js';
-
-export type LogLevel = 'verbose' | 'normal' | 'quiet' | false;
-
-const noop: WorkflowEventListener = () => {};
-
-/**
- * Create a default event logger that writes workflow progress to the console.
- *
- * @param level - Log verbosity: "verbose" | "normal" (default) | "quiet" | false (no-op)
- */
-export function createDefaultEventLogger(level: LogLevel = 'normal'): WorkflowEventListener {
-  if (level === false) return noop;
-
-  return (event: WorkflowEvent) => {
-    switch (event.type) {
-      // ── Run lifecycle ──
-      case 'run:started':
-        if (level !== 'quiet') {
-          console.log(chalk.cyan(`[workflow] run ${event.runId}`));
-        }
-        break;
-
-      case 'run:completed':
-        console.log(chalk.green(`[workflow] completed`));
-        break;
-
-      case 'run:failed':
-        console.log(chalk.red(`[workflow] FAILED: ${event.error}`));
-        break;
-
-      case 'run:cancelled':
-        if (level !== 'quiet') {
-          console.log(chalk.yellow(`[workflow] cancelled`));
-        }
-        break;
-
-      // ── Step lifecycle ──
-      case 'step:started':
-        if (level !== 'quiet') {
-          console.log(chalk.blue(`  ● ${event.stepName} — started`));
-        }
-        break;
-
-      case 'step:completed':
-        if (level !== 'quiet') {
-          console.log(chalk.green(`  ✓ ${event.stepName} — completed`));
-        }
-        break;
-
-      case 'step:failed':
-        console.log(chalk.red(`  ✗ ${event.stepName} — FAILED: ${event.error}`));
-        break;
-
-      case 'step:skipped':
-        if (level !== 'quiet') {
-          console.log(chalk.gray(`  ○ ${event.stepName} — skipped`));
-        }
-        break;
-
-      case 'step:retrying':
-        if (level !== 'quiet') {
-          console.log(chalk.yellow(`  ↻ ${event.stepName} — retrying (attempt ${event.attempt})`));
-        }
-        break;
-
-      case 'step:nudged':
-        if (level !== 'quiet') {
-          console.log(chalk.yellow(`  ⚡ ${event.stepName} — nudged (${event.nudgeCount})`));
-        }
-        break;
-
-      case 'step:agent-report': {
-        if (level !== 'quiet') {
-          const r = event.report;
-          const parts: string[] = [];
-          if (r.model) parts.push(r.model);
-          if (r.cost != null) parts.push(`$${r.cost.toFixed(2)}`);
-          if (r.tokens) parts.push(`${r.tokens.input}+${r.tokens.output} tokens`);
-          parts.push(`${r.errors.length} errors`);
-          console.log(chalk.dim(`  📊 ${event.stepName} — ${parts.join(' · ')}`));
-        }
-        break;
-      }
-
-      // ── Broker-level events (verbose only) ──
-      case 'broker:event':
-        if (level === 'verbose') {
-          console.log(chalk.dim(`  [broker] ${JSON.stringify(event.event)}`));
-        }
-        break;
-
-      // ── Other events (verbose only) ──
-      case 'step:owner-assigned':
-        if (level === 'verbose') {
-          console.log(
-            chalk.dim(`  ${event.stepName} — owner: ${event.ownerName}, specialist: ${event.specialistName}`)
-          );
-        }
-        break;
-
-      case 'step:review-completed':
-        if (level === 'verbose') {
-          console.log(chalk.dim(`  ${event.stepName} — review: ${event.decision} by ${event.reviewerName}`));
-        }
-        break;
-
-      case 'step:owner-timeout':
-        if (level !== 'quiet') {
-          console.log(chalk.yellow(`  ⏱ ${event.stepName} — owner timeout (${event.ownerName})`));
-        }
-        break;
-
-      case 'step:force-released':
-        if (level === 'verbose') {
-          console.log(chalk.dim(`  ${event.stepName} — force-released`));
-        }
-        break;
-    }
-  };
-}
diff --git a/packages/sdk/src/workflows/dry-run-format.ts b/packages/sdk/src/workflows/dry-run-format.ts
deleted file mode 100644
index aadb97c9b..000000000
--- a/packages/sdk/src/workflows/dry-run-format.ts
+++ /dev/null
@@ -1,88 +0,0 @@
-import type { DryRunReport } from './types.js';
-
-/**
- * Format a DryRunReport as human-readable text for terminal output.
- */
-export function formatDryRunReport(report: DryRunReport): string {
-  const lines: string[] = [];
-
-  // Header
-  lines.push(`Dry Run: ${report.name}`);
-  const meta: string[] = [`Pattern: ${report.pattern}`];
-  if (report.maxConcurrency !== undefined) {
-    meta.push(`Max Concurrency: ${report.maxConcurrency}`);
-  }
-  lines.push(meta.join(' | '));
-  if (report.description) {
-    lines.push(report.description);
-  }
-  lines.push('');
-
-  // Agents
-  if (report.agents.length > 0) {
-    lines.push(`Agents (${report.agents.length}):`);
-    const maxNameLen = Math.max(...report.agents.map((a) => a.name.length));
-    const maxCliLen = Math.max(...report.agents.map((a) => a.cli.length));
-    for (const agent of report.agents) {
-      const stepLabel = agent.stepCount === 1 ? '1 step' : `${agent.stepCount} steps`;
-      const cwdInfo = agent.cwd ? ` [cwd: ${agent.cwd}]` : '';
-      lines.push(
-        `  ${agent.name.padEnd(maxNameLen)}  ${agent.cli.padEnd(maxCliLen)}  ${stepLabel}${cwdInfo}`
-      );
-    }
-    lines.push('');
-  }
-
-  // Permissions
-  if (report.permissions && report.permissions.length > 0) {
-    lines.push(`Permissions (${report.permissions.length} agents):`);
-    for (const perm of report.permissions) {
-      lines.push(
-        `  ${perm.agent}: ${perm.access} (read: ${perm.readPaths}, write: ${perm.writePaths}, deny: ${perm.denyPaths}, scopes: ${perm.scopes}) [${perm.source}]`
-      );
-    }
-    lines.push('');
-  }
-
-  // Execution Plan
-  if (report.waves.length > 0) {
-    lines.push(`Execution Plan (${report.totalSteps} steps, ${report.estimatedWaves} waves):`);
-    lines.push('');
-    for (const wave of report.waves) {
-      for (let i = 0; i < wave.steps.length; i++) {
-        const step = wave.steps[i];
-        const prefix = i === 0 ? `  Wave ${String(wave.wave).padStart(2)}:` : '          ';
-        lines.push(`${prefix}  ${step.name} (${step.agent})`);
-      }
-    }
-    lines.push('');
-  }
-
-  // Resource estimation
-  if (report.estimatedPeakConcurrency !== undefined) {
-    lines.push(`Resource Estimate:`);
-    lines.push(`  Peak Concurrency: ${report.estimatedPeakConcurrency} agents`);
-    if (report.estimatedTotalAgentSteps !== undefined) {
-      lines.push(`  Total Agent Steps: ${report.estimatedTotalAgentSteps}`);
-    }
-    lines.push('');
-  }
-
-  // Validation summary
-  if (report.errors.length > 0) {
-    lines.push(`Validation: FAIL (${report.errors.length} errors, ${report.warnings.length} warnings)`);
-    for (const err of report.errors) {
-      lines.push(`  ERROR: ${err}`);
-    }
-  } else {
-    lines.push(`Validation: PASS (0 errors, ${report.warnings.length} warnings)`);
-  }
-
-  if (report.warnings.length > 0) {
-    for (const warn of report.warnings) {
-      lines.push(`  WARNING: ${warn}`);
-    }
-  }
-
-  return lines.join('\n');
-}
diff --git a/packages/sdk/src/workflows/file-db.ts b/packages/sdk/src/workflows/file-db.ts
deleted file mode 100644
index 12b43fe11..000000000
--- a/packages/sdk/src/workflows/file-db.ts
+++ /dev/null
@@ -1,277 +0,0 @@
-import {
-  accessSync,
-  appendFileSync,
-  constants as fsConstants,
-  existsSync,
-  mkdirSync,
-  readdirSync,
-  readFileSync,
-} from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import type { WorkflowRunRow, WorkflowStepRow } from './types.js';
-import type { WorkflowDb } from './runner.js';
-
-type DbEntry = { kind: 'run'; row: WorkflowRunRow } | { kind: 'step'; row: WorkflowStepRow };
-
-/**
- * Optional hook: fired whenever a persistence write fails (e.g. EACCES,
- * ENOSPC). Surfaced so the CLI, dashboard, or bootstrap can decide how
- * to react beyond the single console.warn. Not called for the initial
- * "directory unwritable" detection — that's stored in {@link isWritable}.
- */
-export type DbWriteFailureListener = (err: unknown, filePath: string) => void;
-
-export interface JsonFileWorkflowDbOptions {
-  /** Override the resolved filePath. Kept for tests / advanced callers. */
-  filePath?: string;
-  /** Notified on every underlying write error. */
-  onWriteFailure?: DbWriteFailureListener;
-  /**
-   * When true, if the preferred file path is unwritable, fall back to
-   * `$HOME/.agent-relay/workflow-runs-<basename>.jsonl` so `--resume`
-   * still works in environments where the workflow cwd is read-only
-   * (cloud sandboxes with restrictive workspace ACLs).
-   *
-   * Defaults to `false` — strict "write to this path or run in-memory"
-   * semantics, matching the pre-cache behavior. Opt-in via `true`.
-   */
-  homeFallback?: boolean;
-}
-
-/**
- * JSONL-backed WorkflowDb for the CLI.
- *
- * Design: the **in-memory cache is the single source of truth** for the
- * process lifetime. Every mutation updates the cache synchronously and
- * then best-effort appends to the jsonl file for durability / `--resume`.
- *
- * This matters because the runtime correctness of a running workflow
- * must not depend on disk writes succeeding. If the storage path is
- * unwritable (ACL-restricted workspace, full disk, ENOSPC), the workflow
- * still progresses through its state machine correctly — we just lose
- * the ability to resume a future process from that run.
- *
- * Read paths used to re-snapshot the jsonl on every call, which meant
- * a failed `updateRun(..., { status: 'completed' })` would leave a
- * subsequent `getRun` returning the stale 'running' row from disk.
- * That bug surfaced as workflows passing per-step but reporting
- * `status: 'running'` to callers.
- *
- * Storage path resolution:
- *   1. Try the caller-supplied file path. If the parent directory is
- *      writable, use it.
- *   2. If (1) fails and `homeFallback` is true (opt-in, default false),
- *      try `$HOME/.agent-relay/workflow-runs-<basename>.jsonl`. This is
- *      outside any workspace mount in cloud sandboxes and almost always
- *      writable by the agent.
- *   3. If both fail, run in memory-only mode. The workflow still
- *      executes correctly; `--resume` won't be available for this run.
- *
- * File: `.agent-relay/workflow-runs.jsonl` in the workflow cwd by default.
- */
-export class JsonFileWorkflowDb implements WorkflowDb {
-  private readonly filePath: string;
-
-  /** Whether persistence is active. False = in-memory-only mode. */
-  private readonly writable: boolean;
-  private appendFailedOnce = false;
-  private readonly onWriteFailure?: DbWriteFailureListener;
-
-  /**
-   * Authoritative in-memory mirror. Every mutation updates this; reads
-   * return from here. The jsonl file is only consulted at construction
-   * (to replay prior state for `--resume`) and is otherwise write-only.
-   */
-  private readonly cache: {
-    runs: Map<string, WorkflowRunRow>;
-    steps: Map<string, WorkflowStepRow>;
-  };
-
-  constructor(filePathOrOptions: string | JsonFileWorkflowDbOptions) {
-    const options: JsonFileWorkflowDbOptions =
-      typeof filePathOrOptions === 'string' ? { filePath: filePathOrOptions } : filePathOrOptions;
-    this.onWriteFailure = options.onWriteFailure;
-
-    const requestedPath = options.filePath ?? path.join('.agent-relay', 'workflow-runs.jsonl');
-    const homeFallback = options.homeFallback ?? false;
-
-    const { resolvedPath, writable } = JsonFileWorkflowDb.resolveStoragePath(requestedPath, homeFallback);
-    this.filePath = resolvedPath;
-    this.writable = writable;
-
-    // Load existing state from disk (for --resume) once at construction.
-    // From this point on, the cache is authoritative.
-    this.cache = JsonFileWorkflowDb.loadSnapshot(this.filePath);
-  }
-
-  /** Returns false if persistence is not active (in-memory-only mode). */
-  isWritable(): boolean {
-    return this.writable;
-  }
-
-  /** Resolved path on disk. For tests + diagnostics. */
-  getStoragePath(): string {
-    return this.filePath;
-  }
-
-  hasStepOutputs(runId: string): boolean {
-    try {
-      const dir = path.join(path.dirname(this.filePath), 'step-outputs', runId);
-      return existsSync(dir) && readdirSync(dir).length > 0;
-    } catch {
-      return false;
-    }
-  }
-
-  // ── Private helpers ─────────────────────────────────────────────────────
-
-  private static resolveStoragePath(
-    requestedPath: string,
-    homeFallback: boolean
-  ): { resolvedPath: string; writable: boolean } {
-    const candidates: string[] = [requestedPath];
-    if (homeFallback) {
-      const base = path.basename(requestedPath) || 'workflow-runs.jsonl';
-      candidates.push(path.join(os.homedir(), '.agent-relay', `workflow-runs-${base}`));
-    }
-
-    for (let i = 0; i < candidates.length; i++) {
-      const candidate = candidates[i];
-      const isLastCandidate = i === candidates.length - 1;
-      try {
-        mkdirSync(path.dirname(candidate), { recursive: true });
-        // If there's a later fallback to try, actively probe writability
-        // so we know whether to move on. Two levels matter:
-        //   1. Directory must be writable to create the jsonl file.
-        //   2. If the jsonl file already exists, IT must also be writable
-        //      — a writable directory does not guarantee a writable file.
-        //      Relayfile-mount, for example, can sync a file and chmod it
-        //      to 0o444 while leaving the parent dir at 0o755; the old
-        //      dir-only check would accept the path and every append would
-        //      then lazy-fail, bypassing the fallback.
-        // If this is already the last candidate, skip the probe and be
-        // optimistic — an unwritable path will surface as a lazy append()
-        // failure handled by the cache + onWriteFailure path. Matches the
-        // pre-cache "warn on first failure" semantic callers expect.
-        if (!isLastCandidate) {
-          accessSync(path.dirname(candidate), fsConstants.W_OK);
-          if (existsSync(candidate)) {
-            accessSync(candidate, fsConstants.W_OK);
-          }
-        }
-        return { resolvedPath: candidate, writable: true };
-      } catch {
-        // Try the next candidate; if this was the last, fall through
-        // to memory-only.
-      }
-    }
-
-    // Memory-only mode. Path is reported for diagnostics but nothing
-    // is written to it.
-    return { resolvedPath: requestedPath, writable: false };
-  }
-
-  private static loadSnapshot(filePath: string): {
-    runs: Map<string, WorkflowRunRow>;
-    steps: Map<string, WorkflowStepRow>;
-  } {
-    const runs = new Map<string, WorkflowRunRow>();
-    const steps = new Map<string, WorkflowStepRow>();
-    let raw = '';
-    try {
-      raw = readFileSync(filePath, 'utf8');
-    } catch {
-      return { runs, steps };
-    }
-    for (const line of raw.split('\n')) {
-      const trimmed = line.trim();
-      if (!trimmed) continue;
-      try {
-        const entry = JSON.parse(trimmed) as DbEntry;
-        if (entry.kind === 'run') {
-          runs.set(entry.row.id, entry.row);
-        } else {
-          steps.set(entry.row.id, entry.row);
-        }
-      } catch {
-        // Skip malformed lines
-      }
-    }
-    return { runs, steps };
-  }
-
-  private append(entry: DbEntry): void {
-    if (!this.writable) return;
-    try {
-      appendFileSync(this.filePath, JSON.stringify(entry) + '\n', 'utf8');
-    } catch (err) {
-      // Notify every failure so callers can aggregate / surface.
-      this.onWriteFailure?.(err, this.filePath);
-      // Warn to console once per process — subsequent failures are noise.
-      if (!this.appendFailedOnce) {
-        this.appendFailedOnce = true;
-        console.warn(
-          '[workflow] warning: failed to write run state to ' +
-            this.filePath +
-            ' — --resume will not be available for this run. Use --start-from instead. ' +
-            'Error: ' +
-            (err instanceof Error ? err.message : String(err))
-        );
-      }
-    }
-  }
-
-  // ── WorkflowDb interface ─────────────────────────────────────────────────
-
-  async insertRun(run: WorkflowRunRow): Promise<void> {
-    // Shallow-copy so later mutations on the caller's object don't silently
-    // alias into the cache. Matches InMemoryWorkflowDb semantics. The runner
-    // keeps inserted rows in its own stepStates map and occasionally mutates
-    // state.row.status directly before calling updateRun — without this copy
-    // the mutation would land in the cache and bypass updateRun's
-    // updatedAt + append path, causing exactly the observability hazard this
-    // cache is meant to prevent.
-    this.cache.runs.set(run.id, { ...run });
-    this.append({ kind: 'run', row: run });
-  }
-
-  async updateRun(id: string, patch: Partial<WorkflowRunRow>): Promise<void> {
-    const existing = this.cache.runs.get(id);
-    if (!existing) return;
-    const updated: WorkflowRunRow = {
-      ...existing,
-      ...patch,
-      updatedAt: new Date().toISOString(),
-    };
-    this.cache.runs.set(id, updated);
-    this.append({ kind: 'run', row: updated });
-  }
-
-  async getRun(id: string): Promise<WorkflowRunRow | null> {
-    return this.cache.runs.get(id) ?? null;
-  }
-
-  async insertStep(step: WorkflowStepRow): Promise<void> {
-    // Shallow-copy to prevent caller-mutation aliasing — see insertRun.
-    this.cache.steps.set(step.id, { ...step });
-    this.append({ kind: 'step', row: step });
-  }
-
-  async updateStep(id: string, patch: Partial<WorkflowStepRow>): Promise<void> {
-    const existing = this.cache.steps.get(id);
-    if (!existing) return;
-    const updated: WorkflowStepRow = {
-      ...existing,
-      ...patch,
-      updatedAt: new Date().toISOString(),
-    };
-    this.cache.steps.set(id, updated);
-    this.append({ kind: 'step', row: updated });
-  }
-
-  async getStepsByRunId(runId: string): Promise<WorkflowStepRow[]> {
-    return Array.from(this.cache.steps.values()).filter((s) => s.runId === runId);
-  }
-}
diff --git a/packages/sdk/src/workflows/index.ts b/packages/sdk/src/workflows/index.ts
deleted file mode 100644
index 95a8ed6dd..000000000
--- a/packages/sdk/src/workflows/index.ts
+++ /dev/null
@@ -1,64 +0,0 @@
-export * from './types.js';
-export * from './runner.js';
-export * from './custom-steps.js';
-export * from './cli-session-collector.js';
-export * from './channel-messenger.js';
-export * from './process-spawner.js';
-export {
-  createProcessBackendExecutor,
-  type ProcessBackendExecutorOptions,
-} from './process-backend-executor.js';
-export * from './run-summary-table.js';
-export * from './template-resolver.js';
-export * from './verification.js';
-export {
-  StepExecutor,
-  /** @deprecated Use {@link StepExecutor} instead. */
-  StepExecutor as WorkflowStepLifecycleExecutor,
-  type StepExecutorDeps,
-  type StepResult,
-  type StepSchedule,
-} from './step-executor.js';
-export {
-  Models,
-  ClaudeModels,
-  CodexModels,
-  GeminiModels,
-  CursorModels,
-  CLIs,
-  CLIVersions,
-  CLIRegistry,
-  SwarmPatterns,
-} from '../models.js';
-export * from './memory-db.js';
-export * from './file-db.js';
-export * from './run.js';
-export * from './cloud-schedules.js';
-export * from './builder.js';
-export * from './coordinator.js';
-export * from './barrier.js';
-export * from './state.js';
-export * from './templates.js';
-export { WorkflowTrajectory, type StepOutcome } from './trajectory.js';
-export { formatDryRunReport } from './dry-run-format.js';
-export { createWorkflowRenderer, type WorkflowRenderer } from './listr-renderer.js';
-export { createDefaultEventLogger } from './default-logger.js';
-export { executeApiStep, type ApiExecutorOptions } from './api-executor.js';
-export type { CloudRunOptions } from './cloud-runner.js';
-export * from './proxy-env.js';
-export * from './budget-tracker.js';
-export { applySiblingLinks, buildSiblingLinkScript } from './sibling-links.js';
-export type { SiblingLink, SiblingLinkOptions } from './sibling-links.js';
-export {
-  runScriptWorkflow,
-  parseTsxStderr,
-  formatWorkflowParseError,
-  findLocalSdkWorkspace,
-  ensureLocalSdkWorkflowRuntime,
-} from './run-script.js';
-export type {
-  RunScriptWorkflowOptions,
-  ParsedWorkflowError,
-  LocalSdkWorkspace,
-  ExecFileSyncLike,
-} from './run-script.js';
diff --git a/packages/sdk/src/workflows/listr-renderer.ts b/packages/sdk/src/workflows/listr-renderer.ts
deleted file mode 100644
index f88a8be23..000000000
--- a/packages/sdk/src/workflows/listr-renderer.ts
+++ /dev/null
@@ -1,276 +0,0 @@
-import chalk from 'chalk';
-import type { ListrTask } from 'listr2';
-import type { WorkflowEvent, WorkflowEventListener } from './runner.js';
-
-// Filter console.log while listr owns the terminal.
-// Blocks [broker] noise and [workflow HH:MM] timing lines, but lets the
-// observer URL and channel name through so users can track the run.
-function installOutputFilter(): () => void {
-  const orig = console.log.bind(console);
-  console.log = (...args: unknown[]) => {
-    const str = String(args[0] ?? '');
-    // Always show the observer URL and channel so users can follow the run
-    if (str.includes('Observer:') || str.includes('agentrelay.com') || str.includes('Channel: wf-')) {
-      orig(...args);
-      return;
-    }
-    // Block [broker] lines and [workflow HH:MM] timing lines
-    if (/\[broker\]/.test(str) || /\[workflow\s+\d{2}:\d{2}\]/.test(str)) return;
-    orig(...args);
-  };
-  return () => {
-    console.log = orig;
-  };
-}
-
-interface RenderableTask {
-  title: string;
-  output: string;
-}
-
-interface StepHandle {
-  resolve: () => void;
-  reject: (error: Error) => void;
-  setOutput: (text: string) => void;
-  markSkipped: () => void;
-}
-
-export interface WorkflowRenderer {
-  /** Pass this to `.run({ onEvent })` in your TypeScript workflow. */
-  onEvent: WorkflowEventListener;
-  /** Start the listr renderer. Run this concurrently with your workflow. */
-  start: () => Promise<void>;
-  /** Restore console.log after the workflow finishes. */
-  unmount: () => void;
-}
-
-/**
- * Creates a listr2-based renderer for TypeScript workflows.
- *
- * @example
- * ```typescript
- * import { workflow, createWorkflowRenderer } from '@agent-relay/sdk/workflows';
- *
- * const renderer = createWorkflowRenderer();
- * const [result] = await Promise.all([
- *   workflow('my-workflow').step(...).run({ onEvent: renderer.onEvent }),
- *   renderer.start(),
- * ]);
- * renderer.unmount();
- * ```
- */
-export function createWorkflowRenderer(): WorkflowRenderer {
-  const stepHandles = new Map<string, StepHandle>();
-
-  let resolveWorkflow!: () => void;
-  let rejectWorkflow!: (error: Error) => void;
-  const workflowDone = new Promise<void>((resolve, reject) => {
-    resolveWorkflow = resolve;
-    rejectWorkflow = reject;
-  });
-  // Prevent unhandled rejection if run:failed fires before the header task
-  // reaches `await workflowDone`.
-  workflowDone.catch(() => {});
-
-  let setHeader: (text: string) => void = () => {};
-  // eslint-disable-next-line @typescript-eslint/no-explicit-any
-  let listr: any = null;
-  const pendingAdds: ListrTask[] = [];
-
-  async function ensureListr(): Promise<any> {
-    if (listr) return listr;
-    const { Listr } = await import('listr2');
-    listr = new (Listr as any)(
-      [
-        {
-          title: chalk.dim('Workflow starting...'),
-          task: async (_ctx, task): Promise<void> => {
-            setHeader = (text: string): void => {
-              task.title = text;
-            };
-            await workflowDone;
-          },
-        } as ListrTask,
-      ],
-      {
-        concurrent: true,
-        renderer: process.stdout.isTTY ? 'default' : 'verbose',
-        rendererOptions: {
-          collapseErrors: false,
-          showErrorMessage: true,
-        },
-      }
-    );
-    for (const task of pendingAdds) listr.add(task);
-    pendingAdds.length = 0;
-    return listr;
-  }
-
-  const addTask = (task: ListrTask): void => {
-    if (listr) listr.add(task);
-    else pendingAdds.push(task);
-  };
-
-  const onEvent: WorkflowEventListener = (event: WorkflowEvent) => {
-    switch (event.type) {
-      case 'run:started': {
-        setHeader(chalk.dim(`[workflow] run ${event.runId.slice(0, 8)}...`));
-        break;
-      }
-
-      case 'step:started': {
-        let resolveStep!: () => void;
-        let rejectStep!: (error: Error) => void;
-        let taskRef: RenderableTask | null = null;
-        let skipped = false;
-
-        const done = new Promise<void>((resolve, reject) => {
-          resolveStep = resolve;
-          rejectStep = reject;
-        });
-        // Prevent unhandled rejection if the step fails before the listr
-        // task function has started and reached `await done`.
-        done.catch(() => {});
-
-        stepHandles.set(event.stepName, {
-          resolve: resolveStep,
-          reject: rejectStep,
-          setOutput: (text: string) => {
-            if (taskRef) taskRef.output = text;
-          },
-          markSkipped: () => {
-            skipped = true;
-            if (taskRef) taskRef.title = chalk.dim(`${event.stepName} (skipped)`);
-          },
-        });
-
-        addTask({
-          title: chalk.white(event.stepName),
-          task: async (_ctx, task): Promise<void> => {
-            taskRef = task as RenderableTask;
-            if (skipped) taskRef.title = chalk.dim(`${event.stepName} (skipped)`);
-            await done;
-          },
-          rendererOptions: { persistentOutput: true },
-        } as ListrTask);
-        break;
-      }
-
-      case 'step:owner-assigned': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.setOutput(
-            chalk.dim(`> Owner: ${event.ownerName}`) +
-              (event.specialistName ? chalk.dim(` · specialist: ${event.specialistName}`) : '')
-          );
-        }
-        break;
-      }
-
-      case 'step:retrying': {
-        stepHandles.get(event.stepName)?.setOutput(chalk.yellow(`Retrying (attempt ${event.attempt})`));
-        break;
-      }
-
-      case 'step:nudged': {
-        stepHandles.get(event.stepName)?.setOutput(chalk.dim(`> Nudge #${event.nudgeCount}`));
-        break;
-      }
-
-      case 'step:force-released': {
-        stepHandles.get(event.stepName)?.setOutput(chalk.yellow('> Force-released'));
-        break;
-      }
-
-      case 'step:review-completed': {
-        stepHandles
-          .get(event.stepName)
-          ?.setOutput(chalk.dim(`> Review: ${event.decision} by ${event.reviewerName}`));
-        break;
-      }
-
-      case 'step:owner-timeout': {
-        stepHandles.get(event.stepName)?.setOutput(chalk.red(`> Owner ${event.ownerName} timed out`));
-        break;
-      }
-
-      case 'step:agent-report': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          const model = event.report.model ? `:${event.report.model}` : '';
-          handle.setOutput(chalk.dim(`> Report collected (${event.report.cli}${model})`));
-        }
-        break;
-      }
-
-      case 'step:completed': {
-        stepHandles.get(event.stepName)?.resolve();
-        break;
-      }
-
-      case 'step:skipped': {
-        const handle = stepHandles.get(event.stepName);
-        if (handle) {
-          handle.markSkipped();
-          handle.resolve();
-        } else {
-          // Step was skipped without ever being started (downstream of a failure).
-          addTask({
-            title: chalk.dim(`${event.stepName} (skipped)`),
-            task: async (): Promise<void> => {},
-            rendererOptions: { persistentOutput: true },
-          } as ListrTask);
-        }
-        break;
-      }
-
-      case 'step:failed': {
-        stepHandles.get(event.stepName)?.reject(new Error(event.error ?? 'Step failed'));
-        break;
-      }
-
-      case 'run:completed': {
-        setHeader(chalk.green('Workflow completed'));
-        resolveWorkflow();
-        break;
-      }
-
-      case 'run:failed': {
-        setHeader(chalk.red(`Workflow failed: ${event.error ?? 'unknown error'}`));
-        rejectWorkflow(new Error(event.error ?? 'Workflow failed'));
-        break;
-      }
-
-      case 'run:cancelled': {
-        setHeader(chalk.yellow('Workflow cancelled'));
-        resolveWorkflow();
-        break;
-      }
-
-      case 'broker:event':
-        break;
-
-      default: {
-        const _exhaustive: never = event;
-        void _exhaustive;
-      }
-    }
-  };
-
-  let restoreConsole: (() => void) | undefined;
-
-  return {
-    onEvent,
-    start: async () => {
-      restoreConsole = installOutputFilter();
-      const l = await ensureListr();
-      return l.run().catch(() => {
-        // Step failures are already represented in the workflow result.
-      });
-    },
-    unmount: () => {
-      restoreConsole?.();
-      restoreConsole = undefined;
-    },
-  };
-}
diff --git a/packages/sdk/src/workflows/memory-db.ts b/packages/sdk/src/workflows/memory-db.ts
deleted file mode 100644
index 980bace38..000000000
--- a/packages/sdk/src/workflows/memory-db.ts
+++ /dev/null
@@ -1,39 +0,0 @@
-import type { WorkflowRunRow, WorkflowStepRow } from './types.js';
-import type { WorkflowDb } from './runner.js';
-
-/**
- * In-memory implementation of WorkflowDb for local workflow runs.
- * No persistence — state lives only for the duration of the process.
- */
-export class InMemoryWorkflowDb implements WorkflowDb {
-  private runs = new Map<string, WorkflowRunRow>();
-  private steps = new Map<string, WorkflowStepRow>();
-
-  async insertRun(run: WorkflowRunRow): Promise<void> {
-    this.runs.set(run.id, { ...run });
-  }
-
-  async updateRun(id: string, patch: Partial<WorkflowRunRow>): Promise<void> {
-    const existing = this.runs.get(id);
-    if (!existing) return;
-    this.runs.set(id, { ...existing, ...patch, updatedAt: new Date().toISOString() });
-  }
-
-  async getRun(id: string): Promise<WorkflowRunRow | null> {
-    return this.runs.get(id) ?? null;
-  }
-
-  async insertStep(step: WorkflowStepRow): Promise<void> {
-    this.steps.set(step.id, { ...step });
-  }
-
-  async updateStep(id: string, patch: Partial<WorkflowStepRow>): Promise<void> {
-    const existing = this.steps.get(id);
-    if (!existing) return;
-    this.steps.set(id, { ...existing, ...patch, updatedAt: new Date().toISOString() });
-  }
-
-  async getStepsByRunId(runId: string): Promise<WorkflowStepRow[]> {
-    return Array.from(this.steps.values()).filter((s) => s.runId === runId);
-  }
-}
diff --git a/packages/sdk/src/workflows/process-backend-executor.ts b/packages/sdk/src/workflows/process-backend-executor.ts
deleted file mode 100644
index d578fcea7..000000000
--- a/packages/sdk/src/workflows/process-backend-executor.ts
+++ /dev/null
@@ -1,102 +0,0 @@
-/**
- * Adapter that implements {@link RunnerStepExecutor} on top of a
- * {@link ProcessBackend}. Relay owns command construction (CLI flags, env,
- * cwd, timeout); the backend only provides "where to run" — create an
- * isolated environment, exec the command, destroy.
- *
- * The WorkflowRunner synthesizes one of these when a caller passes
- * `processBackend` without an explicit `executor`, so every existing
- * `executor.executeAgentStep(...)` call site transparently flows through
- * the backend (e.g. a cloud sandbox) without any further plumbing.
- */
-
-import { buildCommand } from './process-spawner.js';
-import type { ProcessBackend, AgentDefinition, WorkflowStep, RunnerStepExecutor } from './types.js';
-
-function shellEscape(value: string): string {
-  if (value === '') return "''";
-  if (/^[A-Za-z0-9_\/.:,=+@%-]+$/.test(value)) return value;
-  return `'${value.replace(/'/g, `'\\''`)}'`;
-}
-
-function commandToShell(argv: string[]): string {
-  return argv.map(shellEscape).join(' ');
-}
-
-export interface ProcessBackendExecutorOptions {
-  /** Env vars injected into every step (e.g. auth tokens, relayfile config). */
-  env?: Record<string, string>;
-}
-
-export function createProcessBackendExecutor(
-  backend: ProcessBackend,
-  options: ProcessBackendExecutorOptions = {}
-): RunnerStepExecutor {
-  const baseEnv = options.env ?? {};
-
-  return {
-    async executeAgentStep(
-      step: WorkflowStep,
-      agentDef: AgentDefinition,
-      resolvedTask: string,
-      timeoutMs?: number
-    ): Promise<string> {
-      if (agentDef.cli === 'api') {
-        throw new Error(
-          `processBackend cannot execute cli "api" agents — api agents call the Anthropic API directly. ` +
-            `Route agent "${agentDef.name}" through a subprocess CLI (claude, codex, etc.) or omit processBackend.`
-        );
-      }
-
-      const extraArgs = agentDef.constraints?.model ? ['--model', agentDef.constraints.model] : [];
-      const argv = buildCommand(agentDef.cli, extraArgs, resolvedTask);
-      const commandString = commandToShell(argv);
-
-      const env = await backend.createEnvironment(step.name);
-      try {
-        const execOpts: {
-          cwd?: string;
-          env?: Record<string, string>;
-          timeoutSeconds?: number;
-        } = {};
-        if (agentDef.cwd) execOpts.cwd = agentDef.cwd;
-        if (Object.keys(baseEnv).length > 0) execOpts.env = baseEnv;
-        // timeoutSeconds is ceil-rounded from the caller's timeoutMs; a 500ms
-        // timeout becomes 1s because the backend protocol uses seconds.
-        if (timeoutMs && timeoutMs > 0) {
-          execOpts.timeoutSeconds = Math.max(1, Math.ceil(timeoutMs / 1000));
-        }
-        const result = await env.exec(commandString, execOpts);
-        if (result.exitCode !== 0) {
-          const tail = result.output.slice(-2000);
-          throw new Error(`Agent step "${step.name}" exited with code ${result.exitCode}: ${tail}`);
-        }
-        return result.output;
-      } finally {
-        await env.destroy().catch(() => undefined);
-      }
-    },
-
-    async executeDeterministicStep(
-      step: WorkflowStep,
-      resolvedCommand: string,
-      cwd: string
-    ): Promise<{ output: string; exitCode: number }> {
-      const env = await backend.createEnvironment(step.name);
-      try {
-        const execOpts: {
-          cwd?: string;
-          env?: Record<string, string>;
-          timeoutSeconds?: number;
-        } = { cwd };
-        if (Object.keys(baseEnv).length > 0) execOpts.env = baseEnv;
-        if (step.timeoutMs && step.timeoutMs > 0) {
-          execOpts.timeoutSeconds = Math.max(1, Math.ceil(step.timeoutMs / 1000));
-        }
-        return await env.exec(resolvedCommand, execOpts);
-      } finally {
-        await env.destroy().catch(() => undefined);
-      }
-    },
-  };
-}
diff --git a/packages/sdk/src/workflows/process-spawner.ts b/packages/sdk/src/workflows/process-spawner.ts
deleted file mode 100644
index 2c3c74fd7..000000000
--- a/packages/sdk/src/workflows/process-spawner.ts
+++ /dev/null
@@ -1,201 +0,0 @@
-import { spawn as cpSpawn } from 'node:child_process';
-import type { ChildProcess, SpawnOptions } from 'node:child_process';
-
-import { getCliDefinition } from '../cli-registry.js';
-import { resolveCliSync } from '../cli-resolver.js';
-import { runVerification } from './verification.js';
-import type { AgentCli, AgentDefinition, VerificationCheck } from './types.js';
-
-export interface SpawnOutcome {
-  output: string;
-  exitCode?: number;
-  exitSignal?: string;
-}
-
-export interface SpawnCommand {
-  bin: string;
-  args: string[];
-  env?: Record<string, string>;
-}
-
-export interface ShellOpts {
-  cwd: string;
-  timeoutMs?: number;
-}
-
-// eslint-disable-next-line @typescript-eslint/no-empty-object-type
-export interface AgentOpts extends ShellOpts {}
-
-// eslint-disable-next-line @typescript-eslint/no-empty-object-type
-export interface InteractiveOpts extends ShellOpts {}
-
-export interface ProcessSpawnerDeps {
-  cwd: string;
-}
-
-export interface ProcessSpawner {
-  spawnShell(command: string, opts: ShellOpts): Promise<SpawnOutcome>;
-  spawnAgent(agent: AgentDefinition, task: string, opts: AgentOpts): Promise<SpawnOutcome>;
-  spawnInteractive(agent: AgentDefinition, task: string, opts: InteractiveOpts): Promise<SpawnOutcome>;
-  buildCommand(agent: AgentDefinition, task: string): SpawnCommand;
-}
-
-function resolveNonInteractiveCli(cli: AgentCli): AgentCli {
-  if (cli !== 'cursor') {
-    return cli;
-  }
-
-  const resolved = resolveCliSync('cursor');
-  return (resolved?.binary as 'cursor-agent' | 'agent' | undefined) ?? 'agent';
-}
-
-export function buildCommand(cli: AgentCli, extraArgs: string[] = [], task: string): string[] {
-  if (cli === 'api') {
-    throw new Error('cli "api" uses direct API calls, not a subprocess command');
-  }
-
-  const resolvedCli = resolveNonInteractiveCli(cli);
-  const definition = getCliDefinition(resolvedCli);
-  if (!definition || definition.binaries.length === 0) {
-    throw new Error(`Unknown or non-executable CLI: ${resolvedCli}`);
-  }
-
-  return [definition.binaries[0], ...definition.nonInteractiveArgs(task, extraArgs)];
-}
-
-export function spawnProcess(command: string[], options: SpawnOptions): ChildProcess {
-  const [bin, ...args] = command;
-  return cpSpawn(bin, args, options);
-}
-
-export function collectOutput(process: ChildProcess): Promise<string> {
-  return new Promise<string>((resolve, reject) => {
-    let settled = false;
-    const stdout: string[] = [];
-    const stderr: string[] = [];
-
-    process.stdout?.on('data', (chunk: Buffer | string) => {
-      stdout.push(chunk.toString());
-    });
-
-    process.stderr?.on('data', (chunk: Buffer | string) => {
-      stderr.push(chunk.toString());
-    });
-
-    process.once('error', (err) => {
-      if (!settled) {
-        settled = true;
-        reject(err);
-      }
-    });
-    process.once('close', () => {
-      if (!settled) {
-        settled = true;
-        resolve(`${stdout.join('')}${stderr.join('')}`);
-      }
-    });
-  });
-}
-
-export function detectCompletion(output: string, verification?: VerificationCheck): boolean {
-  if (/OWNER_DECISION:\s*(?:INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION)\b/i.test(output)) {
-    return false;
-  }
-
-  if (/OWNER_DECISION:\s*COMPLETE\b/i.test(output)) {
-    return true;
-  }
-
-  if (/\bSTEP_COMPLETE:([A-Za-z0-9_.:-]+)/.test(output)) {
-    return true;
-  }
-
-  if (!verification) {
-    return false;
-  }
-
-  return runVerification(verification, output, 'process', undefined, { allowFailure: true }).passed;
-}
-
-async function runCommand(command: SpawnCommand, opts: ShellOpts): Promise<SpawnOutcome> {
-  const child = spawnProcess([command.bin, ...command.args], {
-    cwd: opts.cwd,
-    env: { ...process.env, ...command.env },
-    stdio: 'pipe',
-  });
-
-  const outputPromise = collectOutput(child);
-  const exitPromise = new Promise<{ exitCode?: number; exitSignal?: string }>((resolve, reject) => {
-    let timedOut = false;
-    let timer: ReturnType<typeof setTimeout> | undefined;
-    let killTimer: ReturnType<typeof setTimeout> | undefined;
-
-    if (opts.timeoutMs) {
-      timer = setTimeout(() => {
-        timedOut = true;
-        child.kill('SIGTERM');
-        killTimer = setTimeout(() => child.kill('SIGKILL'), 5000);
-      }, opts.timeoutMs);
-    }
-
-    const clearTimer = () => {
-      if (timer) clearTimeout(timer);
-      if (killTimer) clearTimeout(killTimer);
-    };
-
-    child.once('error', (error) => {
-      clearTimer();
-      reject(error);
-    });
-
-    child.once('close', (exitCode, exitSignal) => {
-      clearTimer();
-
-      if (timedOut) {
-        reject(new Error(`Process timed out after ${opts.timeoutMs ?? 'unknown'}ms`));
-        return;
-      }
-
-      resolve({
-        exitCode: exitCode ?? undefined,
-        exitSignal: exitSignal ?? undefined,
-      });
-    });
-  });
-
-  const [outputResult, exitResult] = await Promise.allSettled([outputPromise, exitPromise]);
-  const output = outputResult.status === 'fulfilled' ? outputResult.value : '';
-  if (exitResult.status === 'rejected') {
-    const err = exitResult.reason instanceof Error ? exitResult.reason : new Error(String(exitResult.reason));
-    (err as Error & { partialOutput?: string }).partialOutput = output;
-    throw err;
-  }
-  return {
-    output,
-    exitCode: exitResult.value.exitCode,
-    exitSignal: exitResult.value.exitSignal,
-  };
-}
-
-export function createProcessSpawner(deps: ProcessSpawnerDeps): ProcessSpawner {
-  const buildAgentCommand = (agent: AgentDefinition, task: string): SpawnCommand => {
-    const extraArgs = agent.constraints?.model ? ['--model', agent.constraints.model] : [];
-    const [bin, ...args] = buildCommand(agent.cli, extraArgs, task);
-    return { bin, args };
-  };
-
-  return {
-    async spawnShell(command, opts) {
-      return runCommand({ bin: 'sh', args: ['-c', command] }, { ...opts, cwd: opts.cwd ?? deps.cwd });
-    },
-    async spawnAgent(agent, task, opts) {
-      return runCommand(buildAgentCommand(agent, task), { ...opts, cwd: opts.cwd ?? deps.cwd });
-    },
-    async spawnInteractive(agent, task, opts) {
-      return runCommand(buildAgentCommand(agent, task), { ...opts, cwd: opts.cwd ?? deps.cwd });
-    },
-    buildCommand(agent, task) {
-      return buildAgentCommand(agent, task);
-    },
-  };
-}
diff --git a/packages/sdk/src/workflows/proxy-env.ts b/packages/sdk/src/workflows/proxy-env.ts
deleted file mode 100644
index 29fb641e7..000000000
--- a/packages/sdk/src/workflows/proxy-env.ts
+++ /dev/null
@@ -1,133 +0,0 @@
-import { getCliDefinition } from '../cli-registry.js';
-import type { AgentDefinition, SwarmConfig } from './types.js';
-
-export interface ProxyEnvBinding {
-  baseUrlVar: string;
-  apiKeyVar: string;
-}
-
-export type ProxyEnvRegistry = Record<string, readonly ProxyEnvBinding[]>;
-
-export const RELAY_PROXY_URL_ENV = 'RELAY_LLM_PROXY' as const;
-export const RELAY_PROXY_URL_ENV_ALIAS = 'RELAY_LLM_PROXY_URL' as const;
-export const RELAY_PROXY_TOKEN_ENV = 'CREDENTIAL_PROXY_TOKEN' as const;
-export const RELAY_PROXY_TOKEN_ENV_ALIAS = 'RELAY_LLM_PROXY_TOKEN' as const;
-
-const OPENAI_COMPATIBLE_BINDINGS = [
-  { baseUrlVar: 'OPENAI_BASE_URL', apiKeyVar: 'OPENAI_API_KEY' },
-] as const satisfies readonly ProxyEnvBinding[];
-
-const ANTHROPIC_BINDINGS = [
-  { baseUrlVar: 'ANTHROPIC_BASE_URL', apiKeyVar: 'ANTHROPIC_API_KEY' },
-] as const satisfies readonly ProxyEnvBinding[];
-
-const AIDER_BINDINGS = [
-  { baseUrlVar: 'OPENAI_API_BASE', apiKeyVar: 'OPENAI_API_KEY' },
-] as const satisfies readonly ProxyEnvBinding[];
-
-const GEMINI_BINDINGS = [
-  { baseUrlVar: 'GOOGLE_API_BASE', apiKeyVar: 'GOOGLE_API_KEY' },
-] as const satisfies readonly ProxyEnvBinding[];
-
-const GENERIC_FALLBACK_BINDINGS = [
-  ...OPENAI_COMPATIBLE_BINDINGS,
-  ...ANTHROPIC_BINDINGS,
-] as const satisfies readonly ProxyEnvBinding[];
-
-const STRIPPED_API_KEY_VARS = [
-  'OPENAI_API_KEY',
-  'ANTHROPIC_API_KEY',
-  'OPENROUTER_API_KEY',
-  'GOOGLE_API_KEY',
-  'OPENAI_BASE_URL',
-  'ANTHROPIC_BASE_URL',
-  'OPENAI_API_BASE',
-  'GOOGLE_API_BASE',
-] as const;
-
-const CLI_ALIASES: Record<string, string> = {
-  agent: 'cursor',
-  'cursor-agent': 'cursor',
-};
-
-export const DEFAULT_PROXY_ENV_REGISTRY = {
-  claude: ANTHROPIC_BINDINGS,
-  codex: OPENAI_COMPATIBLE_BINDINGS,
-  opencode: OPENAI_COMPATIBLE_BINDINGS,
-  aider: AIDER_BINDINGS,
-  gemini: GEMINI_BINDINGS,
-  goose: OPENAI_COMPATIBLE_BINDINGS,
-  droid: OPENAI_COMPATIBLE_BINDINGS,
-  cursor: OPENAI_COMPATIBLE_BINDINGS,
-} as const satisfies ProxyEnvRegistry;
-
-function normalizeCli(cli: string): string {
-  const baseCli = cli.includes(':') ? cli.split(':')[0] : cli;
-  return CLI_ALIASES[baseCli] ?? baseCli;
-}
-
-function buildProxyEnv(
-  bindings: readonly ProxyEnvBinding[],
-  proxyUrl: string,
-  proxyToken: string
-): Record<string, string> {
-  return bindings.reduce<Record<string, string>>((env, binding) => {
-    env[binding.baseUrlVar] = proxyUrl;
-    env[binding.apiKeyVar] = proxyToken;
-    return env;
-  }, {});
-}
-
-export function createProxyEnvResolver(registry: ProxyEnvRegistry = DEFAULT_PROXY_ENV_REGISTRY) {
-  return (cli: string, proxyUrl: string, proxyToken: string): Record<string, string> => {
-    const normalizedCli = normalizeCli(cli);
-    const bindings = registry[normalizedCli];
-
-    if (bindings) {
-      return buildProxyEnv(bindings, proxyUrl, proxyToken);
-    }
-
-    const knownCli = getCliDefinition(normalizedCli);
-    const warningPrefix = knownCli ? 'No proxy env registry entry' : 'Unknown CLI';
-    console.warn(
-      `[proxy-env] ${warningPrefix} for "${normalizedCli}". ` +
-        'Falling back to generic OpenAI/Anthropic proxy env overrides.'
-    );
-
-    return buildProxyEnv(GENERIC_FALLBACK_BINDINGS, proxyUrl, proxyToken);
-  };
-}
-
-export const resolveProxyEnv = createProxyEnvResolver();
-
-export function resolveProxyUrlFromEnv(
-  env: Record<string, string | undefined> = process.env
-): string | undefined {
-  return env[RELAY_PROXY_URL_ENV] ?? env[RELAY_PROXY_URL_ENV_ALIAS];
-}
-
-export function resolveProxyTokenFromEnv(
-  env: Record<string, string | undefined> = process.env
-): string | undefined {
-  return env[RELAY_PROXY_TOKEN_ENV] ?? env[RELAY_PROXY_TOKEN_ENV_ALIAS];
-}
-
-export function buildNormalizedProxyEnv(proxyUrl: string, proxyToken: string): Record<string, string> {
-  return {
-    [RELAY_PROXY_URL_ENV]: proxyUrl,
-    [RELAY_PROXY_URL_ENV_ALIAS]: proxyUrl,
-    [RELAY_PROXY_TOKEN_ENV]: proxyToken,
-    [RELAY_PROXY_TOKEN_ENV_ALIAS]: proxyToken,
-  };
-}
-
-export function getStrippedApiKeyVars(): string[] {
-  return [...STRIPPED_API_KEY_VARS];
-}
-
-export function isProxyEnabled(
-  agentDef?: Pick<AgentDefinition, 'credentials'> | null,
-  swarmConfig?: Pick<SwarmConfig, 'credentialProxy'> | null
-): boolean {
-  return Boolean(agentDef?.credentials?.proxy && swarmConfig?.credentialProxy);
-}
diff --git a/packages/sdk/src/workflows/run-script.ts b/packages/sdk/src/workflows/run-script.ts
deleted file mode 100644
index 2ca667b39..000000000
--- a/packages/sdk/src/workflows/run-script.ts
+++ /dev/null
@@ -1,630 +0,0 @@
-/**
- * Programmatic local runner for `.ts` / `.tsx` / `.py` workflow scripts.
- *
- * This is the body of the `agent-relay run <script>` command extracted into
- * the SDK so other tools (e.g. `ricky run`) can drive the same execution
- * flow without shelling out to the `agent-relay` binary.
- *
- * Behavior is preserved exactly — the relay CLI's `run` command now
- * delegates to `runScriptWorkflow()` with no semantic change.
- */
-
-import fs from 'node:fs';
-import path from 'node:path';
-import { execFileSync, spawn as spawnProcess, spawnSync } from 'node:child_process';
-
-// ── Types ────────────────────────────────────────────────────────────────────
-
-export type ExecFileSyncLike = typeof execFileSync;
-
-export interface RunScriptWorkflowOptions {
-  /** Validate without running. Sets `DRY_RUN=true` in the child env. */
-  dryRun?: boolean;
-  /** Resume a previously failed workflow run by id. */
-  resume?: string;
-  /** Start from the given step name, skipping predecessors. */
-  startFrom?: string;
-  /** Use cached outputs from this previous run id. Pairs with `startFrom`. */
-  previousRunId?: string;
-}
-
-/**
- * Parsed workflow parse error, normalized from whatever shape the tsx/esbuild
- * subprocess produced on stderr. Decoupling this from any specific error class
- * means the formatter is testable in isolation and works regardless of how
- * the error surfaced (TransformError from tsx, Bun-bundled esbuild error, etc.).
- */
-export interface ParsedWorkflowError {
-  file: string;
-  line?: number;
-  column?: number;
-  message: string;
-  lineText?: string;
-}
-
-export interface LocalSdkWorkspace {
-  rootDir: string;
-  sdkDir: string;
-}
-
-interface SpawnRunnerResult {
-  status: number | null;
-  stderr: string;
-  error?: NodeJS.ErrnoException;
-}
-
-// ── Diagnostics ──────────────────────────────────────────────────────────────
-
-function diag(msg: string): void {
-  try {
-    process.stderr.write(`[agent-relay] ${msg}\n`);
-  } catch {
-    try {
-      process.stdout.write(`[agent-relay] ${msg}\n`);
-    } catch {
-      // Both streams closed — silently give up. Never throw from diag().
-    }
-  }
-}
-
-// ── Local SDK workspace detection ────────────────────────────────────────────
-
-/**
- * Walk upward from `startDir` looking for a workspace where the root
- * `package.json` is `agent-relay` and `packages/sdk/package.json` is
- * `@agent-relay/sdk`. Returns the matched paths or `null`.
- */
-export function findLocalSdkWorkspace(startDir: string): LocalSdkWorkspace | null {
-  let current = path.resolve(startDir);
-  const root = path.parse(current).root;
-
-  while (true) {
-    const packageJsonPath = path.join(current, 'package.json');
-    const sdkDir = path.join(current, 'packages', 'sdk');
-    const sdkPackageJsonPath = path.join(sdkDir, 'package.json');
-
-    try {
-      if (fs.existsSync(packageJsonPath) && fs.existsSync(sdkPackageJsonPath)) {
-        const pkg = JSON.parse(fs.readFileSync(packageJsonPath, 'utf8')) as { name?: string };
-        const sdkPkg = JSON.parse(fs.readFileSync(sdkPackageJsonPath, 'utf8')) as { name?: string };
-        if (pkg.name === 'agent-relay' && sdkPkg.name === '@agent-relay/sdk') {
-          return { rootDir: current, sdkDir };
-        }
-      }
-    } catch {
-      // Ignore parse/read errors and continue walking upward.
-    }
-
-    if (current === root) return null;
-    current = path.dirname(current);
-  }
-}
-
-/**
- * When running inside the relay monorepo, ensure `packages/sdk/dist/workflows`
- * is built so the script can resolve `@agent-relay/sdk/workflows`. No-op
- * outside the monorepo or when the build is already present.
- */
-export function ensureLocalSdkWorkflowRuntime(
-  startDir: string,
-  execRunner: ExecFileSyncLike = execFileSync
-): void {
-  const workspace = findLocalSdkWorkspace(startDir);
-  if (!workspace) return;
-
-  const workflowsEntry = path.join(workspace.sdkDir, 'dist', 'workflows', 'index.js');
-  if (fs.existsSync(workflowsEntry)) return;
-
-  console.log(
-    '[agent-relay] Detected local @agent-relay/sdk workspace without built workflows runtime; building SDK workflow dependencies...'
-  );
-  const buildCommands: string[][] = [
-    ['run', 'build:config'],
-    ['--prefix', 'packages/workflow-types', 'run', 'build'],
-    ['--prefix', 'packages/github-primitive', 'run', 'build'],
-    ['--prefix', 'packages/slack-primitive', 'run', 'build'],
-    ['--prefix', 'packages/cloud', 'run', 'build'],
-    ['run', 'build:sdk'],
-  ];
-  for (const args of buildCommands) {
-    execRunner('npm', args, {
-      cwd: workspace.rootDir,
-      stdio: 'inherit',
-      env: process.env,
-    });
-  }
-
-  if (!fs.existsSync(workflowsEntry)) {
-    throw new Error(`Local SDK workflows runtime is still missing after build: ${workflowsEntry}`);
-  }
-}
-
-// ── Workflow parse error normalization ───────────────────────────────────────
-
-/**
- * Parse tsx's stderr for the esbuild parse-error fingerprint and extract a
- * normalized {@link ParsedWorkflowError}. Returns null if nothing looks like
- * a parse error — runtime errors, module-not-found, etc. pass through.
- *
- * We match two common esbuild output formats:
- *   1. `/path/file.ts:LINE:COL: ERROR: message` (most common, one-liner)
- *   2. `✘ [ERROR] message\n\n    /path/file.ts:LINE:COL:\n      LINE │ text\n           ╵ pointer`
- *      (pretty-printed, multi-line)
- */
-export function parseTsxStderr(stderr: string): ParsedWorkflowError | null {
-  // Strip ANSI color codes so our regex isn't thrown off by escape sequences.
-  // eslint-disable-next-line no-control-regex
-  const clean = stderr.replace(/\x1b\[[0-9;]*m/g, '');
-
-  // Format 1: file:line:col: ERROR: message
-  const inlineMatch = clean.match(/(\/[^\s:]+\.(?:ts|tsx|mts|cts)):(\d+):(\d+):\s*ERROR:\s*([^\n]+)/);
-  if (inlineMatch) {
-    return {
-      file: inlineMatch[1]!,
-      line: Number(inlineMatch[2]),
-      column: Number(inlineMatch[3]),
-      message: inlineMatch[4]!.trim(),
-    };
-  }
-
-  // Format 2: ✘ [ERROR] message ... file:line:col:
-  const prettyError = clean.match(/✘\s*\[ERROR\]\s*([^\n]+)/);
-  if (prettyError) {
-    const locationMatch = clean.match(/(\/[^\s:]+\.(?:ts|tsx|mts|cts)):(\d+):(\d+):/);
-    if (locationMatch) {
-      return {
-        file: locationMatch[1]!,
-        line: Number(locationMatch[2]),
-        column: Number(locationMatch[3]),
-        message: prettyError[1]!.trim(),
-      };
-    }
-  }
-
-  // Format 3: "Transform failed with N errors" — loose fallback, any file+loc pair
-  if (/Transform failed with \d+ error/i.test(clean) || /TransformError/.test(clean)) {
-    const looseMatch = clean.match(/(\/[^\s:]+\.(?:ts|tsx|mts|cts)):(\d+):(\d+)/);
-    if (looseMatch) {
-      return {
-        file: looseMatch[1]!,
-        line: Number(looseMatch[2]),
-        column: Number(looseMatch[3]),
-        message: 'TypeScript parse error (see tsx output above)',
-      };
-    }
-  }
-
-  return null;
-}
-
-function resolveLocalTypeScriptImport(fromFile: string, specifier: string): string | null {
-  if (!specifier.startsWith('.') && !specifier.startsWith('/')) {
-    return null;
-  }
-
-  const basePath = specifier.startsWith('/')
-    ? path.resolve(specifier)
-    : path.resolve(path.dirname(fromFile), specifier);
-  const ext = path.extname(basePath);
-  const candidates =
-    ext === '.js' || ext === '.mjs' || ext === '.cjs'
-      ? [
-          `${basePath.slice(0, -ext.length)}.ts`,
-          `${basePath.slice(0, -ext.length)}.tsx`,
-          `${basePath.slice(0, -ext.length)}.mts`,
-          `${basePath.slice(0, -ext.length)}.cts`,
-          basePath,
-        ]
-      : ext
-        ? [basePath]
-        : [
-            `${basePath}.ts`,
-            `${basePath}.tsx`,
-            `${basePath}.mts`,
-            `${basePath}.cts`,
-            path.join(basePath, 'index.ts'),
-            path.join(basePath, 'index.tsx'),
-            path.join(basePath, 'index.mts'),
-            path.join(basePath, 'index.cts'),
-          ];
-
-  for (const candidate of candidates) {
-    if (/\.(?:ts|tsx|mts|cts)$/.test(candidate) && fs.existsSync(candidate)) {
-      return candidate;
-    }
-  }
-  return null;
-}
-
-function findStaticLocalTypeScriptImports(filePath: string, source: string): string[] {
-  const imports: string[] = [];
-  const staticImportPattern =
-    /(?:^|[\n;])\s*(?:import\s+(?:type\s+)?(?:[^'"]*?\s+from\s+)?|export\s+(?:type\s+)?[^'"]*?\s+from\s+)['"]([^'"]+)['"]/g;
-  for (const match of source.matchAll(staticImportPattern)) {
-    const resolved = resolveLocalTypeScriptImport(filePath, match[1]!);
-    if (resolved) {
-      imports.push(resolved);
-    }
-  }
-  return imports;
-}
-
-export function shouldSkipNodeStripTypesPreflight(
-  filePath: string,
-  seen = new Set<string>(),
-  isEntry = true
-): boolean {
-  const resolvedPath = path.resolve(filePath);
-  if (seen.has(resolvedPath)) {
-    return false;
-  }
-  seen.add(resolvedPath);
-
-  let source: string;
-  try {
-    source = fs.readFileSync(resolvedPath, 'utf8');
-  } catch {
-    return !isEntry;
-  }
-
-  // Node's strip-only runner cannot parse TypeScript constructs that require
-  // code generation. Detecting them before execution lets valid workflows go
-  // straight to tsx without retrying after user code may have already run.
-  if (containsNodeStripTypesUnsupportedSyntax(source)) {
-    return true;
-  }
-  return findStaticLocalTypeScriptImports(resolvedPath, source).some((importPath) =>
-    shouldSkipNodeStripTypesPreflight(importPath, seen, false)
-  );
-}
-
-function stripCommentsAndStringsForSyntaxScan(source: string): string {
-  let output = '';
-  for (let index = 0; index < source.length; index += 1) {
-    const char = source[index]!;
-    const next = source[index + 1];
-
-    if (char === '/' && next === '/') {
-      output += '  ';
-      index += 1;
-      while (index + 1 < source.length && source[index + 1] !== '\n') {
-        output += ' ';
-        index += 1;
-      }
-      continue;
-    }
-
-    if (char === '/' && next === '*') {
-      output += '  ';
-      index += 1;
-      while (index + 1 < source.length) {
-        index += 1;
-        const current = source[index]!;
-        output += current === '\n' ? '\n' : ' ';
-        if (current === '*' && source[index + 1] === '/') {
-          output += ' ';
-          index += 1;
-          break;
-        }
-      }
-      continue;
-    }
-
-    if (char === '"' || char === "'" || char === '`') {
-      const quote = char;
-      output += ' ';
-      while (index + 1 < source.length) {
-        index += 1;
-        const current = source[index]!;
-        output += current === '\n' ? '\n' : ' ';
-        if (current === '\\') {
-          if (index + 1 < source.length) {
-            index += 1;
-            output += source[index] === '\n' ? '\n' : ' ';
-          }
-          continue;
-        }
-        if (current === quote) {
-          break;
-        }
-      }
-      continue;
-    }
-
-    output += char;
-  }
-  return output;
-}
-
-function containsNodeStripTypesUnsupportedSyntax(source: string): boolean {
-  const scanSource = stripCommentsAndStringsForSyntaxScan(source);
-  return (
-    /(?:^|[;\n{}])\s*(?:export\s+)?(?:const\s+)?enum\s+[A-Za-z_$][\w$]*/.test(scanSource) ||
-    /(?:^|[;\n{}])\s*(?:export\s+)?(?:declare\s+)?(?:namespace|module)\s+[A-Za-z_$][\w$]*/.test(scanSource) ||
-    /\bconstructor\s*\([^)]*\b(?:public|private|protected|readonly)\s+(?:readonly\s+)?[A-Za-z_$][\w$]*/.test(
-      scanSource
-    ) ||
-    /(?:^|[;\n{}])\s*import\s+[A-Za-z_$][\w$]*\s*=\s*(?:require\s*\(|[A-Za-z_$][\w$]*(?:\.[A-Za-z_$][\w$]*)*)/.test(
-      scanSource
-    ) ||
-    /(?:^|[;\n{}])\s*export\s*=\s*/.test(scanSource)
-  );
-}
-
-/**
- * Format a {@link ParsedWorkflowError} as an actionable workflow-author error
- * message with hints keyed off the most common mistakes in `command:` /
- * `task:` template literals.
- */
-export function formatWorkflowParseError(parsed: ParsedWorkflowError): Error {
-  const where =
-    parsed.line !== undefined
-      ? `${parsed.file}:${parsed.line}${parsed.column !== undefined ? `:${parsed.column}` : ''}`
-      : parsed.file;
-
-  const hints: string[] = [];
-  const text = parsed.message;
-
-  if (/Expected "\}" but found/i.test(text) || /Unterminated template literal/i.test(text)) {
-    hints.push(
-      'Likely a JavaScript template literal metacharacter inside a `command:` or `task:` block. ' +
-        'Inside workflow .ts files every `command: \\`...\\`` is a JavaScript template literal — ' +
-        'backticks terminate it and `${...}` triggers JS interpolation before the shell ever sees the string.',
-      'Fixes: use single quotes instead of backticks in prose/commit messages; ' +
-        'for shell variables use `$VAR` (no braces) or escape as `\\${VAR}`; ' +
-        'never write literal `\\n` inside a shell comment (it becomes a real newline).'
-    );
-  }
-
-  if (/Unexpected "\$"/.test(text)) {
-    hints.push(
-      'Unexpected `$` inside a template literal usually means `${...}` was interpreted as JS interpolation. ' +
-        'Escape it as `\\${...}` or drop the braces and use plain `$VAR`.'
-    );
-  }
-
-  if (/Expected identifier/.test(text) && /template/i.test(text)) {
-    hints.push(
-      'A template literal interpolation `${...}` needs a valid JS expression inside. ' +
-        'If you meant a shell variable, escape the `$` or drop the braces.'
-    );
-  }
-
-  const lines = ['', `Workflow file failed to parse: ${where}`, `  ${text}`];
-  if (parsed.lineText) {
-    lines.push(`  | ${parsed.lineText}`);
-    if (parsed.column !== undefined && parsed.column >= 0) {
-      lines.push(`  | ${' '.repeat(parsed.column)}^`);
-    }
-  }
-  if (hints.length > 0) {
-    lines.push('');
-    for (const hint of hints) {
-      lines.push(`Hint: ${hint}`);
-    }
-  }
-  lines.push('');
-
-  const wrapped = new Error(lines.join('\n'));
-  (wrapped as Error & { code?: string }).code = 'WORKFLOW_PARSE_ERROR';
-  return wrapped;
-}
-
-// ── Spawn helper ─────────────────────────────────────────────────────────────
-
-/**
- * Spawn a TypeScript runner (tsx, ts-node, npx tsx) with stdin/stdout
- * inherited and stderr tee'd to both the user's terminal and an internal
- * buffer. The buffer is inspected on non-zero exit to produce actionable
- * error messages for workflow parse errors.
- *
- * Why this instead of `spawnSync({ stdio: 'inherit' })`: sync + inherit makes
- * it impossible to post-process stderr. Async + tee gives us the best of
- * both worlds — live progress for the user AND captured stderr for the
- * parse-error wrapper.
- */
-async function spawnRunnerWithStderrCapture(
-  command: string,
-  args: string[],
-  env: NodeJS.ProcessEnv
-): Promise<SpawnRunnerResult> {
-  return new Promise((resolve) => {
-    const child = spawnProcess(command, args, {
-      stdio: ['inherit', 'inherit', 'pipe'],
-      env,
-    });
-
-    let stderrBuf = '';
-
-    child.stderr?.on('data', (chunk: Buffer | string) => {
-      const text = typeof chunk === 'string' ? chunk : chunk.toString('utf8');
-      stderrBuf += text;
-      try {
-        process.stderr.write(text);
-      } catch {
-        // stderr closed — keep buffering for post-processing.
-      }
-    });
-
-    child.on('error', (err: NodeJS.ErrnoException) => {
-      resolve({ status: null, stderr: stderrBuf, error: err });
-    });
-
-    child.on('close', (status) => {
-      resolve({ status, stderr: stderrBuf });
-    });
-  });
-}
-
-// ── Main entry ───────────────────────────────────────────────────────────────
-
-/**
- * Run a `.ts`, `.tsx`, or `.py` workflow script locally.
- *
- * For TypeScript files, tries Node's `--experimental-strip-types` first
- * (Node 22.6+), then falls back to `tsx`, `ts-node`, and finally `npx tsx`.
- * For Python files, tries `python3` then `python`.
- *
- * Throws on non-zero exit. The error message includes the run id (when
- * the script wrote one to `AGENT_RELAY_RUN_ID_FILE`) so callers can resume
- * with `--start-from <step> --previous-run-id <id>`.
- */
-export async function runScriptWorkflow(
-  filePath: string,
-  options: RunScriptWorkflowOptions = {}
-): Promise<void> {
-  diag(`runScriptWorkflow: resolving ${filePath}`);
-  const resolved = path.resolve(filePath);
-  if (!fs.existsSync(resolved)) {
-    throw new Error(`File not found: ${resolved}`);
-  }
-  const ext = path.extname(resolved).toLowerCase();
-  const runIdFile = path.join(
-    process.cwd(),
-    '.agent-relay',
-    `script-run-id-${process.pid}-${Date.now()}.txt`
-  );
-  try {
-    fs.mkdirSync(path.dirname(runIdFile), { recursive: true });
-  } catch {
-    // Run-id hint is optional — don't abort if directory is not writable
-  }
-  const childEnv: NodeJS.ProcessEnv = { ...process.env, AGENT_RELAY_RUN_ID_FILE: runIdFile };
-  if (options.dryRun) childEnv.DRY_RUN = 'true';
-  if (options.resume) childEnv.RESUME_RUN_ID = options.resume;
-  if (options.startFrom) childEnv.START_FROM = options.startFrom;
-  if (options.previousRunId) childEnv.PREVIOUS_RUN_ID = options.previousRunId;
-
-  const augmentErrorWithRunId = (err: any): never => {
-    try {
-      if (fs.existsSync(runIdFile)) {
-        const runId = fs.readFileSync(runIdFile, 'utf8').trim();
-        if (runId && typeof err?.message === 'string' && !err.message.includes('Run ID:')) {
-          err.message += `
-Run ID: ${runId}`;
-        }
-      }
-    } catch {
-      // Ignore run-id hint failures and preserve the original error.
-    } finally {
-      try {
-        fs.rmSync(runIdFile, { force: true });
-      } catch {
-        // Ignore cleanup failure.
-      }
-    }
-    throw err;
-  };
-  const cleanupRunIdFile = () => {
-    try {
-      fs.rmSync(runIdFile, { force: true });
-    } catch {
-      /* ignore */
-    }
-  };
-
-  if (ext === '.ts' || ext === '.tsx') {
-    diag('runScriptWorkflow: ensureLocalSdkWorkflowRuntime start');
-    ensureLocalSdkWorkflowRuntime(path.dirname(resolved));
-    diag('runScriptWorkflow: ensureLocalSdkWorkflowRuntime done');
-
-    // Wrap a runner exit in an actionable workflow parse error if the
-    // captured stderr looks like esbuild tripped on a template literal.
-    // Otherwise fall through to a plain exit-code error (stderr was
-    // already live-streamed to the terminal).
-    const wrapRunnerError = (runner: string, result: SpawnRunnerResult): Error => {
-      const parsed = parseTsxStderr(result.stderr);
-      if (parsed) {
-        return formatWorkflowParseError(parsed);
-      }
-      return new Error(`${runner} exited with code ${result.status}`);
-    };
-
-    // Prefer Node's built-in type stripping (Node 22.6+) — no extra deps,
-    // no tsx CJS resolver quirks walking node_modules. Falls through to
-    // tsx/ts-node on older Nodes (they exit non-zero with an unknown-flag
-    // error, not ENOENT, so we treat any non-zero from this runner as a
-    // "try the next runner" signal rather than a real user error).
-    const runners: Array<{ label: string; bin: string; preArgs: string[] }> = [
-      {
-        label: 'node --experimental-strip-types',
-        bin: 'node',
-        preArgs: ['--experimental-strip-types', '--no-warnings=ExperimentalWarning'],
-      },
-      { label: 'tsx', bin: 'tsx', preArgs: [] },
-      { label: 'ts-node', bin: 'ts-node', preArgs: [] },
-    ];
-    for (const { label, bin, preArgs } of runners) {
-      if (bin === 'node' && shouldSkipNodeStripTypesPreflight(resolved)) {
-        diag(`runScriptWorkflow: ${label} cannot parse this TypeScript file — trying next`);
-        continue;
-      }
-      diag(`runScriptWorkflow: trying runner ${label}`);
-      const result = await spawnRunnerWithStderrCapture(bin, [...preArgs, resolved], childEnv);
-      if (result.error) {
-        if ((result.error as NodeJS.ErrnoException).code === 'ENOENT') {
-          diag(`runScriptWorkflow: runner ${label} returned ENOENT — trying next`);
-          continue;
-        }
-        return augmentErrorWithRunId(result.error);
-      }
-      if (result.status !== 0) {
-        // Node exits with code 9 ("Invalid Argument") when it doesn't
-        // recognise --experimental-strip-types (Node <22.6). Other non-zero
-        // exits may have occurred after entry module evaluation, so do not
-        // retry them under another runner.
-        if (bin === 'node' && result.status === 9) {
-          diag(`runScriptWorkflow: runner ${label} cannot handle this TypeScript file — trying next`);
-          continue;
-        }
-        return augmentErrorWithRunId(wrapRunnerError(label, result));
-      }
-      diag(`runScriptWorkflow: runner ${label} completed exit=0`);
-      cleanupRunIdFile();
-      return;
-    }
-    diag('runScriptWorkflow: falling back to npx tsx');
-    const npxResult = await spawnRunnerWithStderrCapture('npx', ['tsx', resolved], childEnv);
-    if (npxResult.error) {
-      return augmentErrorWithRunId(npxResult.error);
-    }
-    if (npxResult.status !== 0) {
-      return augmentErrorWithRunId(wrapRunnerError('npx tsx', npxResult));
-    }
-    diag('runScriptWorkflow: npx tsx completed');
-    cleanupRunIdFile();
-    return;
-  }
-  if (ext === '.py') {
-    const runners = ['python3', 'python'];
-    for (const runner of runners) {
-      diag(`runScriptWorkflow: trying runner ${runner}`);
-      const spawnResult = spawnSync(runner, [resolved], {
-        stdio: 'inherit',
-        env: childEnv,
-      });
-      if (spawnResult.error) {
-        if ((spawnResult.error as NodeJS.ErrnoException).code === 'ENOENT') {
-          diag(`runScriptWorkflow: runner ${runner} returned ENOENT — trying next`);
-          continue;
-        }
-        return augmentErrorWithRunId(spawnResult.error);
-      }
-      if (spawnResult.status !== 0) {
-        const err = new Error(`${runner} exited with code ${spawnResult.status}`);
-        return augmentErrorWithRunId(err);
-      }
-      diag(`runScriptWorkflow: runner ${runner} completed exit=0`);
-      cleanupRunIdFile();
-      return;
-    }
-    cleanupRunIdFile();
-    throw new Error('Python not found. Install Python 3.10+ to run .py workflow files.');
-  }
-  try {
-    fs.rmSync(runIdFile, { force: true });
-  } catch {
-    // Ignore cleanup failure.
-  }
-  throw new Error(`Unsupported file type: ${ext}. Use .yaml, .yml, .ts, or .py`);
-}
diff --git a/packages/sdk/src/workflows/run-summary-table.ts b/packages/sdk/src/workflows/run-summary-table.ts
deleted file mode 100644
index 9211a1a1f..000000000
--- a/packages/sdk/src/workflows/run-summary-table.ts
+++ /dev/null
@@ -1,152 +0,0 @@
-import type { CliSessionReport } from './cli-session-collector.js';
-import type { RunSummaryBudgetData, StepBudgetStatus } from './budget-tracker.js';
-import type { StepOutcome } from './trajectory.js';
-
-function formatCurrency(value: number | null | undefined): string {
-  return typeof value === 'number' ? `$${value.toFixed(2)}` : '--';
-}
-
-function formatTokens(report: CliSessionReport | undefined): string {
-  if (!report?.tokens) return '--';
-  const total = report.tokens.input + report.tokens.output + report.tokens.cacheRead;
-  return total.toLocaleString('en-US');
-}
-
-function formatBudgetValue(value: number | undefined): string {
-  return typeof value === 'number' ? value.toLocaleString('en-US') : '--';
-}
-
-function formatBudget(status: StepBudgetStatus | undefined): string {
-  if (!status) return '--';
-
-  const rendered = `${formatBudgetValue(status.used)}/${formatBudgetValue(status.limit)}`;
-  return status.over ? `${rendered} [OVER]` : rendered;
-}
-
-function formatDuration(durationMs: number | null | undefined): string {
-  if (typeof durationMs !== 'number' || !Number.isFinite(durationMs)) return '--';
-  if (durationMs < 1000) return `${durationMs}ms`;
-
-  const totalSeconds = Math.round(durationMs / 1000);
-  const minutes = Math.floor(totalSeconds / 60);
-  const seconds = totalSeconds % 60;
-  return minutes > 0 ? `${minutes}m ${seconds}s` : `${seconds}s`;
-}
-
-function truncate(value: string, length: number): string {
-  if (value.length <= length) return value;
-  if (length <= 1) return value.slice(0, length);
-  return `${value.slice(0, length - 1)}…`;
-}
-
-function pad(value: string, width: number, align: 'left' | 'right' = 'left'): string {
-  return align === 'right' ? value.padStart(width, ' ') : value.padEnd(width, ' ');
-}
-
-function formatErrors(outcome: StepOutcome, report: CliSessionReport | undefined): string {
-  const count = report?.errors.length ?? 0;
-  if (count === 0) return outcome.status === 'failed' && outcome.error ? '1' : '--';
-  if (outcome.status === 'completed') return `${count} (fixed)`;
-  return String(count);
-}
-
-export function formatRunSummaryTable(
-  outcomes: StepOutcome[],
-  reports: Map<string, CliSessionReport>,
-  budgetData?: RunSummaryBudgetData
-): string {
-  // Only show the Cost column when at least one report has reliable cost data
-  // (currently only OpenCode populates cost; Claude and Codex return null)
-  const hasCost = Array.from(reports.values()).some((r) => typeof r.cost === 'number' && r.cost > 0);
-  const hasBudget = Boolean(budgetData);
-
-  const headers = hasCost
-    ? hasBudget
-      ? ['Step', 'Status', 'Model', 'Cost', 'Tokens', 'Budget', 'Duration', 'Errors']
-      : ['Step', 'Status', 'Model', 'Cost', 'Tokens', 'Duration', 'Errors']
-    : hasBudget
-      ? ['Step', 'Status', 'Model', 'Tokens', 'Budget', 'Duration', 'Errors']
-      : ['Step', 'Status', 'Model', 'Tokens', 'Duration', 'Errors'];
-  const widths = hasCost
-    ? hasBudget
-      ? [20, 6, 16, 8, 10, 18, 10, 10]
-      : [20, 6, 16, 8, 10, 10, 10]
-    : hasBudget
-      ? [20, 6, 16, 10, 18, 10, 10]
-      : [20, 6, 16, 10, 10, 10];
-  const lines: string[] = [];
-
-  lines.push(
-    headers
-      .map((h, i) => {
-        const align = i <= 2 ? 'left' : 'right';
-        return pad(h, widths[i], align);
-      })
-      .join('  ')
-  );
-
-  let totalCost = 0;
-  let totalTokens = 0;
-  let totalDurationMs = 0;
-
-  for (const outcome of outcomes) {
-    const report = reports.get(outcome.name);
-    const reportDuration = report?.durationMs ?? outcome.durationMs;
-    const reportTokens = report?.tokens
-      ? report.tokens.input + report.tokens.output + report.tokens.cacheRead
-      : 0;
-    const budgetStatus = budgetData?.steps.get(outcome.name);
-
-    if (typeof report?.cost === 'number') totalCost += report.cost;
-    totalTokens += reportTokens;
-    if (typeof reportDuration === 'number') totalDurationMs += reportDuration;
-
-    const cols: string[] = [
-      pad(truncate(outcome.name, widths[0]), widths[0]),
-      pad(outcome.status === 'failed' ? 'FAIL' : outcome.status === 'completed' ? 'pass' : 'skip', widths[1]),
-      pad(truncate(report?.model ?? '--', widths[2]), widths[2]),
-    ];
-    if (hasCost) cols.push(pad(formatCurrency(report?.cost), widths[3], 'right'));
-    const tokenIdx = hasCost ? 4 : 3;
-    cols.push(pad(formatTokens(report), widths[tokenIdx], 'right'));
-    if (hasBudget) cols.push(pad(formatBudget(budgetStatus), widths[tokenIdx + 1], 'right'));
-    const durationIdx = hasBudget ? tokenIdx + 2 : tokenIdx + 1;
-    const errorsIdx = hasBudget ? tokenIdx + 3 : tokenIdx + 2;
-    cols.push(pad(formatDuration(reportDuration), widths[durationIdx], 'right'));
-    cols.push(pad(formatErrors(outcome, report), widths[errorsIdx], 'right'));
-
-    lines.push(cols.join('  '));
-
-    if (outcome.status === 'failed') {
-      const firstError = report?.errors[0];
-      if (firstError) {
-        lines.push(`  └─ Error [turn ${firstError.turn}] ${truncate(firstError.text, 120)}`);
-      }
-    }
-  }
-
-  const totalLabelWidth = widths[0] + widths[1] + widths[2] + 4;
-  lines.push('─'.repeat(lines[0].length));
-
-  const totalCols: string[] = [pad('Total', totalLabelWidth)];
-  if (hasCost) totalCols.push(pad(formatCurrency(totalCost), widths[3], 'right'));
-  const tokenIdx = hasCost ? 4 : 3;
-  totalCols.push(
-    pad(totalTokens > 0 ? totalTokens.toLocaleString('en-US') : '--', widths[tokenIdx], 'right')
-  );
-  if (hasBudget) {
-    const workflowBudget = budgetData?.workflow;
-    const budgetTotal =
-      workflowBudget && (workflowBudget.limit !== undefined || workflowBudget.used > 0)
-        ? `${formatBudgetValue(workflowBudget.used)}/${formatBudgetValue(workflowBudget.limit)}`
-        : '--';
-    totalCols.push(pad(budgetTotal, widths[tokenIdx + 1], 'right'));
-  }
-  const durationIdx = hasBudget ? tokenIdx + 2 : tokenIdx + 1;
-  const errorsIdx = hasBudget ? tokenIdx + 3 : tokenIdx + 2;
-  totalCols.push(pad(formatDuration(totalDurationMs), widths[durationIdx], 'right'));
-  totalCols.push(pad('', widths[errorsIdx], 'right'));
-  lines.push(totalCols.join('  '));
-
-  return lines.map((line) => `  ${line}`).join('\n');
-}
diff --git a/packages/sdk/src/workflows/run.ts b/packages/sdk/src/workflows/run.ts
deleted file mode 100644
index 9e3614b24..000000000
--- a/packages/sdk/src/workflows/run.ts
+++ /dev/null
@@ -1,94 +0,0 @@
-import type { AgentRelayOptions } from '../relay.js';
-import type { DryRunReport, TrajectoryConfig, WorkflowRunRow } from './types.js';
-import { WorkflowRunner, type WorkflowEventListener } from './runner.js';
-import { createDefaultEventLogger } from './default-logger.js';
-import { formatDryRunReport } from './dry-run-format.js';
-import type { VariableContext } from './template-resolver.js';
-
-/**
- * Options for the `runWorkflow` convenience function.
- */
-export interface RunWorkflowOptions {
-  /** Workflow name within the YAML file. Defaults to the first workflow. */
-  workflow?: string;
-  /** Template variable substitutions for {{variable}} placeholders. */
-  vars?: VariableContext;
-  /** Working directory. Defaults to process.cwd(). */
-  cwd?: string;
-  /** AgentRelay options (all optional — broker starts automatically). */
-  relay?: AgentRelayOptions;
-  /** Progress callback for workflow events. */
-  onEvent?: WorkflowEventListener;
-  /** Override trajectory config. Set to false to disable trajectory recording. */
-  trajectories?: TrajectoryConfig | false;
-  /** Validate and show execution plan without running. */
-  dryRun?: boolean;
-  /** Resume a failed run by its ID instead of starting fresh. */
-  resume?: string;
-  /** Skip to a specific step (re-uses cached outputs from earlier steps). */
-  startFrom?: string;
-  /** Previous run ID whose cached step outputs are used with startFrom. */
-  previousRunId?: string;
-}
-
-/**
- * Run a workflow from a relay.yaml file with zero configuration.
- *
- * @example
- * ```typescript
- * import { runWorkflow } from "@agent-relay/sdk/workflows";
- *
- * const result = await runWorkflow("workflows/daytona-migration.yaml");
- * console.log(result.status); // "completed" | "failed"
- * ```
- */
-export async function runWorkflow(
-  yamlPath: string,
-  options: RunWorkflowOptions & { dryRun: true }
-): Promise<DryRunReport>;
-export async function runWorkflow(yamlPath: string, options?: RunWorkflowOptions): Promise<WorkflowRunRow>;
-export async function runWorkflow(
-  yamlPath: string,
-  options: RunWorkflowOptions = {}
-): Promise<WorkflowRunRow | DryRunReport> {
-  const runner = new WorkflowRunner({
-    cwd: options.cwd,
-    relay: options.relay,
-  });
-
-  const config = await runner.parseYamlFile(yamlPath);
-
-  // Allow programmatic trajectory override
-  if (options.trajectories !== undefined) {
-    config.trajectories = options.trajectories;
-  }
-
-  // Auto-detect DRY_RUN env var so existing scripts get dry-run for free
-  const isDryRun = options.dryRun ?? !!process.env.DRY_RUN;
-
-  if (isDryRun) {
-    const report = runner.dryRun(config, options.workflow, options.vars);
-    console.log(formatDryRunReport(report));
-    return report;
-  }
-
-  // Attach default console logger so callers get progress output without
-  // needing to wire up their own handler.
-  runner.on(createDefaultEventLogger('normal'));
-
-  if (options.onEvent) {
-    runner.on(options.onEvent);
-  }
-
-  // Resume a previous run if requested
-  const resumeRunId = options.resume ?? process.env.RESUME_RUN_ID;
-  if (resumeRunId) {
-    return runner.resume(resumeRunId, options.vars);
-  }
-
-  const startFrom = options.startFrom ?? process.env.START_FROM;
-  const previousRunId = options.previousRunId ?? process.env.PREVIOUS_RUN_ID;
-  const executeOptions = startFrom ? { startFrom, previousRunId } : undefined;
-
-  return runner.execute(config, options.workflow, options.vars, executeOptions);
-}
diff --git a/packages/sdk/src/workflows/runner.ts b/packages/sdk/src/workflows/runner.ts
deleted file mode 100644
index 278a1fe94..000000000
--- a/packages/sdk/src/workflows/runner.ts
+++ /dev/null
@@ -1,8059 +0,0 @@
-/**
- * WorkflowRunner — parses relay.yaml, validates config, resolves templates,
- * executes steps (sequential/parallel/DAG), runs verification checks,
- * persists state to DB, and supports pause/resume/abort with retries.
- */
-
-import { spawn as cpSpawn } from 'node:child_process';
-import { randomBytes } from 'node:crypto';
-import {
-  createWriteStream,
-  existsSync,
-  mkdtempSync,
-  mkdirSync,
-  readFileSync,
-  readdirSync,
-  renameSync,
-  statSync,
-  writeFileSync,
-} from 'node:fs';
-import type { Dirent, WriteStream } from 'node:fs';
-import { readFile, writeFile, mkdir, unlink } from 'node:fs/promises';
-import { tmpdir } from 'node:os';
-import path from 'node:path';
-import chalk from 'chalk';
-import ignore from 'ignore';
-
-import { parse as parseYaml } from 'yaml';
-import { stripAnsi as stripAnsiFn } from '../pty.js';
-import type { BrokerEvent } from '../protocol.js';
-import { resolveSpawnPolicy } from '../spawn-from-env.js';
-import { getCliDefinition } from '../cli-registry.js';
-import { resolveCliSync } from '../cli-resolver.js';
-import {
-  buildNormalizedProxyEnv,
-  getStrippedApiKeyVars,
-  resolveProxyEnv,
-  resolveProxyTokenFromEnv,
-  resolveProxyUrlFromEnv,
-} from './proxy-env.js';
-
-import {
-  loadCustomSteps,
-  resolveAllCustomSteps,
-  validateCustomStepsUsage,
-  CustomStepsParseError,
-  CustomStepResolutionError,
-} from './custom-steps.js';
-import { provisionWorkflowAgents, resolveAgentPermissions } from '../provisioner/index.js';
-import {
-  createLocalJwksKeyPair,
-  importPrivateKeyPem,
-  RELAYAUTH_JWT_KID_ENV,
-  RELAYAUTH_JWT_PRIVATE_KEY_PEM_ENV,
-  type LocalJwksSigningKey,
-} from '../provisioner/local-jwks.js';
-import type { MountHandle } from '../provisioner/mount.js';
-import { collectCliSession, type CliSessionReport } from './cli-session-collector.js';
-import { executeApiStep } from './api-executor.js';
-import { BudgetExceededError, BudgetTracker } from './budget-tracker.js';
-import { ChannelMessenger, scrubForChannel as scrubWorkflowOutputForChannel } from './channel-messenger.js';
-import { InMemoryWorkflowDb } from './memory-db.js';
-import { buildCommand as buildProcessCommand, spawnProcess } from './process-spawner.js';
-import { createProcessBackendExecutor } from './process-backend-executor.js';
-import { formatRunSummaryTable } from './run-summary-table.js';
-import {
-  StepExecutor as WorkflowStepLifecycleExecutor,
-  type StepExecutorDeps as WorkflowStepLifecycleExecutorDeps,
-} from './step-executor.js';
-import {
-  interpolateStepTask as interpolateStepTaskTemplate,
-  resolveDotPath as resolveTemplateDotPath,
-  resolveTemplate,
-  TemplateResolver,
-  type VariableContext,
-} from './template-resolver.js';
-import type {
-  AccessPreset,
-  AgentCli,
-  AgentDefinition,
-  AgentPermissions,
-  AgentPreset,
-  CompletionEvidenceChannelOrigin,
-  CompletionEvidenceChannelPost,
-  CompletionEvidenceFileChange,
-  CompletionEvidenceSignal,
-  CompletionEvidenceSignalKind,
-  CompletionEvidenceToolSideEffect,
-  DryRunReport,
-  DryRunWave,
-  ErrorHandlingConfig,
-  IdleNudgeConfig,
-  PathDefinition,
-  PermissionProfileDefinition,
-  PreflightCheck,
-  RelayYamlConfig,
-  StepCompletionDecision,
-  StepCompletionEvidence,
-  SwarmPattern,
-  VerificationCheck,
-  WorkflowDefinition,
-  WorkflowOwnerDecision,
-  WorkflowRunRow,
-  WorkflowRunStatus,
-  WorkflowStep,
-  WorkflowExecuteOptions,
-  WorkflowStepCompletionReason,
-  WorkflowStepRow,
-  WorkflowStepStatus,
-  ProcessBackend,
-  RunnerStepExecutor,
-} from './types.js';
-import { WorkflowTrajectory, type StepOutcome } from './trajectory.js';
-import {
-  runVerification,
-  stripInjectedTaskEcho,
-  type VerificationOptions,
-  type VerificationResult,
-  WorkflowCompletionError,
-} from './verification.js';
-
-// ── AgentRelay SDK imports ──────────────────────────────────────────────────
-
-// Import from sub-paths to avoid pulling in the full @relaycast/sdk dependency.
-import { AgentRelay } from '../relay.js';
-import type { Agent, AgentRelayOptions, AgentSpawner } from '../relay.js';
-import { RelayCast, RelayError, type AgentClient } from '@relaycast/sdk';
-
-// ── Environment filtering ──────────────────────────────────────────────────
-
-/** Keys explicitly allowed to propagate to spawned child processes. */
-const ENV_ALLOWLIST = new Set([
-  'PATH',
-  'HOME',
-  'USER',
-  'SHELL',
-  'LANG',
-  'TERM',
-  'TMPDIR',
-  'TZ',
-  'NODE_ENV',
-  'NODE_PATH',
-  'NODE_OPTIONS',
-  'NODE_EXTRA_CA_CERTS',
-  'RUST_LOG',
-  'RUST_BACKTRACE',
-  'RELAY_API_KEY',
-  'RELAYCAST_BASE_URL',
-  'RELAY_LLM_PROXY',
-  'RELAY_LLM_PROXY_URL',
-  'CREDENTIAL_PROXY_TOKEN',
-  'RELAY_LLM_PROXY_TOKEN',
-  'AGENT_RELAY_DASHBOARD_PORT',
-  'AGENT_RELAY_RUN_ID_FILE',
-  'EDITOR',
-  'VISUAL',
-  'GIT_AUTHOR_NAME',
-  'GIT_AUTHOR_EMAIL',
-  'GIT_COMMITTER_NAME',
-  'GIT_COMMITTER_EMAIL',
-  'HTTPS_PROXY',
-  'HTTP_PROXY',
-  'NO_PROXY',
-  'https_proxy',
-  'http_proxy',
-  'no_proxy',
-  'XDG_CONFIG_HOME',
-  'XDG_DATA_HOME',
-  'XDG_CACHE_HOME',
-]);
-
-type ProxyProvider = 'openai' | 'anthropic' | 'openrouter';
-
-interface ProxyModeConfig {
-  token: string;
-  url: string;
-}
-
-interface ProxyTokenClaims {
-  sub: string;
-  aud: 'relay-llm-proxy';
-  provider: ProxyProvider;
-  credentialId: string;
-  budget?: number;
-  exp?: number;
-}
-
-interface CredentialProxyModule {
-  mintProxyToken: (claims: ProxyTokenClaims, secret: string) => Promise<string>;
-}
-
-/** Return a filtered copy of process.env containing only allowlisted keys. */
-function filteredEnv(extra?: Record<string, string | undefined>): Record<string, string | undefined> {
-  const env: Record<string, string | undefined> = {};
-  for (const key of ENV_ALLOWLIST) {
-    if (process.env[key] !== undefined) {
-      env[key] = process.env[key];
-    }
-  }
-  if (extra) {
-    Object.assign(env, extra);
-  }
-  return env;
-}
-
-// ── DB adapter interface ────────────────────────────────────────────────────
-
-/** Minimal DB adapter so the runner is not coupled to a specific driver. */
-export interface WorkflowDb {
-  insertRun(run: WorkflowRunRow): Promise<void>;
-  updateRun(id: string, patch: Partial<WorkflowRunRow>): Promise<void>;
-  getRun(id: string): Promise<WorkflowRunRow | null>;
-
-  insertStep(step: WorkflowStepRow): Promise<void>;
-  updateStep(id: string, patch: Partial<WorkflowStepRow>): Promise<void>;
-  getStepsByRunId(runId: string): Promise<WorkflowStepRow[]>;
-}
-
-/** Result returned by spawnAndWait / execNonInteractive with optional process exit info. */
-interface SpawnResult {
-  output: string;
-  exitCode?: number;
-  exitSignal?: string;
-  promptTaskText?: string;
-}
-
-/** Error carrying exit code/signal from a failed subprocess spawn. */
-class SpawnExitError extends Error {
-  exitCode?: number;
-  exitSignal?: string;
-  constructor(message: string, exitCode?: number, exitSignal?: string | null) {
-    super(message);
-    this.name = 'SpawnExitError';
-    this.exitCode = exitCode;
-    this.exitSignal = exitSignal ?? undefined;
-  }
-}
-
-interface CompletionDecisionResult {
-  completionReason: WorkflowStepCompletionReason;
-  ownerDecision?: WorkflowOwnerDecision;
-  reason?: string;
-}
-
-// ── Events ──────────────────────────────────────────────────────────────────
-
-export type WorkflowEvent =
-  | { type: 'run:started'; runId: string }
-  | { type: 'run:completed'; runId: string }
-  | { type: 'run:failed'; runId: string; error: string }
-  | { type: 'run:cancelled'; runId: string }
-  | { type: 'broker:event'; runId: string; event: BrokerEvent }
-  | { type: 'step:started'; runId: string; stepName: string }
-  | {
-      type: 'step:owner-assigned';
-      runId: string;
-      stepName: string;
-      ownerName: string;
-      specialistName: string;
-    }
-  | {
-      type: 'step:completed';
-      runId: string;
-      stepName: string;
-      output?: string;
-      exitCode?: number;
-      exitSignal?: string;
-    }
-  | {
-      type: 'step:review-completed';
-      runId: string;
-      stepName: string;
-      reviewerName: string;
-      decision: 'approved' | 'rejected';
-    }
-  | { type: 'step:owner-timeout'; runId: string; stepName: string; ownerName: string }
-  | { type: 'step:agent-report'; runId: string; stepName: string; report: CliSessionReport }
-  | {
-      type: 'step:failed';
-      runId: string;
-      stepName: string;
-      error: string;
-      exitCode?: number;
-      exitSignal?: string;
-    }
-  | { type: 'step:skipped'; runId: string; stepName: string }
-  | { type: 'step:retrying'; runId: string; stepName: string; attempt: number }
-  | { type: 'step:nudged'; runId: string; stepName: string; nudgeCount: number }
-  | { type: 'step:force-released'; runId: string; stepName: string };
-
-export type WorkflowEventListener = (event: WorkflowEvent) => void;
-
-// ── Runner options ──────────────────────────────────────────────────────────
-
-export interface WorkflowRunnerOptions {
-  db?: WorkflowDb;
-  workspaceId?: string;
-  relay?: AgentRelayOptions;
-  cwd?: string;
-  summaryDir?: string;
-  executor?: RunnerStepExecutor;
-  envSecrets?: Record<string, string>;
-  /**
-   * Process backend for remote execution environments.
-   * When set without an explicit executor, the runner wraps it in a
-   * RunnerStepExecutor that creates isolated environments for agent and
-   * deterministic steps. The runner builds CLI commands and passes auth env,
-   * cwd, and timeout; the backend provides create/exec/destroy primitives.
-   *
-   * When both executor and processBackend are set, executor takes precedence.
-   * When neither is set, the broker spawns local child processes (default).
-   */
-  processBackend?: ProcessBackend;
-}
-
-// ── Internal step state ─────────────────────────────────────────────────────
-
-interface StepState {
-  row: WorkflowStepRow;
-  agent?: Agent;
-}
-
-interface SupervisedStep {
-  specialist: AgentDefinition;
-  owner: AgentDefinition;
-  reviewer?: AgentDefinition;
-}
-
-interface SpawnedAgentInfo {
-  requestedName: string;
-  actualName: string;
-  agent: Agent;
-}
-
-interface SpawnAndWaitOptions {
-  agentNameSuffix?: string;
-  retryAttempt?: number;
-  evidenceStepName?: string;
-  evidenceRole?: string;
-  logicalName?: string;
-  preserveOnIdle?: boolean;
-  onSpawned?: (info: SpawnedAgentInfo) => void | Promise<void>;
-  onChunk?: (info: { agentName: string; chunk: string }) => void;
-}
-
-interface SupervisedRuntimeAgent {
-  stepName: string;
-  role: 'owner' | 'specialist';
-  logicalName: string;
-}
-
-interface RuntimeStepAgent {
-  stepName: string;
-  role: string;
-  logicalName: string;
-}
-
-interface FileSnapshotEntry {
-  mtimeMs: number;
-  size: number;
-}
-
-interface StepEvidenceRecord {
-  evidence: StepCompletionEvidence;
-  baselineSnapshots: Map<string, Map<string, FileSnapshotEntry>>;
-  filesCaptured: boolean;
-}
-
-interface StepSignalParticipants {
-  ownerSenders: Set<string>;
-  workerSenders: Set<string>;
-}
-
-interface CustomVerificationFailure {
-  command: string;
-  output: string;
-}
-
-interface DiagnosticResult {
-  analysis: string;
-  metadata: {
-    agentName: string;
-    elapsedMs: number;
-    tokenCount: number;
-  };
-}
-
-interface DeterministicRepairContext {
-  step: WorkflowStep;
-  agentDef: AgentDefinition;
-  attempt: number;
-  maxRetries: number;
-  command: string;
-  cwd: string;
-  error: string;
-  output: string;
-  exitCode?: number;
-  exitSignal?: string;
-}
-
-interface AgentStepRepairContext {
-  step: WorkflowStep;
-  agentDef: AgentDefinition;
-  attempt: number;
-  maxRetries: number;
-  cwd: string;
-  error: string;
-  output: string;
-  exitCode?: number;
-  exitSignal?: string;
-  completionReason?: WorkflowStepCompletionReason;
-}
-
-type DiagnosticVerificationCheck = VerificationCheck & {
-  diagnosticAgent?: string;
-  diagnosticTimeout?: number;
-};
-
-const DEFAULT_WORKFLOW_MAX_RETRIES = 2;
-const DEFAULT_WORKFLOW_REPAIR_RETRIES = 2;
-const DEFAULT_WORKFLOW_RETRY_DELAY_MS = 1000;
-
-interface ChannelEvidenceOptions {
-  stepName?: string;
-  sender?: string;
-  actor?: string;
-  role?: string;
-  target?: string;
-  origin?: CompletionEvidenceChannelOrigin;
-}
-
-// ── CLI resolution ───────────────────────────────────────────────────────────
-
-/**
- * Resolve `cursor` to the concrete cursor agent binary available in PATH.
- * Delegates to the consolidated cli-resolver which checks PATH + well-known
- * install directories. Falls back to `agent` if nothing found.
- */
-function resolveCursorCli(): 'cursor-agent' | 'agent' {
-  const resolved = resolveCliSync('cursor');
-  return (resolved?.binary as 'cursor-agent' | 'agent') ?? 'agent';
-}
-
-function getWorkflowSdkSpawner(relay: AgentRelay, cli: AgentCli): AgentSpawner | null {
-  switch (cli) {
-    case 'claude':
-      return relay.claude;
-    case 'codex':
-      return relay.codex;
-    case 'gemini':
-      return relay.gemini;
-    case 'opencode':
-      return relay.opencode;
-    default:
-      return null;
-  }
-}
-
-function resolveWorkflowTokenSigningKey(env: NodeJS.ProcessEnv): LocalJwksSigningKey {
-  const privateKeyPem = env[RELAYAUTH_JWT_PRIVATE_KEY_PEM_ENV];
-  const kid = env[RELAYAUTH_JWT_KID_ENV];
-  if (privateKeyPem && kid) {
-    return {
-      privateKey: importPrivateKeyPem(privateKeyPem),
-      kid,
-    };
-  }
-
-  const generated = createLocalJwksKeyPair();
-  return {
-    privateKey: generated.privateKey,
-    kid: generated.kid,
-  };
-}
-
-// ── WorkflowRunner ──────────────────────────────────────────────────────────
-
-export class WorkflowRunner {
-  private readonly db: WorkflowDb;
-  private readonly workspaceId: string;
-  private readonly relayOptions: AgentRelayOptions;
-  private readonly cwd: string;
-  private readonly summaryDir: string;
-  private executor?: RunnerStepExecutor;
-  private readonly envSecrets?: Record<string, string>;
-  private readonly templateResolver: TemplateResolver;
-  private readonly channelMessenger: ChannelMessenger;
-
-  /** @internal exposed for CLI signal-handler shutdown only */
-  relay?: AgentRelay;
-  private relaycast?: RelayCast;
-  private relaycastAgent?: AgentClient;
-  private relayApiKey?: string;
-  private relayApiKeyAutoCreated = false;
-  private channel?: string;
-  private trajectory?: WorkflowTrajectory;
-  private abortController?: AbortController;
-  private paused = false;
-  private pauseResolver?: () => void;
-  private listeners: WorkflowEventListener[] = [];
-
-  /** Current config for the active run, so spawnAndWait can access swarm config. */
-  private currentConfig?: RelayYamlConfig;
-  /** Current run ID for event emission from spawnAndWait context. */
-  private currentRunId?: string;
-  /** Live Agent handles keyed by name, for hub-mediated nudging. */
-  private readonly activeAgentHandles = new Map<string, Agent>();
-  /** Per-agent workflow tokens for relay/relayfile auth across spawn modes. */
-  private readonly agentTokens = new Map<string, string>();
-  /** Per-agent credential proxy tokens keyed by logical agent definition name. */
-  private readonly proxyTokens = new Map<string, string>();
-  /** Per-agent relayfile mounts keyed by logical agent definition name. */
-  private readonly agentMounts = new Map<string, MountHandle>();
-
-  // PTY-based output capture: accumulate terminal output per-agent
-  private readonly ptyOutputBuffers = new Map<string, string[]>();
-  /** Snapshot of PTY output from the most recent failed attempt, keyed by step name. */
-  private readonly lastFailedStepOutput = new Map<string, string>();
-  /** Most recent custom verification failure details, keyed by step name. */
-  private readonly lastCustomVerificationFailure = new Map<string, CustomVerificationFailure>();
-  private readonly ptyListeners = new Map<string, (chunk: string) => void>();
-  private readonly ptyLogStreams = new Map<string, WriteStream>();
-  /** Path to workers.json so `agents:kill` can find workflow-spawned agents */
-  private readonly workersPath: string;
-  /** In-memory tracking of active workers to avoid race conditions on workers.json */
-  private readonly activeWorkers = new Map<
-    string,
-    { cli: string; task: string; spawnedAt: number; pid?: number; logFile: string }
-  >();
-  /** Mutex for serializing workers.json file access */
-  private workersFileLock: Promise<void> = Promise.resolve();
-  /** Timestamp when the current workflow run started, for elapsed-time logging. */
-  private runStartTime?: number;
-  /** Unsubscribe handle for broker stderr listener wired during a run. */
-  private unsubBrokerStderr?: () => void;
-  private unsubRelayListeners: Array<() => void> = [];
-  /** Tracks last idle log time per agent to debounce idle warnings (30s multiples). */
-  private readonly lastIdleLog = new Map<string, number>();
-  /** Tracks last logged activity type per agent to avoid duplicate status lines. */
-  private readonly lastActivity = new Map<string, string>();
-  /** Runtime-name lookup for agents participating in supervised owner flows. */
-  private readonly supervisedRuntimeAgents = new Map<string, SupervisedRuntimeAgent>();
-  /** Runtime-name lookup for active step agents so channel messages can be attributed to a step. */
-  private readonly runtimeStepAgents = new Map<string, RuntimeStepAgent>();
-  /** Per-step completion evidence collected across output, channel, files, and tool side-effects. */
-  private readonly stepCompletionEvidence = new Map<string, StepEvidenceRecord>();
-  /** Expected owner/worker identities per step so coordination signals can be validated by sender. */
-  private readonly stepSignalParticipants = new Map<string, StepSignalParticipants>();
-  /** Resolved named paths from the top-level `paths` config, keyed by name → absolute directory. */
-  private resolvedPaths = new Map<string, string>();
-  /** Tracks agent names currently assigned as reviewers (ref-counted to handle concurrent usage). */
-  private readonly activeReviewers = new Map<string, number>();
-  /** Structured CLI session reports captured during the current run, keyed by step name. */
-  private readonly agentReports = new Map<string, CliSessionReport>();
-  /** Optional per-run token budget tracker; only created when budgets are configured. */
-  private budgetTracker?: BudgetTracker;
-  private static readonly PTY_TASK_ARG_SIZE_LIMIT = 2 * 1024 * 1024; // 2 MB
-  private readonly processBackend?: ProcessBackend;
-
-  /**
-   * Build a runner from optional overrides.
-   *
-   * Every option has a fallback: an in-memory DB, the `'local'` workspace, empty relay
-   * options, and the process working directory. When no executor is passed but a
-   * process backend is, an executor is derived from that backend (with `envSecrets`
-   * forwarded as its `env`).
-   */
-  constructor(options: WorkflowRunnerOptions = {}) {
-    const { db, workspaceId, relay, cwd, summaryDir, executor, processBackend, envSecrets } = options;
-
-    this.db = db ?? new InMemoryWorkflowDb();
-    this.workspaceId = workspaceId ?? 'local';
-    this.relayOptions = relay ?? {};
-
-    // Everything on disk hangs off the base working directory.
-    const baseDir = cwd ?? process.cwd();
-    this.cwd = baseDir;
-    this.summaryDir = summaryDir ?? path.join(baseDir, '.relay', 'summaries');
-    this.workersPath = path.join(baseDir, '.agent-relay', 'team', 'workers.json');
-
-    this.processBackend = processBackend;
-    this.envSecrets = envSecrets;
-    // An explicit executor always wins; the backend-derived one is only a fallback.
-    this.executor =
-      !executor && processBackend
-        ? createProcessBackendExecutor(processBackend, { env: envSecrets })
-        : executor;
-
-    this.templateResolver = new TemplateResolver();
-    this.channelMessenger = new ChannelMessenger({
-      postFn: (text) => this.postToChannel(text),
-    });
-  }
-
-  // ── Path resolution ─────────────────────────────────────────────────────
-
-  /**
-   * Substitute `$NAME` references in a path string with values from `process.env`.
-   * References to unset variables are left in the string verbatim.
-   */
-  private static resolveEnvVars(p: string): string {
-    const substitute = (reference: string, name: string): string => {
-      const value = process.env[name];
-      return value ?? reference;
-    };
-    return p.replace(/\$([A-Za-z_][A-Za-z0-9_]*)/g, substitute);
-  }
-
-  /**
-   * Resolve the top-level `paths` definitions from the config against `baseCwd`.
-   *
-   * Environment references in each path are expanded first, then the result is made
-   * absolute. Problems are collected rather than thrown:
-   *  - a repeated name yields an error and the later definition is ignored;
-   *  - a missing directory yields an error, unless the definition sets
-   *    `required: false`, in which case it yields a warning.
-   *
-   * @returns the name → absolute path map (missing paths included) plus the
-   *          accumulated errors and warnings.
-   */
-  private resolvePathDefinitions(
-    pathDefs: PathDefinition[] | undefined,
-    baseCwd: string
-  ): { resolved: Map<string, string>; errors: string[]; warnings: string[] } {
-    const resolved = new Map<string, string>();
-    const errors: string[] = [];
-    const warnings: string[] = [];
-
-    const claimedNames = new Set<string>();
-    for (const definition of pathDefs ?? []) {
-      const { name } = definition;
-      if (claimedNames.has(name)) {
-        errors.push(`Duplicate path name "${name}"`);
-        continue;
-      }
-      claimedNames.add(name);
-
-      const absolutePath = path.resolve(baseCwd, WorkflowRunner.resolveEnvVars(definition.path));
-      resolved.set(name, absolutePath);
-      if (existsSync(absolutePath)) continue;
-
-      // `required` defaults to true: only an explicit `false` downgrades to a warning.
-      if (definition.required === false) {
-        warnings.push(`Path "${name}" resolves to "${absolutePath}" which does not exist (optional)`);
-      } else {
-        errors.push(`Path "${name}" resolves to "${absolutePath}" which does not exist (required)`);
-      }
-    }
-
-    return { resolved, errors, warnings };
-  }
-
-  /**
-   * Create (or clear) the per-run budget tracker.
-   *
-   * A tracker is only instantiated when the swarm declares a `tokenBudget` or at
-   * least one agent-backed step resolves to an agent with `constraints.maxTokens`.
-   * Deterministic, worktree, and integration steps, and steps without an agent,
-   * contribute no step budget entry.
-   */
-  private initializeBudgetTracker(config: RelayYamlConfig, workflow: WorkflowDefinition): void {
-    const agentsByName = new Map(
-      config.agents.map((agent) => [agent.name, WorkflowRunner.resolveAgentDef(agent)])
-    );
-
-    const stepConfigs = workflow.steps.flatMap((step) => {
-      if (step.type === 'deterministic' || step.type === 'worktree' || step.type === 'integration') {
-        return [];
-      }
-      if (!step.agent) {
-        return [];
-      }
-
-      const stepName = step.name;
-      const agentName = step.agent;
-      const maxTokens = agentsByName.get(agentName)?.constraints?.maxTokens;
-      return [{ stepName, agentName, maxTokens }];
-    });
-
-    const workflowBudget = config.swarm.tokenBudget;
-    const budgetsConfigured =
-      workflowBudget !== undefined || stepConfigs.some((entry) => entry.maxTokens !== undefined);
-
-    if (!budgetsConfigured) {
-      this.budgetTracker = undefined;
-      return;
-    }
-    this.budgetTracker = new BudgetTracker({ workflowBudget, steps: stepConfigs });
-  }
-
-  /**
-   * Guard a spawn against the run's token budget.
-   *
-   * No-op when no tracker exists or the tracker allows the step. Otherwise logs the
-   * workflow-level usage and throws `BudgetExceededError` for the step.
-   * `agentName` is accepted but not used by this method.
-   */
-  private ensureBudgetAllowsSpawn(stepName: string, agentName: string): void {
-    const tracker = this.budgetTracker;
-    if (!tracker) return;
-    if (tracker.checkCanSpawn(stepName).allowed) return;
-
-    const usage = tracker.getRunSummaryBudgetData()?.workflow;
-    const usedLabel = usage?.used.toLocaleString('en-US') ?? '0';
-    const limitLabel = usage?.limit?.toLocaleString('en-US') ?? '--';
-    const notice = `[budget] Skipping step ${stepName} — workflow budget exhausted (used ${usedLabel} of ${limitLabel})`;
-    this.log(notice);
-
-    throw new BudgetExceededError(stepName, 'workflow', usage?.limit ?? 0, usage?.used ?? 0);
-  }
-
-  /** Sum of input, output, and cache-read tokens for a report, or `undefined` when it has no token data. */
-  private getTotalReportTokens(report: CliSessionReport): number | undefined {
-    const usage = report.tokens;
-    if (!usage) return undefined;
-
-    const { input, output, cacheRead } = usage;
-    return input + output + cacheRead;
-  }
-
-  /**
-   * Validate `permission_profiles` and per-agent `permissions` blocks.
-   *
-   * Nothing is thrown; problems are accumulated and returned. Profiles are checked
-   * first (they may not reference other profiles), then every agent that declares
-   * permissions (which may reference a profile by name).
-   *
-   * @param agents agent definitions whose `permissions` should be checked
-   * @param permissionProfiles the config's `permission_profiles` value
-   * @param source label prefixed to messages for profiles and agents
-   * @returns accumulated `errors` and `warnings`
-   */
-  private validatePermissions(
-    agents: AgentDefinition[] | undefined,
-    permissionProfiles: RelayYamlConfig['permission_profiles'],
-    source = '<config>'
-  ): { errors: string[]; warnings: string[] } {
-    const errors: string[] = [];
-    const warnings: string[] = [];
-    const accessPresets = new Set<AccessPreset>(['readonly', 'readwrite', 'restricted', 'full']);
-    const profiles = permissionProfiles ?? {};
-    const profileNames = new Set(Object.keys(profiles));
-
-    // Returns undefined for a missing or non-array value (the latter is an error);
-    // otherwise returns only the string entries, recording one error per non-string entry.
-    const validateStringArray = (value: unknown, label: string): string[] | undefined => {
-      if (value === undefined) {
-        return undefined;
-      }
-      if (!Array.isArray(value)) {
-        errors.push(`${label} must be an array of strings`);
-        return undefined;
-      }
-
-      const normalized: string[] = [];
-      for (const entry of value) {
-        if (typeof entry !== 'string') {
-          errors.push(`${label} must be an array of strings`);
-          continue;
-        }
-        normalized.push(entry);
-      }
-      return normalized;
-    };
-
-    // Structural sanity check for one glob: non-empty, no NUL byte, no dangling
-    // backslash, no unclosed `[` or `{`; finally the pattern is handed to `ignore()`
-    // so anything it throws is reported too. At most one error is recorded per pattern.
-    const validateGlobPattern = (pattern: string, label: string): void => {
-      const trimmed = pattern.trim();
-      if (trimmed === '') {
-        errors.push(`${label} must not contain empty glob patterns`);
-        return;
-      }
-      if (trimmed.includes('\0')) {
-        errors.push(`${label} contains an invalid glob pattern "${pattern}" (NUL byte)`);
-        return;
-      }
-
-      let escaped = false;
-      let bracketDepth = 0;
-      let braceDepth = 0;
-
-      // Single pass tracking escape state and open-delimiter depth. A closing
-      // delimiter with nothing open is ignored rather than treated as an error.
-      for (const ch of trimmed) {
-        if (escaped) {
-          escaped = false;
-          continue;
-        }
-        if (ch === '\\') {
-          escaped = true;
-          continue;
-        }
-        if (ch === '[') {
-          bracketDepth += 1;
-          continue;
-        }
-        if (ch === ']' && bracketDepth > 0) {
-          bracketDepth -= 1;
-          continue;
-        }
-        if (ch === '{') {
-          braceDepth += 1;
-          continue;
-        }
-        if (ch === '}' && braceDepth > 0) {
-          braceDepth -= 1;
-        }
-      }
-
-      if (escaped) {
-        errors.push(`${label} contains an invalid glob pattern "${pattern}" (dangling escape)`);
-        return;
-      }
-      if (bracketDepth > 0) {
-        errors.push(`${label} contains an invalid glob pattern "${pattern}" (unclosed character class)`);
-        return;
-      }
-      if (braceDepth > 0) {
-        errors.push(`${label} contains an invalid glob pattern "${pattern}" (unclosed brace expansion)`);
-        return;
-      }
-
-      try {
-        ignore().add([trimmed]);
-      } catch (err) {
-        errors.push(
-          `${label} contains an invalid glob pattern "${pattern}" (${err instanceof Error ? err.message : String(err)})`
-        );
-      }
-    };
-
-    // Validates one permissions value, which is either a string shorthand or an object.
-    // `allowProfileReference` is true for agents and false for profile definitions.
-    const validatePermissionObject = (
-      permissions: unknown,
-      label: string,
-      options: { allowProfileReference: boolean }
-    ): void => {
-      if (typeof permissions === 'string') {
-        const shorthand = permissions.trim();
-        if (shorthand === '') {
-          errors.push(`${label} must not be empty`);
-          return;
-        }
-
-        // A preset name is always acceptable as shorthand.
-        if (accessPresets.has(shorthand as AccessPreset)) {
-          return;
-        }
-
-        // Any other string is read as a profile name where references are allowed.
-        if (options.allowProfileReference) {
-          if (!profileNames.has(shorthand)) {
-            errors.push(`${label} references unknown permission profile "${shorthand}"`);
-          }
-          return;
-        }
-
-        errors.push(`${label} must be an object when provided`);
-        return;
-      }
-
-      if (typeof permissions !== 'object' || permissions === null) {
-        errors.push(`${label} must be an object when provided`);
-        return;
-      }
-
-      const permissionRecord = permissions as Record<string, unknown>;
-
-      if (permissionRecord.description !== undefined && typeof permissionRecord.description !== 'string') {
-        errors.push(`${label}.description must be a string when provided`);
-      }
-
-      // NOTE(review): the shorthand above is trimmed before the profile lookup, but
-      // `.profile` is looked up untrimmed here — confirm whether that is intended.
-      if (permissionRecord.profile !== undefined) {
-        if (!options.allowProfileReference) {
-          errors.push(`${label}.profile is only supported on agent permissions`);
-        } else if (typeof permissionRecord.profile !== 'string') {
-          errors.push(`${label}.profile must be a string when provided`);
-        } else if (permissionRecord.profile.trim() === '') {
-          errors.push(`${label}.profile must not be empty`);
-        } else if (!profileNames.has(permissionRecord.profile)) {
-          errors.push(`${label}.profile references unknown permission profile "${permissionRecord.profile}"`);
-        }
-      }
-
-      if (permissionRecord.why !== undefined && typeof permissionRecord.why !== 'string') {
-        errors.push(`${label}.why must be a string when provided`);
-      }
-
-      if (
-        permissionRecord.access !== undefined &&
-        !accessPresets.has(permissionRecord.access as AccessPreset)
-      ) {
-        errors.push(`${label}.access must be one of readonly, readwrite, restricted, full`);
-      }
-
-      if (permissionRecord.inherit !== undefined && typeof permissionRecord.inherit !== 'boolean') {
-        errors.push(`${label}.inherit must be a boolean when provided`);
-      }
-
-      // `network` is either a boolean or an object with optional allow/deny string arrays.
-      if (permissionRecord.network !== undefined) {
-        if (typeof permissionRecord.network === 'boolean') {
-          // valid: boolean form
-        } else if (
-          typeof permissionRecord.network === 'object' &&
-          permissionRecord.network !== null &&
-          !Array.isArray(permissionRecord.network)
-        ) {
-          const net = permissionRecord.network as Record<string, unknown>;
-          validateStringArray(net.allow, `${label}.network.allow`);
-          validateStringArray(net.deny, `${label}.network.deny`);
-        } else {
-          errors.push(`${label}.network must be a boolean or an object with allow/deny arrays`);
-        }
-      }
-
-      // `files` holds optional read/write/deny glob lists; each glob is checked individually.
-      if (permissionRecord.files !== undefined) {
-        if (
-          typeof permissionRecord.files !== 'object' ||
-          permissionRecord.files === null ||
-          Array.isArray(permissionRecord.files)
-        ) {
-          errors.push(`${label}.files must be an object when provided`);
-        } else {
-          const files = permissionRecord.files as Record<string, unknown>;
-          const read = validateStringArray(files.read, `${label}.files.read`);
-          const write = validateStringArray(files.write, `${label}.files.write`);
-          const deny = validateStringArray(files.deny, `${label}.files.deny`);
-
-          for (const pattern of read ?? []) {
-            validateGlobPattern(pattern, `${label}.files.read`);
-          }
-          for (const pattern of write ?? []) {
-            validateGlobPattern(pattern, `${label}.files.write`);
-          }
-          for (const pattern of deny ?? []) {
-            validateGlobPattern(pattern, `${label}.files.deny`);
-          }
-
-          // Contradictory but not fatal: readonly access combined with write globs.
-          if (permissionRecord.access === 'readonly' && (write?.length ?? 0) > 0) {
-            warnings.push(`${label} sets access to "readonly" but also defines files.write entries`);
-          }
-        }
-      }
-
-      // Scopes need at least four colon-separated parts; the first three may not
-      // contain colons or whitespace, the remainder is unconstrained.
-      const scopes = validateStringArray(permissionRecord.scopes, `${label}.scopes`);
-      for (const scope of scopes ?? []) {
-        if (scope.trim() === '') {
-          errors.push(`${label}.scopes must not contain empty strings`);
-          continue;
-        }
-        if (!/^[^:\s]+:[^:\s]+:[^:\s]+:.+$/u.test(scope)) {
-          errors.push(`${label}.scopes entry "${scope}" must follow plane:resource:action:path format`);
-        }
-      }
-
-      const exec = validateStringArray(permissionRecord.exec, `${label}.exec`);
-      for (const entry of exec ?? []) {
-        if (entry.trim() === '') {
-          errors.push(`${label}.exec must not contain empty strings`);
-        }
-      }
-    };
-
-    // Pass 1: profile definitions (no profile-to-profile references allowed).
-    if (permissionProfiles !== undefined) {
-      if (
-        typeof permissionProfiles !== 'object' ||
-        permissionProfiles === null ||
-        Array.isArray(permissionProfiles)
-      ) {
-        errors.push(`${source}: permission_profiles must be an object when provided`);
-      } else {
-        for (const [profileName, profile] of Object.entries(permissionProfiles)) {
-          if (profileName.trim() === '') {
-            errors.push(`${source}: permission_profiles keys must not be empty`);
-            continue;
-          }
-          validatePermissionObject(profile, `${source}: permission_profiles.${profileName}`, {
-            allowProfileReference: false,
-          });
-        }
-      }
-    }
-
-    if (!agents || agents.length === 0) {
-      return { errors, warnings };
-    }
-
-    // Pass 2: agents that declare permissions (profile references allowed).
-    for (const agent of agents) {
-      if (agent.permissions === undefined) {
-        continue;
-      }
-      validatePermissionObject(agent.permissions, `${source}: agent "${agent.name}" permissions`, {
-        allowProfileReference: true,
-      });
-    }
-
-    return { errors, warnings };
-  }
-
-  /**
-   * Union two permission lists: entries are trimmed, blanks dropped, and duplicates
-   * removed while keeping first-seen order (base entries before override entries).
-   * Returns `undefined` when nothing remains.
-   */
-  private mergePermissionLists(
-    base: readonly string[] | undefined,
-    override: readonly string[] | undefined
-  ): string[] | undefined {
-    const unique = new Set<string>();
-    for (const source of [base, override]) {
-      for (const raw of source ?? []) {
-        const entry = raw.trim();
-        if (entry) unique.add(entry);
-      }
-    }
-    return unique.size > 0 ? [...unique] : undefined;
-  }
-
-  /**
-   * Merge the `read`, `write`, and `deny` lists of two `files` blocks.
-   * Returns `undefined` when all three merged lists are empty.
-   */
-  private mergePermissionFiles(
-    base: AgentPermissions['files'],
-    override: AgentPermissions['files']
-  ): AgentPermissions['files'] {
-    const read = this.mergePermissionLists(base?.read, override?.read);
-    const write = this.mergePermissionLists(base?.write, override?.write);
-    const deny = this.mergePermissionLists(base?.deny, override?.deny);
-
-    if (!read && !write && !deny) {
-      return undefined;
-    }
-    return { read, write, deny };
-  }
-
-  /**
-   * Layer an agent's permissions over a profile.
-   *
-   * Scalar fields (`description`, `why`, `access`, `inherit`, `network`) take the
-   * agent's value when present, else the profile's. List-valued fields (`files`,
-   * `scopes`, `exec`) are unioned. `profile` is carried over from the agent.
-   * Keys whose resulting value is `undefined` are omitted from the result.
-   */
-  private mergePermissionProfile(
-    profile: PermissionProfileDefinition,
-    permissions: AgentPermissions
-  ): AgentPermissions {
-    const layered: AgentPermissions = {
-      description: permissions.description ?? profile.description,
-      profile: permissions.profile,
-      why: permissions.why ?? profile.why,
-      access: permissions.access ?? profile.access,
-      inherit: permissions.inherit ?? profile.inherit,
-      files: this.mergePermissionFiles(profile.files, permissions.files),
-      scopes: this.mergePermissionLists(profile.scopes, permissions.scopes),
-      network: permissions.network ?? profile.network,
-      exec: this.mergePermissionLists(profile.exec, permissions.exec),
-    };
-
-    // Strip undefined-valued keys so the result only carries what was actually set.
-    const compact: { [key: string]: unknown } = {};
-    for (const [key, value] of Object.entries(layered)) {
-      if (value !== undefined) {
-        compact[key] = value;
-      }
-    }
-    return compact as AgentPermissions;
-  }
-
-  /**
-   * Expand permission-profile references on every agent.
-   *
-   * Returns `config` untouched when no profiles are defined. Otherwise returns a
-   * copy whose agents have:
-   *  - string shorthand rewritten to `{ profile }` when it names a known profile,
-   *    else to `{ access }`;
-   *  - the referenced profile merged underneath the agent's own permissions.
-   * Agents without permissions are passed through as-is; a reference to an
-   * unknown profile leaves the normalized permissions unmerged.
-   */
-  private applyPermissionProfiles(config: RelayYamlConfig): RelayYamlConfig {
-    const profiles = config.permission_profiles;
-    if (!profiles || Object.keys(profiles).length === 0) {
-      return config;
-    }
-
-    const agents = config.agents.map((agent) => {
-      const declared = agent.permissions;
-      if (!declared) {
-        return agent;
-      }
-
-      const permissions =
-        typeof declared === 'string'
-          ? ((profiles[declared]
-              ? { profile: declared }
-              : { access: declared as AccessPreset }) as AgentPermissions)
-          : declared;
-
-      const referenced = permissions.profile ? profiles[permissions.profile] : undefined;
-      return {
-        ...agent,
-        permissions: referenced ? this.mergePermissionProfile(referenced, permissions) : permissions,
-      };
-    });
-
-    return { ...config, agents };
-  }
-
-  /**
-   * Working directory for an agent definition.
-   *
-   * Precedence: `workdir` (a name looked up in the resolved `paths` map) over `cwd`
-   * (resolved against the runner's base directory) over the base directory itself.
-   *
-   * @throws Error when `workdir` names a path that was not resolved.
-   */
-  private resolveAgentCwd(agent: AgentDefinition): string {
-    const { workdir, cwd: agentCwd } = agent;
-
-    if (!workdir) {
-      return agentCwd ? path.resolve(this.cwd, agentCwd) : this.cwd;
-    }
-
-    const namedPath = this.resolvedPaths.get(workdir);
-    if (namedPath) {
-      return namedPath;
-    }
-    throw new Error(
-      `Agent "${agent.name}" references workdir "${agent.workdir}" which is not defined in paths`
-    );
-  }
-
-  /**
-   * Directory named by a step's `workdir`, looked up in the resolved `paths` map.
-   *
-   * @returns the absolute directory, or `undefined` when the step sets no `workdir`.
-   * @throws Error when `workdir` names a path that was not resolved.
-   */
-  private resolveStepWorkdir(step: WorkflowStep): string | undefined {
-    const { workdir } = step;
-    if (!workdir) {
-      return undefined;
-    }
-
-    const namedPath = this.resolvedPaths.get(workdir);
-    if (namedPath) {
-      return namedPath;
-    }
-    throw new Error(
-      `Step "${step.name}" references workdir "${step.workdir}" which is not defined in paths`
-    );
-  }
-
-  /**
-   * Pick the directory a step should run in. Precedence: the step's `cwd`, then the
-   * step's `workdir`, then the agent's directory (when an agent is given), then the
-   * runner's base directory.
-   */
-  private resolveEffectiveCwd(step: WorkflowStep, agentDef?: AgentDefinition): string {
-    if (step.cwd) {
-      return path.resolve(this.cwd, step.cwd);
-    }
-
-    const stepWorkdir = this.resolveStepWorkdir(step);
-    if (stepWorkdir !== undefined) {
-      return stepWorkdir;
-    }
-
-    return agentDef ? this.resolveAgentCwd(agentDef) : this.cwd;
-  }
-
-  /**
-   * Translate a directory into the agent's mount, when the agent has one.
-   *
-   * The directory's position relative to the runner's base directory is re-rooted
-   * at the mount point. Directories that sit outside the base directory, and agents
-   * without a mount, get `cwd` back unchanged.
-   */
-  private resolveMountedCwd(agentName: string, cwd: string): string {
-    const mount = this.agentMounts.get(agentName);
-    if (!mount) {
-      return cwd;
-    }
-
-    const offset = path.relative(this.cwd, cwd);
-    const escapesBase = offset === '..' || offset.startsWith(`..${path.sep}`);
-    if (escapesBase) {
-      return cwd;
-    }
-
-    // An empty offset means `cwd` is the base directory itself.
-    return offset === '' ? mount.mountPoint : path.resolve(mount.mountPoint, offset);
-  }
-
-  /**
-   * Directory a step actually executes in: the effective cwd, re-rooted into the
-   * agent's mount when an agent definition is supplied.
-   */
-  private resolveExecutionCwd(step: WorkflowStep, agentDef?: AgentDefinition): string {
-    const effective = this.resolveEffectiveCwd(step, agentDef);
-    return agentDef ? this.resolveMountedCwd(agentDef.name, effective) : effective;
-  }
-
-  /**
-   * Stop every tracked agent mount. The map is emptied before stopping begins, and
-   * a rejected `stop()` is swallowed so one failing mount does not block the rest.
-   */
-  private async stopProvisionedMounts(): Promise<void> {
-    const pending = Array.from(this.agentMounts.values());
-    this.agentMounts.clear();
-
-    const stops = pending.map((mount) => mount.stop().catch(() => undefined));
-    await Promise.all(stops);
-  }
-
-  /**
-   * Directory names (VCS metadata, relay/trajectory state, installed dependencies).
-   * NOTE(review): presumably skipped when snapshotting files for step evidence —
-   * confirm against the snapshot code that consumes this set.
-   */
-  private static readonly EVIDENCE_IGNORED_DIRS = new Set([
-    '.git',
-    '.agent-relay',
-    '.trajectories',
-    'node_modules',
-  ]);
-
-  /**
-   * Snapshot of the evidence collected for a step, or `undefined` when none exists.
-   * The stored evidence is deep-cloned and then filtered by signal provenance, so
-   * the returned object can be mutated without touching the runner's record.
-   */
-  public getStepCompletionEvidence(stepName: string): StepCompletionEvidence | undefined {
-    const record = this.stepCompletionEvidence.get(stepName);
-    return record
-      ? this.filterStepEvidenceBySignalProvenance(stepName, structuredClone(record.evidence))
-      : undefined;
-  }
-
-  /**
-   * Fetch the evidence record for a step, creating and registering an empty one
-   * (stamped with the current time) on first use.
-   */
-  private getOrCreateStepEvidenceRecord(stepName: string): StepEvidenceRecord {
-    const cached = this.stepCompletionEvidence.get(stepName);
-    if (cached) {
-      return cached;
-    }
-
-    const created: StepEvidenceRecord = {
-      evidence: {
-        stepName,
-        lastUpdatedAt: new Date().toISOString(),
-        roots: [],
-        output: { stdout: '', stderr: '', combined: '' },
-        channelPosts: [],
-        files: [],
-        process: {},
-        toolSideEffects: [],
-        coordinationSignals: [],
-      },
-      baselineSnapshots: new Map(),
-      filesCaptured: false,
-    };
-
-    this.stepCompletionEvidence.set(stepName, created);
-    return created;
-  }
-
-  /**
-   * Reset the expected signal senders for a step, seeding the owner and worker
-   * sets with the given names (trimmed; blank or missing names are not added).
-   */
-  private initializeStepSignalParticipants(
-    stepName: string,
-    ownerSender?: string,
-    workerSender?: string
-  ): void {
-    const seed = (sender?: string): Set<string> => {
-      const names = new Set<string>();
-      const name = sender?.trim();
-      if (name) names.add(name);
-      return names;
-    };
-
-    this.stepSignalParticipants.set(stepName, {
-      ownerSenders: seed(ownerSender),
-      workerSenders: seed(workerSender),
-    });
-  }
-
-  /**
-   * Add sender names to a step's owner or worker set, creating the participant
-   * entry if the step has none yet. Names are trimmed; blank or missing ones are skipped.
-   */
-  private rememberStepSignalSender(
-    stepName: string,
-    participant: 'owner' | 'worker',
-    ...senders: Array<string | undefined>
-  ): void {
-    let participants = this.stepSignalParticipants.get(stepName);
-    if (!participants) {
-      participants = {
-        ownerSenders: new Set<string>(),
-        workerSenders: new Set<string>(),
-      };
-      this.stepSignalParticipants.set(stepName, participants);
-    }
-
-    const bucket = participant === 'owner' ? participants.ownerSenders : participants.workerSenders;
-    senders.forEach((candidate) => {
-      const name = candidate?.trim();
-      if (name) {
-        bucket.add(name);
-      }
-    });
-  }
-
-  /**
-   * Classify a free-form role string as `'owner'` or `'worker'` by keyword.
-   * Owner keywords are checked first; returns `undefined` for a blank role or
-   * when no keyword matches.
-   */
-  private resolveSignalParticipantKind(role?: string): 'owner' | 'worker' | undefined {
-    const normalized = role?.toLowerCase().trim();
-    if (!normalized) {
-      return undefined;
-    }
-
-    if (/\b(owner|lead|supervisor)\b/.test(normalized)) {
-      return 'owner';
-    }
-    return /\b(worker|specialist|engineer|implementer)\b/.test(normalized) ? 'worker' : undefined;
-  }
-
-  /**
-   * Decide whether a completion signal came from a participant allowed to send it.
-   *
-   * Only `worker_done` and `lead_done` are sender-restricted; every other kind is
-   * accepted. A restricted signal is also accepted when the step has no recorded
-   * senders for the relevant side. Otherwise the check falls through, in order:
-   * explicit sender/actor name, role keyword, and finally "anything that did not
-   * arrive via the channel".
-   */
-  private isSignalFromExpectedSender(stepName: string, signal: CompletionEvidenceSignal): boolean {
-    let expected: 'owner' | 'worker';
-    switch (signal.kind) {
-      case 'worker_done':
-        expected = 'worker';
-        break;
-      case 'lead_done':
-        expected = 'owner';
-        break;
-      default:
-        return true;
-    }
-
-    const participants = this.stepSignalParticipants.get(stepName);
-    const allowed = expected === 'owner' ? participants?.ownerSenders : participants?.workerSenders;
-    if (!allowed || allowed.size === 0) {
-      return true;
-    }
-
-    const sender = signal.sender ?? signal.actor;
-    if (sender) {
-      return allowed.has(sender);
-    }
-
-    // No sender identity: fall back to what the role string implies.
-    const observed = this.resolveSignalParticipantKind(signal.role);
-    if (observed) {
-      return observed === expected;
-    }
-
-    // Fully anonymous signals are rejected only when they arrived via the channel.
-    return signal.source !== 'channel';
-  }
-
-  /**
-   * Drop signals that did not come from an expected sender. Mutates and returns
-   * `evidence`: each channel post keeps only its accepted signals (and is marked
-   * completion-relevant only if any remain), and the flat signal list is filtered
-   * the same way.
-   */
-  private filterStepEvidenceBySignalProvenance(
-    stepName: string,
-    evidence: StepCompletionEvidence
-  ): StepCompletionEvidence {
-    const isAccepted = (signal: CompletionEvidenceSignal): boolean =>
-      this.isSignalFromExpectedSender(stepName, signal);
-
-    evidence.channelPosts = evidence.channelPosts.map((post) => {
-      const accepted = post.signals.filter((signal) => isAccepted(signal));
-      return { ...post, completionRelevant: accepted.length > 0, signals: accepted };
-    });
-    evidence.coordinationSignals = evidence.coordinationSignals.filter((signal) => isAccepted(signal));
-
-    return evidence;
-  }
-
-  /**
-   * Mark a step as running and register its evidence roots.
-   *
-   * `startedAt` is only recorded the first time. Each new root is appended to the
-   * evidence and gets a baseline file snapshot; roots that are already known keep
-   * their existing baseline.
-   */
-  private beginStepEvidence(stepName: string, roots: Array<string | undefined>, startedAt?: string): void {
-    const { evidence, baselineSnapshots } = this.getOrCreateStepEvidenceRecord(stepName);
-    const timestamp = startedAt ?? new Date().toISOString();
-
-    if (evidence.startedAt === undefined || evidence.startedAt === null) {
-      evidence.startedAt = timestamp;
-    }
-    evidence.status = 'running';
-    evidence.lastUpdatedAt = timestamp;
-
-    for (const root of this.uniqueEvidenceRoots(roots)) {
-      const alreadyListed = evidence.roots.includes(root);
-      if (!alreadyListed) {
-        evidence.roots.push(root);
-      }
-
-      const hasBaseline = baselineSnapshots.has(root);
-      if (!hasBaseline) {
-        baselineSnapshots.set(root, this.captureFileSnapshot(root));
-      }
-    }
-  }
-
-  /**
-   * Append terminal output and process exit details to a step's evidence.
-   *
-   * Non-empty stdout/stderr are appended (newline-separated) to their buffers and
-   * scanned for completion signals. The combined buffer takes `output.combined`
-   * when provided, else stdout and stderr joined by a newline. A defined exit code
-   * is stored and also recorded as a `process_exit` signal; a defined exit signal
-   * is stored.
-   */
-  private captureStepTerminalEvidence(
-    stepName: string,
-    output: { stdout?: string; stderr?: string; combined?: string },
-    process?: { exitCode?: number; exitSignal?: string },
-    meta?: { sender?: string; actor?: string; role?: string }
-  ): void {
-    const { evidence } = this.getOrCreateStepEvidenceRecord(stepName);
-    const observedAt = new Date().toISOString();
-
-    const joinLines = (existing: string, addition: string): string =>
-      existing ? `${existing}\n${addition}` : addition;
-
-    // stdout first, then stderr, so signal order matches stream order.
-    const streams = [
-      ['stdout', output.stdout],
-      ['stderr', output.stderr],
-    ] as const;
-    for (const [stream, chunk] of streams) {
-      if (!chunk) continue;
-      evidence.output[stream] = joinLines(evidence.output[stream], chunk);
-      for (const signal of this.extractCompletionSignals(chunk, stream, observedAt, meta)) {
-        evidence.coordinationSignals.push(signal);
-      }
-    }
-
-    const combined =
-      output.combined ??
-      [output.stdout, output.stderr].filter((part): part is string => Boolean(part)).join('\n');
-    if (combined) {
-      evidence.output.combined = joinLines(evidence.output.combined, combined);
-    }
-
-    if (process?.exitCode !== undefined) {
-      const { exitCode } = process;
-      evidence.process.exitCode = exitCode;
-      evidence.coordinationSignals.push({
-        kind: 'process_exit',
-        source: 'process',
-        text: `Process exited with code ${exitCode}`,
-        observedAt,
-        value: String(exitCode),
-      });
-    }
-    if (process?.exitSignal !== undefined) {
-      evidence.process.exitSignal = process.exitSignal;
-    }
-
-    evidence.lastUpdatedAt = observedAt;
-  }
-
-  /**
-   * Close out a step's evidence record; no-op when the step has none.
-   *
-   * Records the status and timestamps, then — once per record — diffs each root
-   * against its baseline snapshot and appends file changes not already listed.
-   * When a completion reason is given and a decision can be built from it, the
-   * decision is forwarded to the trajectory without awaiting the result.
-   */
-  private finalizeStepEvidence(
-    stepName: string,
-    status: WorkflowStepStatus,
-    completedAt?: string,
-    completionReason?: WorkflowStepCompletionReason
-  ): void {
-    const record = this.stepCompletionEvidence.get(stepName);
-    if (!record) return;
-
-    const { evidence } = record;
-    const timestamp = completedAt ?? new Date().toISOString();
-
-    evidence.status = status;
-    if (status !== 'running') {
-      evidence.completedAt = timestamp;
-    }
-    evidence.lastUpdatedAt = timestamp;
-
-    if (!record.filesCaptured) {
-      // Keyed by kind+path so a change already recorded is not duplicated.
-      const known = new Set(evidence.files.map((file) => `${file.kind}:${file.path}`));
-
-      for (const root of evidence.roots) {
-        const baseline = record.baselineSnapshots.get(root) ?? new Map<string, FileSnapshotEntry>();
-        const current = this.captureFileSnapshot(root);
-
-        for (const change of this.diffFileSnapshots(baseline, current, root, timestamp)) {
-          const changeKey = `${change.kind}:${change.path}`;
-          if (!known.has(changeKey)) {
-            known.add(changeKey);
-            evidence.files.push(change);
-          }
-        }
-      }
-      record.filesCaptured = true;
-    }
-
-    if (!completionReason) return;
-
-    const decision = this.buildStepCompletionDecision(stepName, completionReason);
-    if (decision) {
-      void this.trajectory?.stepCompletionDecision(stepName, decision);
-    }
-  }
-
-  /**
-   * Append a tool side-effect to a step's evidence, stamping it with the current
-   * time when the caller did not supply `observedAt`.
-   */
-  private recordStepToolSideEffect(
-    stepName: string,
-    effect: Omit<CompletionEvidenceToolSideEffect, 'observedAt'> & { observedAt?: string }
-  ): void {
-    const { evidence } = this.getOrCreateStepEvidenceRecord(stepName);
-    const observedAt = effect.observedAt ?? new Date().toISOString();
-
-    evidence.toolSideEffects.push({ ...effect, observedAt });
-    evidence.lastUpdatedAt = observedAt;
-  }
-
-  /**
-   * Attribute a channel message to a step and store it as evidence.
-   *
-   * The step is taken from `options.stepName`, else inferred from the text, else
-   * looked up from the actor's runtime step; the message is dropped when none of
-   * these yields a step. Completion signals found in the text are stored both on
-   * the post and in the step's flat signal list.
-   */
-  private recordChannelEvidence(text: string, options: ChannelEvidenceOptions = {}): void {
-    const { actor, role, target } = options;
-
-    const stepName =
-      options.stepName ??
-      this.inferStepNameFromChannelText(text) ??
-      (actor ? this.runtimeStepAgents.get(actor)?.stepName : undefined);
-    if (!stepName) {
-      return;
-    }
-
-    const { evidence } = this.getOrCreateStepEvidenceRecord(stepName);
-    const postedAt = new Date().toISOString();
-    // The sender defaults to the actor when not given explicitly.
-    const sender = options.sender ?? actor;
-    const signals = this.extractCompletionSignals(text, 'channel', postedAt, { sender, actor, role });
-
-    const post: CompletionEvidenceChannelPost = {
-      stepName,
-      text,
-      postedAt,
-      origin: options.origin ?? 'runner_post',
-      completionRelevant: signals.length > 0,
-      sender,
-      actor,
-      role,
-      target,
-      signals,
-    };
-
-    evidence.channelPosts.push(post);
-    evidence.coordinationSignals.push(...signals);
-    evidence.lastUpdatedAt = postedAt;
-  }
-
-  private extractCompletionSignals(
-    text: string,
-    source: CompletionEvidenceSignal['source'],
-    observedAt: string,
-    meta?: { sender?: string; actor?: string; role?: string }
-  ): CompletionEvidenceSignal[] {
-    const signals: CompletionEvidenceSignal[] = [];
-    const seen = new Set<string>();
-    const add = (kind: CompletionEvidenceSignalKind, signalText: string, value?: string): void => {
-      const trimmed = signalText.trim().slice(0, 280);
-      if (!trimmed) return;
-      const key = `${kind}:${trimmed}:${value ?? ''}`;
-      if (seen.has(key)) return;
-      seen.add(key);
-      signals.push({
-        kind,
-        source,
-        text: trimmed,
-        observedAt,
-        sender: meta?.sender,
-        actor: meta?.actor,
-        role: meta?.role,
-        value,
-      });
-    };
-
-    for (const match of text.matchAll(/\bWORKER_DONE\b(?::\s*([^\n]+))?/gi)) {
-      add('worker_done', match[0], match[1]?.trim());
-    }
-    for (const match of text.matchAll(/\bLEAD_DONE\b(?::\s*([^\n]+))?/gi)) {
-      add('lead_done', match[0], match[1]?.trim());
-    }
-    for (const match of text.matchAll(/\bSTEP_COMPLETE:([A-Za-z0-9_.:-]+)/g)) {
-      add('step_complete', match[0], match[1]);
-    }
-    for (const match of text.matchAll(
-      /\bOWNER_DECISION:\s*(COMPLETE|INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION)\b/gi
-    )) {
-      add('owner_decision', match[0], match[1].toUpperCase());
-    }
-    for (const match of text.matchAll(/\bREVIEW_DECISION:\s*(APPROVE|REJECT)\b/gi)) {
-      add('review_decision', match[0], match[1].toUpperCase());
-    }
-    if (/\bverification gate observed\b|\bverification passed\b/i.test(text)) {
-      add('verification_passed', this.firstMeaningfulLine(text) ?? text);
-    }
-    if (/\bverification failed\b/i.test(text)) {
-      add('verification_failed', this.firstMeaningfulLine(text) ?? text);
-    }
-    if (
-      /\b(summary|handoff|ready for review|ready for handoff|task complete|work complete|completed work|finished work)\b/i.test(
-        text
-      )
-    ) {
-      add('task_summary', this.firstMeaningfulLine(text) ?? text);
-    }
-
-    return signals;
-  }
-
-  private inferStepNameFromChannelText(text: string): string | undefined {
-    const bracketMatch = text.match(/^\*\*\[([^\]]+)\]/);
-    if (bracketMatch?.[1]) return bracketMatch[1];
-
-    const markerMatch = text.match(/\bSTEP_COMPLETE:([A-Za-z0-9_.:-]+)/);
-    if (markerMatch?.[1]) return markerMatch[1];
-
-    return undefined;
-  }
-
-  private uniqueEvidenceRoots(roots: Array<string | undefined>): string[] {
-    return [
-      ...new Set(roots.filter((root): root is string => Boolean(root)).map((root) => path.resolve(root))),
-    ];
-  }
-
-  private captureFileSnapshot(root: string): Map<string, FileSnapshotEntry> {
-    const snapshot = new Map<string, FileSnapshotEntry>();
-    if (!existsSync(root)) return snapshot;
-
-    const visit = (currentPath: string): void => {
-      let entries: Dirent[];
-      try {
-        entries = readdirSync(currentPath, { withFileTypes: true });
-      } catch {
-        return;
-      }
-
-      for (const entry of entries) {
-        if (entry.isDirectory() && WorkflowRunner.EVIDENCE_IGNORED_DIRS.has(entry.name)) {
-          continue;
-        }
-
-        const fullPath = path.join(currentPath, entry.name);
-        if (entry.isDirectory()) {
-          visit(fullPath);
-          continue;
-        }
-
-        try {
-          const stats = statSync(fullPath);
-          if (!stats.isFile()) continue;
-          snapshot.set(fullPath, { mtimeMs: stats.mtimeMs, size: stats.size });
-        } catch {
-          // Best-effort evidence collection only.
-        }
-      }
-    };
-
-    try {
-      const stats = statSync(root);
-      if (stats.isFile()) {
-        snapshot.set(root, { mtimeMs: stats.mtimeMs, size: stats.size });
-        return snapshot;
-      }
-    } catch {
-      return snapshot;
-    }
-
-    visit(root);
-    return snapshot;
-  }
-
-  private diffFileSnapshots(
-    before: Map<string, FileSnapshotEntry>,
-    after: Map<string, FileSnapshotEntry>,
-    root: string,
-    observedAt: string
-  ): CompletionEvidenceFileChange[] {
-    const allPaths = new Set([...before.keys(), ...after.keys()]);
-    const changes: CompletionEvidenceFileChange[] = [];
-
-    for (const filePath of allPaths) {
-      const prior = before.get(filePath);
-      const next = after.get(filePath);
-
-      let kind: CompletionEvidenceFileChange['kind'] | undefined;
-      if (!prior && next) {
-        kind = 'created';
-      } else if (prior && !next) {
-        kind = 'deleted';
-      } else if (prior && next && (prior.mtimeMs !== next.mtimeMs || prior.size !== next.size)) {
-        kind = 'modified';
-      }
-
-      if (!kind) continue;
-
-      changes.push({
-        path: this.normalizeEvidencePath(filePath),
-        kind,
-        observedAt,
-        root,
-      });
-    }
-
-    return changes.sort((a, b) => a.path.localeCompare(b.path));
-  }
-
-  private normalizeEvidencePath(filePath: string): string {
-    const relative = path.relative(this.cwd, filePath);
-    if (!relative || relative === '') return path.basename(filePath);
-    return relative.startsWith('..') ? filePath : relative;
-  }
-
-  private buildStepCompletionDecision(
-    stepName: string,
-    completionReason: WorkflowStepCompletionReason
-  ): StepCompletionDecision | undefined {
-    let reason: string | undefined;
-    let mode: StepCompletionDecision['mode'];
-    switch (completionReason) {
-      case 'completed_verified':
-        mode = 'verification';
-        reason = 'Verification passed';
-        break;
-      case 'completed_by_evidence':
-        mode = 'evidence';
-        reason = 'Completion inferred from collected evidence';
-        break;
-      case 'completed_by_owner_decision': {
-        const evidence = this.getStepCompletionEvidence(stepName);
-        const markerObserved = evidence?.coordinationSignals.some(
-          (signal) => signal.kind === 'step_complete'
-        );
-        mode = markerObserved ? 'marker' : 'owner_decision';
-        reason = markerObserved ? 'Legacy STEP_COMPLETE marker observed' : 'Owner approved completion';
-        break;
-      }
-      default:
-        return undefined;
-    }
-
-    return {
-      mode,
-      reason,
-      evidence: this.buildTrajectoryCompletionEvidence(stepName),
-    };
-  }
-
-  private buildTrajectoryCompletionEvidence(
-    stepName: string
-  ): StepCompletionDecision['evidence'] | undefined {
-    const evidence = this.getStepCompletionEvidence(stepName);
-    if (!evidence) return undefined;
-
-    const signals = evidence.coordinationSignals.slice(-6).map((signal) => signal.value ?? signal.text);
-    const channelPosts = evidence.channelPosts
-      .filter((post) => post.completionRelevant)
-      .slice(-3)
-      .map((post) => post.text.slice(0, 160));
-    const files = evidence.files.slice(0, 6).map((file) => `${file.kind}:${file.path}`);
-
-    const summaryParts: string[] = [];
-    if (signals.length > 0) summaryParts.push(`${signals.length} signal(s)`);
-    if (channelPosts.length > 0) summaryParts.push(`${channelPosts.length} relevant channel post(s)`);
-    if (files.length > 0) summaryParts.push(`${files.length} file change(s)`);
-    if (evidence.process.exitCode !== undefined) {
-      summaryParts.push(`exit=${evidence.process.exitCode}`);
-    }
-
-    return {
-      summary: summaryParts.length > 0 ? summaryParts.join(', ') : undefined,
-      signals: signals.length > 0 ? signals : undefined,
-      channelPosts: channelPosts.length > 0 ? channelPosts : undefined,
-      files: files.length > 0 ? files : undefined,
-      exitCode: evidence.process.exitCode,
-    };
-  }
-
-  // ── Progress logging ────────────────────────────────────────────────────
-
-  /** Log a progress message with elapsed time since run start. */
-  private log(msg: string): void {
-    const elapsed = this.runStartTime ? Math.round((Date.now() - this.runStartTime) / 1000) : 0;
-    const mins = Math.floor(elapsed / 60);
-    const secs = elapsed % 60;
-    const ts =
-      mins > 0
-        ? `${String(mins).padStart(2, '0')}:${String(secs).padStart(2, '0')}`
-        : `00:${String(secs).padStart(2, '0')}`;
-    console.log(`${chalk.dim.cyan('[workflow')} ${chalk.dim.cyan(ts)}${chalk.dim.cyan(']')} ${msg}`);
-  }
-
-  // ── Relaycast auto-provisioning ────────────────────────────────────────
-
-  /**
-   * Ensure a Relaycast workspace API key is available for the broker.
-   * Resolution order:
-   *   1. RELAY_API_KEY environment variable (explicit override)
-   *   2. Auto-create a fresh workspace via the Relaycast API
-   *
-   * Each workflow run gets its own isolated workspace — no caching, no sharing.
-   */
-  private async ensureRelaycastApiKey(channel: string): Promise<void> {
-    if (this.relayApiKey) return;
-
-    // Explicit override from relayOptions or environment takes priority.
-    const envKey = this.relayOptions.env?.RELAY_API_KEY ?? process.env.RELAY_API_KEY;
-    if (envKey) {
-      this.relayApiKey = envKey;
-      return;
-    }
-
-    // Always create a fresh workspace — each run gets full isolation.
-    const workspaceName = `relay-${channel}-${randomBytes(4).toString('hex')}`;
-    const baseUrl =
-      this.relayOptions.env?.RELAYCAST_BASE_URL ??
-      process.env.RELAYCAST_BASE_URL ??
-      'https://api.relaycast.dev';
-    const res = await fetch(`${baseUrl}/v1/workspaces`, {
-      method: 'POST',
-      headers: { 'content-type': 'application/json' },
-      body: JSON.stringify({ name: workspaceName }),
-    });
-
-    if (!res.ok) {
-      throw new Error(`Failed to auto-create Relaycast workspace: ${res.status} ${await res.text()}`);
-    }
-
-    const body = (await res.json()) as Record<string, any>;
-    const data = (body.data ?? body) as Record<string, any>;
-    const apiKey = data.api_key as string;
-
-    if (!apiKey) {
-      throw new Error('Relaycast workspace response missing api_key');
-    }
-
-    this.relayApiKey = apiKey;
-    this.relayApiKeyAutoCreated = true;
-
-    // Best-effort: push the key to a co-running dashboard (agent-relay up) so it
-    // can make Relaycast API calls without any file or manual env var setup.
-    const dashboardPort = process.env.AGENT_RELAY_DASHBOARD_PORT || '3888';
-    fetch(`http://127.0.0.1:${dashboardPort}/api/relay-config`, {
-      method: 'POST',
-      headers: { 'content-type': 'application/json' },
-      body: JSON.stringify({ apiKey }),
-    })
-      .then((res) => {
-        if (!res.ok) {
-          console.warn(`[WorkflowRunner] dashboard key push failed: HTTP ${res.status}`);
-        }
-      })
-      .catch(() => {
-        // Dashboard not running — silently ignore.
-      });
-  }
-
-  private async loadCredentialProxyModule(): Promise<CredentialProxyModule | null> {
-    try {
-      const dynamicImport = new Function('specifier', 'return import(specifier)') as (
-        specifier: string
-      ) => Promise<unknown>;
-      const module = (await dynamicImport('@agent-relay/credential-proxy')) as Partial<CredentialProxyModule>;
-      return typeof module.mintProxyToken === 'function' ? (module as CredentialProxyModule) : null;
-    } catch (error) {
-      if ((error as NodeJS.ErrnoException | undefined)?.code === 'ERR_MODULE_NOT_FOUND') {
-        return null;
-      }
-
-      throw error;
-    }
-  }
-
-  private resolveCredentialProxyProvider(agentDef: AgentDefinition, config: RelayYamlConfig): ProxyProvider {
-    const configuredProviders = Object.keys(config.swarm.credentialProxy?.providers ?? {});
-    const explicitProvider = agentDef.credentials?.provider?.trim().toLowerCase();
-    if (
-      explicitProvider === 'openai' ||
-      explicitProvider === 'anthropic' ||
-      explicitProvider === 'openrouter'
-    ) {
-      return explicitProvider;
-    }
-
-    const model = agentDef.constraints?.model?.trim().toLowerCase() ?? '';
-    if (model.includes('openrouter')) {
-      return 'openrouter';
-    }
-    if (model.includes('claude') || model.includes('anthropic')) {
-      return 'anthropic';
-    }
-    if (
-      model.includes('openai') ||
-      model.includes('chatgpt') ||
-      model.includes('gpt') ||
-      /\bo[134](?:\b|-)/.test(model)
-    ) {
-      return 'openai';
-    }
-
-    if (configuredProviders.length === 1) {
-      const [onlyProvider] = configuredProviders;
-      if (onlyProvider === 'openai' || onlyProvider === 'anthropic' || onlyProvider === 'openrouter') {
-        return onlyProvider;
-      }
-    }
-
-    switch (agentDef.cli) {
-      case 'claude':
-        return 'anthropic';
-      case 'codex':
-      case 'aider':
-      case 'goose':
-      case 'opencode':
-      case 'cursor':
-      case 'cursor-agent':
-        return 'openai';
-      default:
-        throw new Error(
-          `Unable to resolve credential proxy provider for agent "${agentDef.name}". Set credentials.provider or constraints.model.`
-        );
-    }
-  }
-
-  private resolveCredentialProxySecret(config: RelayYamlConfig): string {
-    const configuredSecret = config.swarm.credentialProxy?.jwtSecret;
-    if (configuredSecret?.startsWith('$')) {
-      const envSecret = process.env[configuredSecret.slice(1)];
-      if (envSecret) {
-        return envSecret;
-      }
-    } else if (configuredSecret) {
-      return configuredSecret;
-    }
-
-    const defaultSecret = process.env.RELAY_PROXY_JWT_SECRET;
-    if (defaultSecret) {
-      return defaultSecret;
-    }
-
-    throw new Error(
-      'Credential proxy JWT secret is missing. Set swarm.credentialProxy.jwtSecret or RELAY_PROXY_JWT_SECRET.'
-    );
-  }
-
-  private async mintAgentProxyToken(
-    agentDef: AgentDefinition,
-    config: RelayYamlConfig
-  ): Promise<string | undefined> {
-    const proxyConfig = config.swarm?.credentialProxy;
-    if (!proxyConfig?.proxyUrl || !agentDef.credentials?.proxy) {
-      return undefined;
-    }
-
-    const provider = this.resolveCredentialProxyProvider(agentDef, config);
-    const providerConfig = proxyConfig.providers?.[provider];
-    const credentialId = providerConfig?.credentialId;
-    if (!credentialId) {
-      throw new Error(
-        `Credential proxy provider "${provider}" is not configured for agent "${agentDef.name}".`
-      );
-    }
-
-    const budget = agentDef.constraints?.maxTokens ?? proxyConfig.defaultBudget;
-    const cacheKey = `${agentDef.name}:${provider}:${credentialId}:${budget ?? 'default'}`;
-    const cachedToken = this.proxyTokens.get(cacheKey);
-    if (cachedToken) {
-      return cachedToken;
-    }
-
-    const credentialProxy = await this.loadCredentialProxyModule();
-    if (!credentialProxy) {
-      throw new Error(
-        'Credential proxy mode requires the optional peer dependency "@agent-relay/credential-proxy".'
-      );
-    }
-
-    const nowSeconds = Math.floor(Date.now() / 1000);
-    const token = await credentialProxy.mintProxyToken(
-      {
-        sub: this.workspaceId,
-        aud: 'relay-llm-proxy',
-        provider,
-        credentialId,
-        budget,
-        exp: nowSeconds + 15 * 60,
-      },
-      this.resolveCredentialProxySecret(config)
-    );
-
-    this.proxyTokens.set(cacheKey, token);
-    return token;
-  }
-
-  private async resolveAgentProxyMode(
-    agentDef: AgentDefinition,
-    config?: RelayYamlConfig
-  ): Promise<ProxyModeConfig | undefined> {
-    if (!agentDef.credentials?.proxy) {
-      return undefined;
-    }
-
-    const env = this.getMergedRelayEnvSource();
-    const configuredProxyUrl = config?.swarm?.credentialProxy?.proxyUrl;
-    const proxyUrl = configuredProxyUrl ?? resolveProxyUrlFromEnv(env);
-    if (!proxyUrl) {
-      return undefined;
-    }
-
-    if (!configuredProxyUrl) {
-      const injectedToken = resolveProxyTokenFromEnv(env);
-      if (!injectedToken) {
-        return undefined;
-      }
-
-      return {
-        url: proxyUrl,
-        token: injectedToken,
-      };
-    }
-
-    const token = await this.mintAgentProxyToken(agentDef, config);
-    if (!token) {
-      return undefined;
-    }
-
-    return {
-      url: proxyUrl,
-      token,
-    };
-  }
-
-  private getMergedRelayEnvSource(): NodeJS.ProcessEnv {
-    return {
-      ...process.env,
-      ...(this.relayOptions.env ?? {}),
-      ...(this.relayApiKey ? { RELAY_API_KEY: this.relayApiKey } : {}),
-    };
-  }
-
-  private getRelayEnv(proxyMode?: ProxyModeConfig): NodeJS.ProcessEnv | undefined {
-    const env = this.getMergedRelayEnvSource();
-    const inheritedProxyUrl = resolveProxyUrlFromEnv(env);
-    const inheritedProxyToken = resolveProxyTokenFromEnv(env);
-
-    if (
-      !this.relayApiKey &&
-      !this.relayOptions.env &&
-      !proxyMode &&
-      !(inheritedProxyUrl && inheritedProxyToken)
-    ) {
-      return undefined;
-    }
-
-    const normalizedProxy =
-      proxyMode?.url && proxyMode.token
-        ? proxyMode
-        : inheritedProxyUrl && inheritedProxyToken
-          ? { url: inheritedProxyUrl, token: inheritedProxyToken }
-          : undefined;
-
-    if (normalizedProxy) {
-      Object.assign(env, buildNormalizedProxyEnv(normalizedProxy.url, normalizedProxy.token));
-      for (const key of getStrippedApiKeyVars()) {
-        delete env[key];
-      }
-    }
-
-    return env;
-  }
-
-  private async provisionAgents(config: RelayYamlConfig): Promise<void> {
-    // Cloud launcher already compiled and seeded relayfile ACLs before the
-    // sandbox started.  Skip in-sandbox provisioning — the relayfile API has
-    // no POST /v1/workspaces route, so attempting it causes a fatal 404.
-    if (process.env.RELAY_CLOUD_PROVISIONING_DONE === '1') {
-      return;
-    }
-
-    this.agentTokens.clear();
-    this.proxyTokens.clear();
-    await this.stopProvisionedMounts();
-
-    const agentsToProvision: Record<string, NonNullable<AgentDefinition['permissions']>> = {};
-    for (const agent of config.agents) {
-      if (agent.permissions) {
-        agentsToProvision[agent.name] = agent.permissions;
-      }
-    }
-
-    const agentNames = Object.keys(agentsToProvision);
-    if (agentNames.length === 0) {
-      return;
-    }
-
-    const relayEnv = {
-      ...process.env,
-      ...(this.getRelayEnv() ?? {}),
-    };
-    const tokenSigningKey = resolveWorkflowTokenSigningKey(relayEnv);
-    const result = await provisionWorkflowAgents({
-      tokenSigningKey,
-      workspace: this.workspaceId,
-      projectDir: this.cwd,
-      relayfileBaseUrl: relayEnv.RELAYFILE_BASE_URL ?? 'http://127.0.0.1:8080',
-      agents: agentsToProvision,
-      tokenTtlSeconds: 3600,
-    });
-
-    for (const [agentName, token] of result.tokens) {
-      this.agentTokens.set(agentName, token);
-    }
-    for (const [agentName, mount] of result.mounts) {
-      this.agentMounts.set(agentName, mount);
-    }
-
-    this.log(
-      `Provisioned workflow tokens for ${result.tokens.size} agent${result.tokens.size === 1 ? '' : 's'}`
-    );
-  }
-
-  private getRelaycastBaseUrl(): string {
-    return (
-      this.relayOptions.env?.RELAYCAST_BASE_URL ??
-      process.env.RELAYCAST_BASE_URL ??
-      'https://api.relaycast.dev'
-    );
-  }
-
-  private getRelaycastClient(): RelayCast {
-    if (!this.relayApiKey) {
-      throw new Error('No Relaycast API key available');
-    }
-    if (!this.relaycast) {
-      this.relaycast = new RelayCast({
-        apiKey: this.relayApiKey,
-        baseUrl: this.getRelaycastBaseUrl(),
-      });
-    }
-    return this.relaycast;
-  }
-
-  private async ensureRelaycastRunnerAgent(): Promise<AgentClient> {
-    if (this.relaycastAgent) return this.relaycastAgent;
-
-    const rc = this.getRelaycastClient();
-    let registration;
-    try {
-      registration = await rc.agents.register({ name: 'WorkflowRunner', type: 'agent' });
-    } catch (err) {
-      if (err instanceof RelayError && err.code === 'name_conflict') {
-        registration = await rc.agents.register({
-          name: `WorkflowRunner-${randomBytes(4).toString('hex')}`,
-          type: 'agent',
-        });
-      } else {
-        throw err;
-      }
-    }
-
-    this.relaycastAgent = rc.as(registration.token);
-    return this.relaycastAgent;
-  }
-
-  private async createAndJoinRelaycastChannel(channel: string, topic?: string): Promise<void> {
-    const agent = await this.ensureRelaycastRunnerAgent();
-    try {
-      await agent.channels.create({ name: channel, ...(topic ? { topic } : {}) });
-    } catch (err) {
-      if (!(err instanceof RelayError && err.code === 'name_conflict')) {
-        throw err;
-      }
-    }
-    await agent.channels.join(channel);
-  }
-
-  private async registerRelaycastExternalAgent(name: string, persona?: string): Promise<AgentClient | null> {
-    const rc = this.getRelaycastClient();
-    try {
-      const registration = await rc.agents.register({
-        name,
-        type: 'agent',
-        ...(persona ? { persona } : {}),
-      });
-      return rc.as(registration.token);
-    } catch (err) {
-      if (err instanceof RelayError && err.code === 'name_conflict') {
-        return null;
-      }
-      throw err;
-    }
-  }
-
-  private startRelaycastHeartbeat(agent: AgentClient, intervalMs = 30_000): () => void {
-    const beat = () => {
-      agent.heartbeat().catch(() => {});
-    };
-    const timer = setInterval(beat, intervalMs);
-    timer.unref();
-    beat();
-    return () => clearInterval(timer);
-  }
-
-  // ── Event subscription ──────────────────────────────────────────────────
-
-  on(listener: WorkflowEventListener): () => void {
-    this.listeners.push(listener);
-    return () => {
-      this.listeners = this.listeners.filter((l) => l !== listener);
-    };
-  }
-
-  private emit(event: WorkflowEvent): void {
-    for (const listener of this.listeners) {
-      listener(event);
-    }
-  }
-
-  // ── Parsing & validation ────────────────────────────────────────────────
-
-  /** Parse a relay.yaml file from disk. */
-  async parseYamlFile(filePath: string): Promise<RelayYamlConfig> {
-    const absPath = path.resolve(this.cwd, filePath);
-    const raw = await readFile(absPath, 'utf-8');
-    return this.parseYamlString(raw, absPath);
-  }
-
-  /** Parse a relay.yaml string. */
-  parseYamlString(raw: string, source = '<string>'): RelayYamlConfig {
-    const parsed = parseYaml(raw);
-    this.validateConfig(parsed, source);
-    const config = this.normalizeLegacyPermissionConfig(parsed as RelayYamlConfig);
-    config.agents ??= [];
-    return config;
-  }
-
-  private normalizeLegacyPermissionConfig(config: RelayYamlConfig): RelayYamlConfig {
-    const legacyPermissions = (
-      config as RelayYamlConfig & {
-        permissions?: { profiles?: RelayYamlConfig['permission_profiles'] };
-      }
-    ).permissions;
-
-    if (
-      config.permission_profiles === undefined &&
-      legacyPermissions &&
-      typeof legacyPermissions === 'object' &&
-      legacyPermissions.profiles &&
-      typeof legacyPermissions.profiles === 'object'
-    ) {
-      return {
-        ...config,
-        permission_profiles: legacyPermissions.profiles,
-      };
-    }
-
-    return config;
-  }
-
-  private applyReliabilityDefaults(config: RelayYamlConfig): RelayYamlConfig {
-    const existing = config.errorHandling;
-    if (existing?.strategy === 'fail-fast' || existing?.strategy === 'continue') {
-      return config;
-    }
-
-    const hasRepairAgentCandidate = (config.agents ?? []).length > 0;
-    const maxRetries =
-      existing?.maxRetries ??
-      existing?.repairRetries ??
-      (existing ? DEFAULT_WORKFLOW_MAX_RETRIES : DEFAULT_WORKFLOW_MAX_RETRIES);
-    const repairRetries =
-      existing?.repairRetries ??
-      (hasRepairAgentCandidate
-        ? (existing?.maxRetries ?? DEFAULT_WORKFLOW_REPAIR_RETRIES)
-        : existing?.repairRetries);
-
-    return {
-      ...config,
-      errorHandling: {
-        ...existing,
-        strategy: 'retry',
-        maxRetries,
-        retryDelayMs: existing?.retryDelayMs ?? DEFAULT_WORKFLOW_RETRY_DELAY_MS,
-        ...(repairRetries !== undefined ? { repairRetries } : {}),
-      },
-    };
-  }
-
-  /** Validate a config object against the RelayYamlConfig shape. */
-  validateConfig(config: unknown, source = '<config>'): asserts config is RelayYamlConfig {
-    if (typeof config !== 'object' || config === null) {
-      throw new Error(`${source}: config must be a non-null object`);
-    }
-
-    const c = config as Record<string, unknown>;
-
-    if (typeof c.version !== 'string') {
-      throw new Error(`${source}: missing required field "version"`);
-    }
-    if (typeof c.name !== 'string') {
-      throw new Error(`${source}: missing required field "name"`);
-    }
-    if (typeof c.swarm !== 'object' || c.swarm === null) {
-      throw new Error(`${source}: missing required field "swarm"`);
-    }
-    const swarm = c.swarm as Record<string, unknown>;
-    if (typeof swarm.pattern !== 'string') {
-      throw new Error(`${source}: missing required field "swarm.pattern"`);
-    }
-    if (c.agents !== undefined && !Array.isArray(c.agents)) {
-      throw new Error(`${source}: "agents" must be an array when provided`);
-    }
-    const legacyPermissions = c.permissions;
-    if (
-      legacyPermissions !== undefined &&
-      (typeof legacyPermissions !== 'object' ||
-        legacyPermissions === null ||
-        Array.isArray(legacyPermissions))
-    ) {
-      throw new Error(`${source}: "permissions" must be an object when provided`);
-    }
-    if (
-      c.permission_profiles !== undefined &&
-      (typeof c.permission_profiles !== 'object' ||
-        c.permission_profiles === null ||
-        Array.isArray(c.permission_profiles))
-    ) {
-      throw new Error(`${source}: "permission_profiles" must be an object when provided`);
-    }
-    if (
-      c.permission_profiles === undefined &&
-      legacyPermissions !== undefined &&
-      typeof legacyPermissions === 'object' &&
-      legacyPermissions !== null
-    ) {
-      const profiles = (legacyPermissions as Record<string, unknown>).profiles;
-      if (
-        profiles !== undefined &&
-        (typeof profiles !== 'object' || profiles === null || Array.isArray(profiles))
-      ) {
-        throw new Error(`${source}: "permissions.profiles" must be an object when provided`);
-      }
-    }
-
-    for (const agent of c.agents ?? []) {
-      if (typeof agent !== 'object' || agent === null) {
-        throw new Error(`${source}: each agent must be an object`);
-      }
-      const a = agent as Record<string, unknown>;
-      if (typeof a.name !== 'string') {
-        throw new Error(`${source}: each agent must have a string "name"`);
-      }
-      if (typeof a.cli !== 'string') {
-        throw new Error(`${source}: each agent must have a string "cli"`);
-      }
-    }
-
-    if (c.workflows !== undefined) {
-      if (!Array.isArray(c.workflows)) {
-        throw new Error(`${source}: "workflows" must be an array`);
-      }
-      for (const wf of c.workflows) {
-        this.validateWorkflow(wf, (c.agents ?? []) as AgentDefinition[], source);
-      }
-    }
-  }
-
-  // ── Dry-run simulation ──────────────────────────────────────────────
-
-  /**
-   * Validate a workflow config and simulate execution waves without spawning agents.
-   * Returns a DryRunReport with DAG analysis, agent summary, and wave breakdown.
-   */
-  dryRun(config: RelayYamlConfig, workflowName?: string, vars?: VariableContext): DryRunReport {
-    const errors: string[] = [];
-    const warnings: string[] = [];
-
-    // 1. Validate config
-    let resolved: RelayYamlConfig;
-    try {
-      this.validateConfig(config);
-      resolved = vars ? this.resolveVariables(config, vars) : config;
-      resolved = this.applyPermissionProfiles(resolved);
-    } catch (err) {
-      errors.push(err instanceof Error ? err.message : String(err));
-      return {
-        valid: false,
-        errors,
-        warnings,
-        name: (config as any)?.name ?? '<unknown>',
-        pattern: (config as any)?.swarm?.pattern ?? '<unknown>',
-        agents: [],
-        waves: [],
-        totalSteps: 0,
-        estimatedWaves: 0,
-      };
-    }
-
-    // 1b. Validate permissions and resolve named paths
-    const permissionResult = this.validatePermissions(resolved.agents, resolved.permission_profiles);
-    errors.push(...permissionResult.errors);
-    warnings.push(...permissionResult.warnings);
-
-    const pathResult = this.resolvePathDefinitions(resolved.paths, this.cwd);
-    errors.push(...pathResult.errors);
-    warnings.push(...pathResult.warnings);
-    const dryRunPaths = pathResult.resolved;
-
-    // Validate workdir references on agents
-    for (const agent of resolved.agents) {
-      if (agent.workdir && !dryRunPaths.has(agent.workdir)) {
-        errors.push(
-          `Agent "${agent.name}" references workdir "${agent.workdir}" which is not defined in paths`
-        );
-      }
-    }
-
-    // 2. Find target workflow
-    const workflows = resolved.workflows ?? [];
-    const workflow = workflowName ? workflows.find((w) => w.name === workflowName) : workflows[0];
-
-    if (!workflow) {
-      errors.push(
-        workflowName ? `Workflow "${workflowName}" not found in config` : 'No workflows defined in config'
-      );
-      return {
-        valid: false,
-        errors,
-        warnings,
-        name: resolved.name,
-        description: resolved.description,
-        pattern: resolved.swarm.pattern,
-        agents: [],
-        waves: [],
-        totalSteps: 0,
-        estimatedWaves: 0,
-      };
-    }
-
-    // 3. Load and validate custom steps
-    let customSteps = new Map<string, import('./types.js').CustomStepDefinition>();
-    try {
-      customSteps = loadCustomSteps(this.cwd);
-    } catch (err) {
-      if (err instanceof CustomStepsParseError) {
-        errors.push(`Custom steps file error: ${err.issue}\n${err.suggestion}`);
-      } else {
-        errors.push(`Failed to load custom steps: ${err instanceof Error ? err.message : String(err)}`);
-      }
-    }
-
-    // Validate custom step usage in workflow steps
-    const customStepValidation = validateCustomStepsUsage(workflow.steps, customSteps);
-    errors.push(...customStepValidation.errors);
-    warnings.push(...customStepValidation.warnings);
-
-    // Resolve custom steps for further validation
-    let resolvedSteps = workflow.steps;
-    if (customStepValidation.valid) {
-      try {
-        resolvedSteps = resolveAllCustomSteps(workflow.steps, customSteps);
-      } catch (err) {
-        if (err instanceof CustomStepResolutionError) {
-          errors.push(`${err.issue}\n${err.suggestion}`);
-        } else {
-          errors.push(`Failed to resolve custom steps: ${err instanceof Error ? err.message : String(err)}`);
-        }
-      }
-    }
-
-    // 4. Build agent map and validate step→agent references
-    const agentMap = new Map<string, AgentDefinition>();
-    for (const agent of resolved.agents) {
-      agentMap.set(agent.name, agent);
-    }
-
-    const stepAgentCounts = new Map<string, number>();
-    for (const step of resolvedSteps) {
-      // Only validate agent references for agent-type steps
-      if (step.agent) {
-        if (!agentMap.has(step.agent)) {
-          warnings.push(`Step "${step.name}" references unknown agent "${step.agent}"`);
-        }
-        stepAgentCounts.set(step.agent, (stepAgentCounts.get(step.agent) ?? 0) + 1);
-      }
-    }
-
-    // Validate workdir references on steps
-    for (const step of resolvedSteps) {
-      if (step.workdir && !dryRunPaths.has(step.workdir)) {
-        errors.push(`Step "${step.name}" references workdir "${step.workdir}" which is not defined in paths`);
-      }
-    }
-
-    // Validate cwd paths
-    for (const agent of resolved.agents) {
-      if (agent.cwd) {
-        const resolvedCwd = path.resolve(this.cwd, agent.cwd);
-        if (!existsSync(resolvedCwd)) {
-          warnings.push(
-            `Agent "${agent.name}" cwd "${agent.cwd}" resolves to "${resolvedCwd}" which does not exist`
-          );
-        }
-      }
-      if (agent.additionalPaths) {
-        for (const ap of agent.additionalPaths) {
-          const resolvedPath = path.resolve(this.cwd, ap);
-          if (!existsSync(resolvedPath)) {
-            warnings.push(
-              `Agent "${agent.name}" additionalPath "${ap}" resolves to "${resolvedPath}" which does not exist`
-            );
-          }
-        }
-      }
-    }
-
-    // Cycle detection via topological sort
-    const stepNames = new Set(resolvedSteps.map((s) => s.name));
-    const inDegree = new Map<string, number>();
-    const adjacency = new Map<string, string[]>();
-    for (const step of resolvedSteps) {
-      inDegree.set(step.name, 0);
-      adjacency.set(step.name, []);
-    }
-    for (const step of resolvedSteps) {
-      for (const dep of step.dependsOn ?? []) {
-        if (stepNames.has(dep)) {
-          adjacency.get(dep)!.push(step.name);
-          inDegree.set(step.name, (inDegree.get(step.name) ?? 0) + 1);
-        }
-      }
-    }
-    const topoQueue: string[] = [];
-    for (const [name, deg] of inDegree) {
-      if (deg === 0) topoQueue.push(name);
-    }
-    let visited = 0;
-    while (topoQueue.length > 0) {
-      const node = topoQueue.shift()!;
-      visited++;
-      for (const neighbor of adjacency.get(node) ?? []) {
-        const newDeg = (inDegree.get(neighbor) ?? 1) - 1;
-        inDegree.set(neighbor, newDeg);
-        if (newDeg === 0) topoQueue.push(neighbor);
-      }
-    }
-    if (visited < resolvedSteps.length) {
-      errors.push(
-        'Dependency cycle detected in workflow steps. Check dependsOn references for circular dependencies.'
-      );
-    }
-
-    // Missing dependency references
-    for (const step of resolvedSteps) {
-      for (const dep of step.dependsOn ?? []) {
-        if (!stepNames.has(dep)) {
-          errors.push(`Step "${step.name}" depends on unknown step "${dep}"`);
-        }
-      }
-    }
-
-    // Unreachable steps (steps that are never depended on and aren't root steps)
-    const dependedOn = new Set<string>();
-    for (const step of resolvedSteps) {
-      for (const dep of step.dependsOn ?? []) {
-        dependedOn.add(dep);
-      }
-    }
-
-    // Timeout warnings
-    for (const step of resolvedSteps) {
-      if (!step.timeoutMs) {
-        const agentDef = step.agent ? agentMap.get(step.agent) : undefined;
-        if (!agentDef?.constraints?.timeoutMs && !resolved.swarm.timeoutMs) {
-          warnings.push(
-            `Step "${step.name}" has no timeout configured (no step, agent, or swarm-level timeout)`
-          );
-        }
-      }
-    }
-
-    // Large dependency fan-in warning (decomposition guidance)
-    for (const step of resolvedSteps) {
-      if ((step.dependsOn?.length ?? 0) >= 5) {
-        warnings.push(
-          `Step "${step.name}" depends on ${step.dependsOn!.length} upstream steps. ` +
-            `Consider decomposing into smaller verification steps to reduce context size.`
-        );
-      }
-    }
-
-    const permissions = resolved.agents.map((agent) => {
-      const compiled = resolveAgentPermissions(agent.name, agent.permissions, this.cwd, this.workspaceId);
-      const source: NonNullable<DryRunReport['permissions']>[number]['source'] = compiled.sources.some(
-        (entry) => entry.type === 'yaml'
-      )
-        ? 'yaml'
-        : compiled.sources.some((entry) => entry.type === 'preset')
-          ? 'preset'
-          : compiled.sources.some((entry) => entry.type === 'dotfile')
-            ? 'dotfiles'
-            : 'none';
-
-      return {
-        agent: agent.name,
-        access: compiled.effectiveAccess,
-        readPaths: compiled.summary.readonly,
-        writePaths: compiled.summary.readwrite,
-        denyPaths: compiled.summary.denied,
-        scopes: compiled.scopes.length,
-        source,
-      };
-    });
-
-    // 4. Build agent summary
-    const agents = resolved.agents.map((a) => ({
-      name: a.name,
-      cli: a.cli,
-      role: a.role,
-      cwd: a.workdir ? dryRunPaths.get(a.workdir) : a.cwd,
-      stepCount: stepAgentCounts.get(a.name) ?? 0,
-    }));
-
-    // 5. Simulate execution waves
-    const waves: DryRunWave[] = [];
-    const completed = new Set<string>();
-    const allSteps = [...resolvedSteps];
-    let waveNum = 0;
-
-    while (completed.size < allSteps.length) {
-      const ready = allSteps.filter((step) => {
-        if (completed.has(step.name)) return false;
-        const deps = step.dependsOn ?? [];
-        return deps.every((dep) => completed.has(dep));
-      });
-
-      if (ready.length === 0) {
-        // Remaining steps are blocked — likely a cycle or unresolvable deps
-        const blocked = allSteps.filter((s) => !completed.has(s.name)).map((s) => s.name);
-        errors.push(`Blocked steps with unresolvable dependencies: ${blocked.join(', ')}`);
-        break;
-      }
-
-      waveNum++;
-      waves.push({
-        wave: waveNum,
-        steps: ready.map((s) => ({
-          name: s.name,
-          agent: s.agent,
-          dependsOn: s.dependsOn ?? [],
-        })),
-      });
-
-      for (const step of ready) {
-        completed.add(step.name);
-      }
-    }
-
-    // 6. Resource estimation
-    const peakConcurrency = Math.max(...waves.map((w) => w.steps.length), 0);
-    const totalAgentSteps = resolvedSteps.filter(
-      (s) => s.type !== 'deterministic' && s.type !== 'worktree' && s.type !== 'integration'
-    ).length;
-
-    // 7. Check maxConcurrency against wave widths
-    const maxConcurrency = resolved.swarm.maxConcurrency;
-    if (maxConcurrency !== undefined) {
-      for (const wave of waves) {
-        if (wave.steps.length > maxConcurrency) {
-          warnings.push(
-            `Wave ${wave.wave} has ${wave.steps.length} parallel steps but maxConcurrency is ${maxConcurrency}`
-          );
-        }
-      }
-    }
-
-    return {
-      valid: errors.length === 0,
-      errors,
-      warnings,
-      name: workflow.name,
-      description: workflow.description ?? resolved.description,
-      pattern: resolved.swarm.pattern,
-      agents,
-      permissions,
-      waves,
-      totalSteps: workflow.steps.length,
-      maxConcurrency,
-      estimatedWaves: waves.length,
-      estimatedPeakConcurrency: peakConcurrency,
-      estimatedTotalAgentSteps: totalAgentSteps,
-    };
-  }
-
-  private validateWorkflow(wf: unknown, agents: AgentDefinition[], source: string): void {
-    if (typeof wf !== 'object' || wf === null) {
-      throw new Error(`${source}: each workflow must be an object`);
-    }
-    const w = wf as Record<string, unknown>;
-    if (typeof w.name !== 'string') {
-      throw new Error(`${source}: each workflow must have a string "name"`);
-    }
-    if (!Array.isArray(w.steps) || w.steps.length === 0) {
-      throw new Error(`${source}: workflow "${w.name}" must have a non-empty "steps" array`);
-    }
-    for (const step of w.steps) {
-      if (typeof step !== 'object' || step === null) {
-        throw new Error(`${source}: each step must be an object`);
-      }
-      const s = step as Record<string, unknown>;
-      if (typeof s.name !== 'string') {
-        throw new Error(`${source}: each step must have a string "name" field`);
-      }
-
-      // Deterministic steps require type and command
-      if (s.type === 'deterministic') {
-        if (typeof s.command !== 'string') {
-          throw new Error(`${source}: deterministic step "${s.name}" must have a "command" field`);
-        }
-      } else if (s.type === 'worktree') {
-        if (typeof s.branch !== 'string' || s.branch.trim().length === 0) {
-          throw new Error(`${source}: worktree step "${s.name}" must have a "branch" string field`);
-        }
-      } else if (s.type === 'integration') {
-        // Integration steps require integration and action
-        if (typeof s.integration !== 'string') {
-          throw new Error(`${source}: integration step "${s.name}" must have an "integration" string field`);
-        }
-        if (typeof s.action !== 'string') {
-          throw new Error(`${source}: integration step "${s.name}" must have an "action" string field`);
-        }
-      } else {
-        // Agent steps (type undefined or 'agent') require agent and task
-        if (typeof s.agent !== 'string' || typeof s.task !== 'string') {
-          throw new Error(`${source}: agent step "${s.name}" must have "agent" and "task" string fields`);
-        }
-      }
-    }
-
-    // Validate DAG: check for unknown dependencies and cycles
-    const stepNames = new Set((w.steps as WorkflowStep[]).map((s) => s.name));
-    for (const step of w.steps as WorkflowStep[]) {
-      if (step.dependsOn) {
-        for (const dep of step.dependsOn) {
-          if (!stepNames.has(dep)) {
-            throw new Error(`${source}: step "${step.name}" depends on unknown step "${dep}"`);
-          }
-        }
-      }
-    }
-    this.detectCycles(w.steps as WorkflowStep[], source, w.name as string);
-    this.detectLeadWorkerDeadlock(w.steps as WorkflowStep[], agents, source, w.name as string);
-
-    // Warn if non-interactive agent task is excessively large before interpolation
-    for (const step of w.steps as WorkflowStep[]) {
-      if (step.type === 'deterministic' || step.type === 'worktree' || step.type === 'integration') continue;
-      const agentDef = agents.find((a) => a.name === step.agent);
-      const isNonInteractive =
-        agentDef?.interactive === false || ['worker', 'reviewer', 'analyst'].includes(agentDef?.preset ?? '');
-      if (isNonInteractive && (step.task ?? '').length > 10_000) {
-        console.warn(
-          `[WorkflowRunner] Warning: non-interactive step "${step.name}" has a very large task (${step.task!.length} chars). ` +
-            `Consider pre-reading files in a deterministic step and injecting only the relevant excerpt.`
-        );
-      }
-    }
-  }
-
-  private detectCycles(steps: WorkflowStep[], source: string, workflowName: string): void {
-    const adj = new Map<string, string[]>();
-    for (const step of steps) {
-      adj.set(step.name, step.dependsOn ?? []);
-    }
-
-    const visited = new Set<string>();
-    const inStack = new Set<string>();
-
-    const dfs = (node: string): void => {
-      if (inStack.has(node)) {
-        throw new Error(
-          `${source}: workflow "${workflowName}" contains a dependency cycle involving "${node}"`
-        );
-      }
-      if (visited.has(node)) return;
-      inStack.add(node);
-      for (const dep of adj.get(node) ?? []) {
-        dfs(dep);
-      }
-      inStack.delete(node);
-      visited.add(node);
-    };
-
-    for (const step of steps) {
-      dfs(step.name);
-    }
-  }
-
-  private detectLeadWorkerDeadlock(
-    steps: WorkflowStep[],
-    agents: AgentDefinition[],
-    source: string,
-    workflowName: string
-  ): void {
-    // Build a map of step name → steps that depend on it
-    const downstreamOf = new Map<string, string[]>();
-    for (const step of steps) {
-      for (const dep of step.dependsOn ?? []) {
-        if (!downstreamOf.has(dep)) downstreamOf.set(dep, []);
-        downstreamOf.get(dep)!.push(step.name);
-      }
-    }
-
-    for (const step of steps) {
-      // Only check interactive agent steps (leads)
-      if (step.type === 'deterministic' || step.type === 'worktree' || step.type === 'integration') continue;
-      const agentDef = agents.find((a) => a.name === step.agent);
-      // Skip non-interactive agents — they can't wait for channel signals
-      if (
-        agentDef?.interactive === false ||
-        agentDef?.preset === 'worker' ||
-        agentDef?.preset === 'reviewer' ||
-        agentDef?.preset === 'analyst'
-      )
-        continue;
-
-      const downstream = downstreamOf.get(step.name) ?? [];
-      if (downstream.length === 0) continue;
-
-      // Check if the task mentions downstream step names in a "waiting" context
-      const task = step.task ?? '';
-      const waitingKeywords = /\b(wait|waiting|monitor|check inbox|check.*channel|DONE|_DONE|signal)\b/i;
-      if (!waitingKeywords.test(task)) continue;
-
-      // Check if any downstream step name appears in the task
-      const mentioned = downstream.filter((name) => task.includes(name));
-      if (mentioned.length > 0) {
-        throw new Error(
-          `${source}: workflow "${workflowName}" likely has a lead\u2194worker deadlock. ` +
-            `Step "${step.name}" (interactive lead) mentions downstream step(s) [${mentioned.join(', ')}] in its task ` +
-            `and appears to wait for their signals, but those steps can't start until "${step.name}" completes. ` +
-            `Fix: make workers depend on a shared upstream step (e.g. "context"), not on the lead step. ` +
-            `See tests/workflows/README.md rule #6.`
-        );
-      }
-    }
-  }
-
-  // ── Template variable resolution ────────────────────────────────────────
-
-  /** Resolve {{variable}} placeholders in all task strings. */
-  resolveVariables(config: RelayYamlConfig, vars: VariableContext): RelayYamlConfig {
-    return this.templateResolver.resolveVariables(config, vars);
-  }
-
-  private interpolate(template: string, vars: VariableContext): string {
-    return resolveTemplate(template, vars);
-  }
-
-  private resolveDotPath(key: string, vars: VariableContext): string | number | boolean | undefined {
-    return resolveTemplateDotPath(key, vars);
-  }
-
-  /** Build a nested context from completed step outputs for {{steps.X.output}} resolution. */
-  private buildStepOutputContext(stepStates: Map<string, StepState>, runId?: string): VariableContext {
-    const steps: Record<string, { output: string }> = {};
-    for (const [name, state] of stepStates) {
-      if (state.row.status === 'completed' && state.row.output !== undefined) {
-        steps[name] = { output: state.row.output };
-      } else if (state.row.status === 'completed' && runId) {
-        // Recover from persisted output on disk (e.g., after restart)
-        const persisted = this.loadStepOutput(runId, name);
-        if (persisted) {
-          state.row.output = persisted;
-          steps[name] = { output: persisted };
-        }
-      }
-    }
-    return { steps } as unknown as VariableContext;
-  }
-
-  /** Interpolate step-output variables, silently skipping unresolved ones (they may be user vars). */
-  private interpolateStepTask(template: string, context: VariableContext): string {
-    return interpolateStepTaskTemplate(template, context);
-  }
-
-  private createStepLifecycleExecutor(
-    workflow: WorkflowDefinition,
-    stepStates: Map<string, StepState>,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling: ErrorHandlingConfig | undefined,
-    runId: string
-  ): WorkflowStepLifecycleExecutor<StepState> {
-    // eslint-disable-next-line prefer-const -- circular: deps closure captures lifecycle before assignment
-    let lifecycle!: WorkflowStepLifecycleExecutor<StepState>;
-    const deps: WorkflowStepLifecycleExecutorDeps<StepState> = {
-      cwd: this.cwd,
-      runId,
-      templateResolver: this.templateResolver,
-      channelMessenger: this.channelMessenger,
-      verificationRunner: (check, output, stepName, injectedTaskText, options) =>
-        this.runVerification(check, output, stepName, injectedTaskText, options),
-      postToChannel: (text) => this.postToChannel(text),
-      persistStepRow: async (stepId, patch) => this.db.updateStep(stepId, patch),
-      persistStepOutput: async (lifecycleRunId, stepName, output) =>
-        this.persistStepOutput(lifecycleRunId, stepName, output),
-      loadStepOutput: (lifecycleRunId, stepName) => this.loadStepOutput(lifecycleRunId, stepName),
-      checkAborted: () => this.checkAborted(),
-      waitIfPaused: () => this.waitIfPaused(),
-      log: (message) => this.log(message),
-      onStepStarted: async (step) => {
-        this.emit({ type: 'step:started', runId, stepName: step.name });
-      },
-      onStepCompleted: async (step, state, result) => {
-        this.emit({
-          type: 'step:completed',
-          runId,
-          stepName: step.name,
-          output: result.output,
-          exitCode: result.exitCode,
-          exitSignal: result.exitSignal,
-        });
-        this.finalizeStepEvidence(step.name, result.status, state.row.completedAt, result.completionReason);
-      },
-      onStepFailed: async (step, state, result) => {
-        this.captureStepTerminalEvidence(
-          step.name,
-          {},
-          {
-            exitCode: result.exitCode,
-            exitSignal: result.exitSignal,
-          }
-        );
-        this.emit({
-          type: 'step:failed',
-          runId,
-          stepName: step.name,
-          error: result.error ?? 'Unknown error',
-          exitCode: result.exitCode,
-          exitSignal: result.exitSignal,
-        });
-        this.finalizeStepEvidence(step.name, 'failed', state.row.completedAt, result.completionReason);
-      },
-      executeStep: async (step, state) => {
-        await this.executeStep(step, state, stepStates, agentMap, errorHandling, runId, lifecycle);
-        return {
-          status: state.row.status,
-          output: state.row.output ?? '',
-          completionReason: state.row.completionReason,
-          retries: state.row.retryCount,
-          error: state.row.error,
-        };
-      },
-      onBeginTrack: async (steps) => {
-        if (steps.length > 1 && this.trajectory) {
-          await this.trajectory.beginTrack(steps.map((step) => step.name).join(', '));
-        }
-      },
-      onConverge: async (readySteps, batchOutcomes) => {
-        if (readySteps.length <= 1 || !this.trajectory?.shouldReflectOnConverge()) {
-          return;
-        }
-
-        const completedNames = new Set(
-          batchOutcomes.filter((outcome) => outcome.status === 'completed').map((outcome) => outcome.name)
-        );
-        const unblocked = workflow.steps
-          .filter((step) => step.dependsOn?.some((dependency) => completedNames.has(dependency)))
-          .filter((step) => stepStates.get(step.name)?.row.status === 'pending')
-          .map((step) => step.name);
-
-        await this.trajectory.synthesizeAndReflect(
-          readySteps.map((step) => step.name).join(' + '),
-          batchOutcomes,
-          unblocked.length > 0 ? unblocked : undefined
-        );
-      },
-      markDownstreamSkipped: async (failedStepName) =>
-        this.markDownstreamSkipped(failedStepName, workflow.steps, stepStates, runId),
-      buildCompletionMode: (stepName, completionReason) =>
-        completionReason ? this.buildStepCompletionDecision(stepName, completionReason)?.mode : undefined,
-    };
-
-    lifecycle = new WorkflowStepLifecycleExecutor<StepState>(deps);
-    return lifecycle;
-  }
-
-  // ── Execution ───────────────────────────────────────────────────────────
-
-  /** Execute a named workflow from a validated config. */
-  async execute(
-    config: RelayYamlConfig,
-    workflowName?: string,
-    vars?: VariableContext,
-    executeOptions?: WorkflowExecuteOptions
-  ): Promise<WorkflowRunRow> {
-    // Set up abort controller early so callers can abort() even during setup
-    this.abortController = new AbortController();
-    this.paused = false;
-
-    const resolved = this.applyPermissionProfiles(vars ? this.resolveVariables(config, vars) : config);
-
-    // Validate config (catches cycles, missing deps, invalid steps, etc.)
-    this.validateConfig(resolved);
-    const runtimeConfig = this.applyReliabilityDefaults(resolved);
-
-    const permissionResult = this.validatePermissions(
-      runtimeConfig.agents,
-      runtimeConfig.permission_profiles
-    );
-    if (permissionResult.errors.length > 0) {
-      throw new Error(`Permission validation failed:\n  ${permissionResult.errors.join('\n  ')}`);
-    }
-    for (const warning of permissionResult.warnings) {
-      console.warn(`[WorkflowRunner] Warning: ${warning}`);
-    }
-
-    // Resolve and validate named paths from the top-level `paths` config
-    const pathResult = this.resolvePathDefinitions(runtimeConfig.paths, this.cwd);
-    if (pathResult.errors.length > 0) {
-      throw new Error(`Path validation failed:\n  ${pathResult.errors.join('\n  ')}`);
-    }
-    this.resolvedPaths = pathResult.resolved;
-    if (this.resolvedPaths.size > 0) {
-      for (const [name, abs] of this.resolvedPaths) {
-        console.log(`[workflow] path "${name}" → ${abs}`);
-      }
-    }
-
-    const workflows = runtimeConfig.workflows ?? [];
-
-    const workflow = workflowName ? workflows.find((w) => w.name === workflowName) : workflows[0];
-
-    if (!workflow) {
-      throw new Error(
-        workflowName ? `Workflow "${workflowName}" not found in config` : 'No workflows defined in config'
-      );
-    }
-
-    // Load and resolve custom step definitions
-    const customSteps = loadCustomSteps(this.cwd);
-    const resolvedSteps = resolveAllCustomSteps(workflow.steps, customSteps);
-    const resolvedWorkflow = { ...workflow, steps: resolvedSteps };
-
-    const runId = this.generateId();
-    const now = new Date().toISOString();
-
-    const run: WorkflowRunRow = {
-      id: runId,
-      workspaceId: this.workspaceId,
-      workflowName: resolvedWorkflow.name,
-      pattern: runtimeConfig.swarm.pattern,
-      status: 'pending',
-      config: runtimeConfig,
-      startedAt: now,
-      createdAt: now,
-      updatedAt: now,
-    };
-
-    await this.db.insertRun(run);
-    this.persistRunIdHint(runId);
-
-    // Build step rows
-    const stepStates = new Map<string, StepState>();
-    for (const step of resolvedWorkflow.steps) {
-      // Handle agent, deterministic, worktree, and integration steps
-      const isNonAgent =
-        step.type === 'deterministic' || step.type === 'worktree' || step.type === 'integration';
-
-      const stepRow: WorkflowStepRow = {
-        id: this.generateId(),
-        runId,
-        stepName: step.name,
-        agentName: isNonAgent ? null : (step.agent ?? null),
-        stepType: isNonAgent ? (step.type as 'deterministic' | 'worktree' | 'integration') : 'agent',
-        status: 'pending',
-        task:
-          step.type === 'deterministic'
-            ? (step.command ?? '')
-            : step.type === 'worktree'
-              ? (step.branch ?? '')
-              : step.type === 'integration'
-                ? `${step.integration}.${step.action}`
-                : (step.task ?? ''),
-        dependsOn: step.dependsOn ?? [],
-        retryCount: 0,
-        createdAt: now,
-        updatedAt: now,
-      };
-      await this.db.insertStep(stepRow);
-      stepStates.set(step.name, { row: stepRow });
-    }
-
-    // Handle startFrom: skip all transitive dependencies of the target step
-    if (executeOptions?.startFrom) {
-      const startFromName = executeOptions.startFrom;
-      const stepNames = new Set(resolvedWorkflow.steps.map((s) => s.name));
-      if (!stepNames.has(startFromName)) {
-        throw new Error(
-          `startFrom step "${startFromName}" not found in workflow. Available steps: ${[...stepNames].join(', ')}`
-        );
-      }
-
-      const transitiveDeps = this.collectTransitiveDeps(startFromName, resolvedWorkflow.steps);
-      const skippedCount = transitiveDeps.size;
-
-      // Determine which run ID to load cached outputs from
-      const cacheRunId = executeOptions.previousRunId ?? this.findMostRecentRunWithSteps(transitiveDeps);
-
-      for (const depName of transitiveDeps) {
-        const state = stepStates.get(depName);
-        if (!state) continue;
-
-        // Load cached output from a previous run if available
-        const cachedOutput = cacheRunId ? this.loadStepOutput(cacheRunId, depName) : undefined;
-        if (!cachedOutput) {
-          this.log(`[startFrom] No cached output for skipped step "${depName}" — using empty string`);
-        }
-
-        state.row.status = 'completed';
-        state.row.output = cachedOutput ?? '';
-        state.row.completedAt = now;
-        await this.db.updateStep(state.row.id, {
-          status: 'completed',
-          output: state.row.output,
-          completedAt: now,
-          updatedAt: now,
-        });
-      }
-
-      if (skippedCount > 0) {
-        this.log(`[startFrom] Skipping ${skippedCount} steps, starting from "${startFromName}"`);
-      }
-    }
-
-    return this.runWorkflowCore({
-      run,
-      workflow: resolvedWorkflow,
-      config: runtimeConfig,
-      stepStates,
-      isResume: false,
-    });
-  }
-
-  /** Resume a previously paused or partially completed run. */
-  async resume(runId: string, vars?: VariableContext, config?: RelayYamlConfig): Promise<WorkflowRunRow> {
-    // Set up abort controller early so callers can abort() even during setup
-    this.abortController = new AbortController();
-    this.paused = false;
-
-    let run = await this.db.getRun(runId);
-    let stepStates = new Map<string, StepState>();
-    if (!run) {
-      const reconstructed = this.reconstructRunFromCache(runId, config);
-      if (!reconstructed) {
-        throw new Error(`Run "${runId}" not found (no database entry or cached step outputs)`);
-      }
-      this.log('[resume] Reconstructing run from cached step outputs (workflow-runs.jsonl missing)');
-      run = reconstructed.run;
-      stepStates = reconstructed.stepStates;
-      await this.db.insertRun(run);
-      for (const [, state] of stepStates) {
-        await this.db.insertStep(state.row);
-      }
-    }
-    this.persistRunIdHint(runId);
-
-    if (run.status !== 'running' && run.status !== 'failed') {
-      throw new Error(`Run "${runId}" is in status "${run.status}" and cannot be resumed`);
-    }
-
-    const resolvedConfig = this.applyReliabilityDefaults(
-      vars ? this.resolveVariables(run.config, vars) : run.config
-    );
-
-    // Resolve path definitions (same as execute()) so workdir lookups work on resume
-    const pathResult = this.resolvePathDefinitions(resolvedConfig.paths, this.cwd);
-    if (pathResult.errors.length > 0) {
-      throw new Error(`Path validation failed:\n  ${pathResult.errors.join('\n  ')}`);
-    }
-    this.resolvedPaths = pathResult.resolved;
-
-    const workflows = resolvedConfig.workflows ?? [];
-    const workflow = workflows.find((w) => w.name === run.workflowName);
-    if (!workflow) {
-      throw new Error(`Workflow "${run.workflowName}" not found in stored config`);
-    }
-
-    if (stepStates.size === 0) {
-      const existingSteps = await this.db.getStepsByRunId(runId);
-      for (const stepRow of existingSteps) {
-        stepStates.set(stepRow.stepName, { row: stepRow });
-      }
-    }
-
-    // Reset failed steps to pending for retry
-    for (const [, state] of stepStates) {
-      if (state.row.status === 'failed') {
-        state.row.status = 'pending';
-        state.row.error = undefined;
-        state.row.completionReason = undefined;
-        await this.db.updateStep(state.row.id, {
-          status: 'pending',
-          error: undefined,
-          completionReason: undefined,
-          updatedAt: new Date().toISOString(),
-        });
-      }
-    }
-
-    return this.runWorkflowCore({
-      run,
-      workflow,
-      config: resolvedConfig,
-      stepStates,
-      isResume: true,
-    });
-  }
-
-  private async runWorkflowCore(input: {
-    run: WorkflowRunRow;
-    workflow: WorkflowDefinition;
-    config: RelayYamlConfig;
-    stepStates: Map<string, StepState>;
-    isResume: boolean;
-  }): Promise<WorkflowRunRow> {
-    const { run, workflow, config, stepStates, isResume } = input;
-    const runId = run.id;
-
-    // Start execution (abortController already set by execute()/resume())
-    this.currentConfig = config;
-    this.currentRunId = runId;
-    this.runStartTime = Date.now();
-    this.runtimeStepAgents.clear();
-    this.stepCompletionEvidence.clear();
-    this.agentReports.clear();
-    this.initializeBudgetTracker(config, workflow);
-
-    this.log(`Starting workflow "${workflow.name}" (${workflow.steps.length} steps)`);
-
-    // Initialize trajectory recording
-    this.trajectory = new WorkflowTrajectory(config.trajectories, runId, this.cwd);
-
-    try {
-      await this.updateRunStatus(runId, 'running');
-      if (!isResume) {
-        this.emit({ type: 'run:started', runId });
-      }
-
-      const pendingCount = [...stepStates.values()].filter((s) => s.row.status === 'pending').length;
-      if (isResume) {
-        await this.trajectory.start(
-          workflow.name,
-          workflow.steps.length,
-          `Resumed run: ${pendingCount} pending steps of ${workflow.steps.length} total`,
-          config.description,
-          config.swarm.pattern
-        );
-      } else {
-        // Analyze DAG for trajectory context on first run
-        const dagInfo = this.analyzeDAG(workflow.steps);
-        await this.trajectory.start(
-          workflow.name,
-          workflow.steps.length,
-          dagInfo,
-          config.description,
-          config.swarm.pattern
-        );
-      }
-
-      const channel =
-        config.swarm.channel ??
-        `wf-${this.sanitizeChannelName(config.name || run.workflowName)}-${this.generateShortId()}`;
-      this.channel = channel;
-      if (!config.swarm.channel) {
-        config.swarm.channel = channel;
-        await this.db.updateRun(runId, { config });
-      }
-      const relaycastDisabled = this.relayOptions.env?.AGENT_RELAY_WORKFLOW_DISABLE_RELAYCAST === '1';
-      const requiresBroker =
-        !this.executor &&
-        workflow.steps.some(
-          (step) => step.type !== 'deterministic' && step.type !== 'worktree' && step.type !== 'integration'
-        );
-      // Skip broker/relay init when an external executor handles agent spawning
-      if (requiresBroker) {
-        if (!relaycastDisabled) {
-          this.log('Resolving Relaycast API key...');
-          await this.ensureRelaycastApiKey(channel);
-          this.log('API key resolved');
-          if (this.relayApiKeyAutoCreated && this.relayApiKey) {
-            this.log(`Workspace created — follow this run in Relaycast:`);
-            this.log(`  Observer: https://agentrelay.com/observer?key=${this.relayApiKey}`);
-            this.log(`  Channel: ${channel}`);
-          }
-        }
-
-        this.log('Starting broker...');
-        // Include a short run ID suffix in the broker name so each workflow execution
-        // registers a unique identity in Relaycast. Without this, re-running in the same
-        // workspace hits a 409 conflict because the previous run's agent is still registered.
-        const brokerBaseName = path.basename(this.cwd) || 'workflow';
-        const brokerName = `${brokerBaseName}-${runId.slice(0, 8)}`;
-        this.relay = new AgentRelay({
-          ...this.relayOptions,
-          brokerName,
-          channels: relaycastDisabled ? [] : [channel],
-          env: this.getRelayEnv(),
-          // Workflows spawn agents across multiple waves; each spawn requires a PTY +
-          // Relaycast registration. 60s is too tight when the broker is saturated with
-          // long-running PTY processes from earlier steps. 120s gives room to breathe.
-          requestTimeoutMs: this.relayOptions.requestTimeoutMs ?? 120_000,
-        });
-
-        // Wire PTY output dispatcher — routes chunks to per-agent listeners + activity logging
-        this.unsubRelayListeners.push(
-          this.relay.addListener('workerOutput', ({ name, chunk }) => {
-            const listener = this.ptyListeners.get(name);
-            if (listener) listener(chunk);
-
-            // Parse PTY output for high-signal activity
-            const stripped = WorkflowRunner.stripAnsi(chunk);
-            const shortName = name.replace(/-[a-f0-9]{6,}$/, '');
-            let activity: string | undefined;
-            if (/Read\(/.test(stripped)) {
-              // Extract filename — path may be truncated at chunk boundary so require
-              // at least a dir separator or 8+ chars to trust the basename.
-              const m = stripped.match(/Read\(\s*~?([^\s)"']{8,})/);
-              if (m) {
-                const base = path.basename(m[1]);
-                activity = base.length >= 3 ? `Reading ${base}` : 'Reading file...';
-              } else {
-                activity = 'Reading file...';
-              }
-            } else if (/Edit\(/.test(stripped)) {
-              const m = stripped.match(/Edit\(\s*~?([^\s)"']{8,})/);
-              if (m) {
-                const base = path.basename(m[1]);
-                activity = base.length >= 3 ? `Editing ${base}` : 'Editing file...';
-              } else {
-                activity = 'Editing file...';
-              }
-            } else if (/Bash\(/.test(stripped)) {
-              // Extract a short preview of the command
-              const m = stripped.match(/Bash\(\s*(.{1,40})/);
-              activity = m ? `Running: ${m[1].trim()}...` : 'Running command...';
-            } else if (/Explore\(/.test(stripped)) {
-              const m = stripped.match(/Explore\(\s*(.{1,50})/);
-              activity = m ? `Exploring: ${m[1].replace(/\).*/, '').trim()}` : 'Exploring codebase...';
-            } else if (/Task\(/.test(stripped)) {
-              activity = 'Running sub-agent...';
-            } else if (/Sublimating|Thinking|Coalescing|Cultivating/.test(stripped)) {
-              const m = stripped.match(/(\d+)s/);
-              activity = m ? `Thinking... (${m[1]}s)` : 'Thinking...';
-            }
-            if (activity && this.lastActivity.get(name) !== activity) {
-              this.lastActivity.set(name, activity);
-              this.log(`[${shortName}] ${activity}`);
-            }
-          })
-        );
-
-        // Wire relay event hooks for rich console logging
-        this.unsubRelayListeners.push(
-          this.relay.addListener('messageReceived', (msg) => {
-            this.emit({
-              type: 'broker:event',
-              runId,
-              event: {
-                kind: 'relay_inbound',
-                event_id: msg.eventId,
-                from: msg.from,
-                target: msg.to,
-                body: msg.text,
-                thread_id: msg.threadId,
-              } as BrokerEvent,
-            });
-            const body = msg.text.length > 120 ? msg.text.slice(0, 117) + '...' : msg.text;
-            const fromShort = msg.from.replace(/-[a-f0-9]{6,}$/, '');
-            const toShort = msg.to.replace(/-[a-f0-9]{6,}$/, '');
-            this.log(`[msg] ${fromShort} → ${toShort}: ${body}`);
-
-            if (this.channel && (msg.to === this.channel || msg.to === `#${this.channel}`)) {
-              const runtimeAgent = this.runtimeStepAgents.get(msg.from);
-              this.recordChannelEvidence(msg.text, {
-                sender: runtimeAgent?.logicalName ?? msg.from,
-                actor: msg.from,
-                role: runtimeAgent?.role,
-                target: msg.to,
-                origin: 'relay_message',
-                stepName: runtimeAgent?.stepName,
-              });
-            }
-
-            const supervision = this.supervisedRuntimeAgents.get(msg.from);
-            if (supervision?.role === 'owner') {
-              this.recordStepToolSideEffect(supervision.stepName, {
-                type: 'owner_monitoring',
-                detail: `Owner messaged ${msg.to}: ${msg.text.slice(0, 120)}`,
-                raw: { to: msg.to, text: msg.text },
-              });
-              void this.trajectory?.ownerMonitoringEvent(
-                supervision.stepName,
-                supervision.logicalName,
-                `Messaged ${msg.to}: ${msg.text.slice(0, 120)}`,
-                { to: msg.to, text: msg.text }
-              );
-            }
-          })
-        );
-
-        this.unsubRelayListeners.push(
-          this.relay.addListener('agentSpawned', (agent) => {
-            this.emit({
-              type: 'broker:event',
-              runId,
-              event: {
-                kind: 'agent_spawned',
-                name: agent.name,
-                runtime: agent.runtime,
-              } as BrokerEvent,
-            });
-            // Skip agents already managed by step execution
-            if (!this.activeAgentHandles.has(agent.name)) {
-              this.log(`[spawned] ${agent.name} (${agent.runtime})`);
-            }
-          })
-        );
-
-        this.unsubRelayListeners.push(
-          this.relay.addListener('agentReleased', (agent) => {
-            this.emit({
-              type: 'broker:event',
-              runId,
-              event: {
-                kind: 'agent_released',
-                name: agent.name,
-              } as BrokerEvent,
-            });
-          })
-        );
-
-        this.unsubRelayListeners.push(
-          this.relay.addListener('agentExited', (agent) => {
-            this.emit({
-              type: 'broker:event',
-              runId,
-              event: {
-                kind: 'agent_exited',
-                name: agent.name,
-                code: agent.exitCode,
-                signal: agent.exitSignal,
-              } as BrokerEvent,
-            });
-            this.lastActivity.delete(agent.name);
-            this.lastIdleLog.delete(agent.name);
-            if (!this.activeAgentHandles.has(agent.name)) {
-              this.log(`[exited] ${agent.name} (code: ${agent.exitCode ?? '?'})`);
-            }
-          })
-        );
-
-        this.unsubRelayListeners.push(
-          this.relay.addListener('deliveryUpdate', (event) => {
-            this.emit({ type: 'broker:event', runId, event });
-          })
-        );
-
-        this.unsubRelayListeners.push(
-          this.relay.addListener('agentIdle', ({ name, idleSecs }) => {
-            this.emit({
-              type: 'broker:event',
-              runId,
-              event: {
-                kind: 'agent_idle',
-                name,
-                idle_secs: idleSecs,
-              } as BrokerEvent,
-            });
-            // Only log at 30s multiples to avoid watchdog spam
-            const bucket = Math.floor(idleSecs / 30) * 30;
-            if (bucket >= 30 && this.lastIdleLog.get(name) !== bucket) {
-              this.lastIdleLog.set(name, bucket);
-              const shortName = name.replace(/-[a-f0-9]{6,}$/, '');
-              this.log(`[idle] ${shortName} silent for ${bucket}s`);
-            }
-          })
-        );
-
-        this.relaycast = undefined;
-        this.relaycastAgent = undefined;
-
-        // Wire broker stderr to console for observability — skip empty and
-        // JSON event lines (already surfaced via the broker:event emitter).
-        this.unsubBrokerStderr = this.relay.onBrokerStderr((line: string) => {
-          const trimmed = line.trim();
-          if (!trimmed) return;
-          // JSON event lines from the Rust EventEmitter are already parsed
-          // and emitted as broker:event — no need to double-log them.
-          if (trimmed.startsWith('{') && trimmed.endsWith('}')) return;
-          console.log(`${chalk.dim.yellow('[broker]')} ${line}`);
-        });
-
-        if (!relaycastDisabled) {
-          this.log(`Creating channel: ${channel}...`);
-          if (isResume) {
-            await this.createAndJoinRelaycastChannel(channel);
-          } else {
-            await this.createAndJoinRelaycastChannel(channel, workflow.description);
-          }
-          this.log('Channel ready');
-
-          if (isResume) {
-            this.postToChannel(`Workflow **${workflow.name}** resumed — ${pendingCount} pending steps`);
-          } else {
-            this.postToChannel(
-              `Workflow **${workflow.name}** started — ${workflow.steps.length} steps, pattern: ${config.swarm.pattern}`
-            );
-          }
-        }
-      }
-
-      const agentMap = new Map<string, AgentDefinition>();
-      for (const agent of config.agents) {
-        agentMap.set(agent.name, agent);
-      }
-
-      // Run preflight checks before any steps (skip on resume)
-      if (!isResume && workflow.preflight?.length) {
-        await this.runPreflightChecks(workflow.preflight, runId);
-      }
-
-      await this.provisionAgents(config);
-
-      this.log(`Executing ${workflow.steps.length} steps (pattern: ${config.swarm.pattern})`);
-      await this.executeSteps(workflow, stepStates, agentMap, config.errorHandling, runId);
-
-      // A run is successful iff every step completed or was skipped. Under
-      // continue-on-error we keep executing past a failure, but the run
-      // itself still "failed" — otherwise the final status contradicts the
-      // summary table ("1 passed, 3 failed" but run.status=completed) and
-      // downstream wrappers that key off run.status (e.g. the cloud
-      // orchestrator's bootstrap) silently report success.
-      const allCompleted = [...stepStates.values()].every(
-        (s) => s.row.status === 'completed' || s.row.status === 'skipped'
-      );
-
-      if (allCompleted) {
-        this.log('Workflow completed successfully');
-        await this.updateRunStatus(runId, 'completed');
-        this.emit({ type: 'run:completed', runId });
-
-        const outcomes = this.collectOutcomes(stepStates, workflow.steps);
-        const summary = this.trajectory.buildRunSummary(outcomes);
-        const confidence = this.trajectory.computeConfidence(outcomes);
-        await this.trajectory.complete(summary, confidence, {
-          learnings: this.trajectory.extractLearnings(outcomes),
-          challenges: this.trajectory.extractChallenges(outcomes),
-        });
-
-        this.postCompletionReport(workflow.name, outcomes, summary, confidence);
-        this.logRunSummary(workflow.name, outcomes, runId);
-      } else {
-        const failedStep = [...stepStates.values()].find((s) => s.row.status === 'failed');
-        const errorMsg = failedStep?.row.error ?? 'One or more steps failed';
-        await this.updateRunStatus(runId, 'failed', errorMsg);
-        this.emit({ type: 'run:failed', runId, error: errorMsg });
-
-        const outcomes = this.collectOutcomes(stepStates, workflow.steps);
-        const summary = this.trajectory.buildRunSummary(outcomes);
-        const confidence = this.trajectory.computeConfidence(outcomes);
-        const learnings = this.trajectory.extractLearnings(outcomes);
-        const challenges = this.trajectory.extractChallenges(outcomes);
-        this.postFailureReport(workflow.name, outcomes, errorMsg);
-        this.logRunSummary(workflow.name, outcomes, runId);
-        await this.trajectory.abandon(errorMsg, {
-          summary,
-          confidence,
-          learnings,
-          challenges,
-        });
-      }
-    } catch (err) {
-      const errorMsg = err instanceof Error ? err.message : String(err);
-      const status: WorkflowRunStatus =
-        !isResume && this.abortController?.signal.aborted ? 'cancelled' : 'failed';
-      await this.updateRunStatus(runId, status, errorMsg);
-
-      if (status === 'cancelled') {
-        // Mark any pending or in-progress steps as failed due to cancellation
-        for (const [stepName, state] of stepStates) {
-          if (state.row.status === 'pending' || state.row.status === 'running') {
-            state.row.status = 'failed';
-            state.row.error = 'Cancelled';
-            await this.db.updateStep(state.row.id, {
-              status: 'failed',
-              error: 'Cancelled',
-              updatedAt: new Date().toISOString(),
-            });
-            this.emit({ type: 'step:failed', runId, stepName, error: 'Cancelled' });
-            this.finalizeStepEvidence(stepName, 'failed');
-          }
-        }
-        this.emit({ type: 'run:cancelled', runId });
-        this.postToChannel(`Workflow **${workflow.name}** cancelled`);
-        await this.trajectory.abandon('Cancelled by user');
-      } else {
-        this.emit({ type: 'run:failed', runId, error: errorMsg });
-        this.postToChannel(`Workflow failed: ${errorMsg}`);
-        const outcomes = this.collectOutcomes(stepStates, workflow.steps);
-        await this.trajectory.abandon(errorMsg, {
-          summary: this.trajectory.buildRunSummary(outcomes),
-          confidence: this.trajectory.computeConfidence(outcomes),
-          learnings: this.trajectory.extractLearnings(outcomes),
-          challenges: this.trajectory.extractChallenges(outcomes),
-        });
-      }
-    } finally {
-      this.lastFailedStepOutput.clear();
-      this.lastCustomVerificationFailure.clear();
-      for (const stream of this.ptyLogStreams.values()) stream.end();
-      this.ptyLogStreams.clear();
-      this.ptyOutputBuffers.clear();
-      this.ptyListeners.clear();
-
-      this.unsubBrokerStderr?.();
-      this.unsubBrokerStderr = undefined;
-
-      // Unsubscribe relay event listeners to prevent leaks
-      for (const off of this.unsubRelayListeners) {
-        try {
-          off();
-        } catch {
-          /* ignore */
-        }
-      }
-      this.unsubRelayListeners = [];
-      this.lastIdleLog.clear();
-      this.lastActivity.clear();
-      this.supervisedRuntimeAgents.clear();
-      this.runtimeStepAgents.clear();
-      this.activeReviewers.clear();
-
-      this.log('Shutting down broker...');
-      await this.relay?.shutdown();
-      this.relay = undefined;
-      this.runStartTime = undefined;
-      this.relaycast = undefined;
-      this.relaycastAgent = undefined;
-      this.channel = undefined;
-      this.trajectory = undefined;
-      this.abortController = undefined;
-      this.currentConfig = undefined;
-      this.currentRunId = undefined;
-      this.activeAgentHandles.clear();
-      await this.stopProvisionedMounts();
-      this.agentTokens.clear(); // Prevent workflow-scoped tokens from leaking into a later run.
-    }
-
-    const finalRun = await this.db.getRun(runId);
-    return finalRun ?? run;
-  }
-
-  /**
-   * Pause execution by raising the `paused` flag.
-   * Currently-running steps will finish but no new steps start.
-   */
-  pause(): void {
-    this.paused = true;
-  }
-
-  /**
-   * Resume after a pause(): lower the `paused` flag, invoke the pending
-   * pause resolver (if one is registered) and then forget it.
-   */
-  unpause(): void {
-    this.paused = false;
-    if (this.pauseResolver) {
-      this.pauseResolver();
-    }
-    this.pauseResolver = undefined;
-  }
-
-  /**
-   * Abort the current run. Running agents are released.
-   *
-   * The pause resolver is invoked first so a run loop blocked in
-   * waitIfPaused() can wake up and exit; the abort controller is
-   * signalled afterwards.
-   */
-  abort(): void {
-    if (this.pauseResolver) {
-      this.pauseResolver();
-    }
-    this.pauseResolver = undefined;
-    this.abortController?.abort();
-  }
-
-  // ── Step execution engine ─────────────────────────────────────────────
-
-  /**
-   * Normalise the configured error strategy and hand every workflow step to
-   * the step lifecycle executor.
-   *
-   * The strategy comes from `errorHandling.strategy`, then `workflow.onError`,
-   * and finally defaults to 'fail-fast'. The aliases 'fail' and 'retry' map to
-   * 'fail-fast', 'skip' maps to 'continue'; any other value passes through.
-   */
-  private async executeSteps(
-    workflow: WorkflowDefinition,
-    stepStates: Map<string, StepState>,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling: ErrorHandlingConfig | undefined,
-    runId: string
-  ): Promise<void> {
-    const rawStrategy = errorHandling?.strategy ?? workflow.onError ?? 'fail-fast';
-    const strategy = (() => {
-      switch (rawStrategy) {
-        case 'fail':
-        case 'retry':
-          return 'fail-fast' as const;
-        case 'skip':
-          return 'continue' as const;
-        default:
-          return rawStrategy;
-      }
-    })();
-
-    const lifecycle = this.createStepLifecycleExecutor(workflow, stepStates, agentMap, errorHandling, runId);
-
-    // The normalised strategy overrides whatever the caller's config carried.
-    await lifecycle.executeAll(
-      workflow.steps,
-      agentMap,
-      {
-        ...(errorHandling ?? { strategy: 'fail-fast' }),
-        strategy,
-      },
-      stepStates
-    );
-  }
-
-  /**
-   * Select the steps that may start now: those whose own state is 'pending'
-   * and whose every dependency is already 'completed' or 'skipped'.
-   * A step (or dependency) with no entry in `stepStates` is never ready.
-   */
-  private findReadySteps(steps: WorkflowStep[], stepStates: Map<string, StepState>): WorkflowStep[] {
-    const dependencySettled = (dep: string): boolean => {
-      const status = stepStates.get(dep)?.row.status;
-      return status === 'completed' || status === 'skipped';
-    };
-
-    const isReady = (step: WorkflowStep): boolean => {
-      if (stepStates.get(step.name)?.row.status !== 'pending') return false;
-      return (step.dependsOn ?? []).every((dep) => dependencySettled(dep));
-    };
-
-    return steps.filter((step) => isReady(step));
-  }
-
-  /**
-   * Execute preflight checks before any workflow steps.
-   * All checks must pass or the workflow fails immediately.
-   *
-   * Each check's `command` runs through `sh -c` in `this.cwd` with a 30s
-   * limit and receives SIGTERM when the run's abort signal fires. A check
-   * fails when the command exits non-zero, is terminated by a signal, times
-   * out, or its stdout violates `failIf` / `successIf`. Progress and the
-   * outcome of every check are posted to the channel.
-   *
-   * @param checks Checks to run sequentially, in array order.
-   * @param runId  Identifier of the current run (not read by this method).
-   * @throws Error prefixed with "Preflight check failed: " for the first
-   *         failing check; later checks are not run.
-   */
-  private async runPreflightChecks(checks: PreflightCheck[], runId: string): Promise<void> {
-    this.postToChannel(`Running ${checks.length} preflight check(s)...`);
-
-    for (const check of checks) {
-      this.checkAborted();
-
-      // Fall back to a prefix of the command when no description is given.
-      const description = check.description ?? check.command.slice(0, 50);
-      this.postToChannel(`**[preflight]** ${description}`);
-
-      try {
-        const output = await new Promise<string>((resolve, reject) => {
-          const child = cpSpawn('sh', ['-c', check.command], {
-            stdio: 'pipe',
-            cwd: this.cwd,
-            env: filteredEnv(),
-          });
-
-          const stdoutChunks: string[] = [];
-          const stderrChunks: string[] = [];
-
-          // Wire abort signal
-          const abortSignal = this.abortController?.signal;
-          let abortHandler: (() => void) | undefined;
-          if (abortSignal && !abortSignal.aborted) {
-            abortHandler = () => {
-              child.kill('SIGTERM');
-            };
-            abortSignal.addEventListener('abort', abortHandler, { once: true });
-          }
-
-          // 30s timeout for preflight checks
-          const timer = setTimeout(() => {
-            child.kill('SIGTERM');
-            reject(new Error(`Preflight check timed out: ${description}`));
-          }, 30_000);
-
-          child.stdout?.on('data', (chunk: Buffer) => {
-            stdoutChunks.push(chunk.toString());
-          });
-
-          child.stderr?.on('data', (chunk: Buffer) => {
-            stderrChunks.push(chunk.toString());
-          });
-
-          child.on('close', (code, signal) => {
-            clearTimeout(timer);
-            if (abortHandler && abortSignal) {
-              abortSignal.removeEventListener('abort', abortHandler);
-            }
-
-            if (abortSignal?.aborted) {
-              reject(new Error('Preflight check aborted'));
-              return;
-            }
-
-            // A null exit code means the process was terminated by a signal,
-            // so the check never finished and must not count as passed. After
-            // a timeout the promise is already rejected and this is a no-op.
-            if (code === null) {
-              reject(new Error(`Preflight check failed (terminated by signal ${signal ?? 'unknown'})`));
-              return;
-            }
-
-            // Non-zero exit code is a failure
-            if (code !== 0) {
-              const stderr = stderrChunks.join('');
-              reject(
-                new Error(`Preflight check failed (exit ${code})${stderr ? `: ${stderr.slice(0, 200)}` : ''}`)
-              );
-              return;
-            }
-
-            resolve(stdoutChunks.join(''));
-          });
-
-          child.on('error', (err) => {
-            clearTimeout(timer);
-            if (abortHandler && abortSignal) {
-              abortSignal.removeEventListener('abort', abortHandler);
-            }
-            reject(new Error(`Preflight check error: ${err.message}`));
-          });
-        });
-
-        // Check failIf condition: 'non-empty' / 'empty' are keywords, anything
-        // else is compiled as a regular expression and tested against stdout.
-        if (check.failIf) {
-          const trimmedOutput = output.trim();
-          if (check.failIf === 'non-empty' && trimmedOutput.length > 0) {
-            throw new Error(`Preflight failed: output is non-empty\n${trimmedOutput.slice(0, 200)}`);
-          }
-          if (check.failIf === 'empty' && trimmedOutput.length === 0) {
-            throw new Error('Preflight failed: output is empty');
-          }
-          // Treat as regex pattern
-          if (check.failIf !== 'non-empty' && check.failIf !== 'empty') {
-            const regex = new RegExp(check.failIf);
-            if (regex.test(output)) {
-              throw new Error(`Preflight failed: output matches pattern "${check.failIf}"`);
-            }
-          }
-        }
-
-        // Check successIf condition: stdout must match the given pattern.
-        if (check.successIf) {
-          const regex = new RegExp(check.successIf);
-          if (!regex.test(output)) {
-            throw new Error(`Preflight failed: output does not match required pattern "${check.successIf}"`);
-          }
-        }
-
-        this.postToChannel(`**[preflight]** ${description} — passed`);
-      } catch (err) {
-        const errorMsg = err instanceof Error ? err.message : String(err);
-        this.postToChannel(`**[preflight]** ${description} — FAILED: ${errorMsg}`);
-        throw new Error(`Preflight check failed: ${errorMsg}`);
-      }
-    }
-
-    this.postToChannel('All preflight checks passed');
-  }
-
-  /**
-   * True when the step's `type` is 'deterministic', i.e. a shell command
-   * rather than an agent (LLM-powered) step.
-   */
-  private isDeterministicStep(step: WorkflowStep): boolean {
-    const { type } = step;
-    return type === 'deterministic';
-  }
-
-  /**
-   * True when the step's `type` is 'worktree' (git worktree setup).
-   */
-  private isWorktreeStep(step: WorkflowStep): boolean {
-    const { type } = step;
-    return type === 'worktree';
-  }
-
-  /**
-   * True when the step's `type` is 'integration' (external service).
-   */
-  private isIntegrationStep(step: WorkflowStep): boolean {
-    const { type } = step;
-    return type === 'integration';
-  }
-
-  /**
-   * Route a step to the executor matching its type. The type predicates are
-   * consulted in order — deterministic, worktree, integration — and any step
-   * matching none of them is run as an agent step.
-   */
-  private async executeStep(
-    step: WorkflowStep,
-    state: StepState,
-    stepStates: Map<string, StepState>,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling: ErrorHandlingConfig | undefined,
-    runId: string,
-    lifecycle: WorkflowStepLifecycleExecutor<StepState>
-  ): Promise<void> {
-    let execution: Promise<void>;
-
-    if (this.isDeterministicStep(step)) {
-      // Shell command
-      execution = this.executeDeterministicStep(
-        step,
-        state,
-        stepStates,
-        agentMap,
-        runId,
-        errorHandling,
-        lifecycle
-      );
-    } else if (this.isWorktreeStep(step)) {
-      // Git worktree setup
-      execution = this.executeWorktreeStep(step, state, stepStates, runId, lifecycle);
-    } else if (this.isIntegrationStep(step)) {
-      // External service interaction
-      execution = this.executeIntegrationStep(step, state, stepStates, runId, lifecycle);
-    } else {
-      // Everything else is an agent step
-      execution = this.executeAgentStep(step, stepStates, agentMap, errorHandling, runId);
-    }
-
-    return execution;
-  }
-
-  /**
-   * Execute a deterministic step (shell command).
-   * Fast, reliable, $0 LLM cost.
-   *
-   * The command template is interpolated against earlier step outputs, then
-   * run through `this.executor.executeDeterministicStep` when the executor
-   * provides it, or through a local `sh -c` child process otherwise. Attempts
-   * and retries are driven by `lifecycle.monitorStep`. The retry budget is
-   * `step.retries`, else `errorHandling.maxRetries`, else `repairRetries`
-   * when a repair agent was resolved, else 0. A repair agent is only resolved
-   * when `errorHandling.strategy === 'retry'` and `repairRetries > 0`; it is
-   * run from the `onRetry` hook with the last command, cwd, error and output.
-   *
-   * With `failOnError` (the default) a non-zero exit code or termination by
-   * a signal fails the attempt.
-   *
-   * @throws Error `Step "<name>" failed: <reason>` when monitorStep reports
-   *         the step as failed.
-   */
-  private async executeDeterministicStep(
-    step: WorkflowStep,
-    state: StepState,
-    stepStates: Map<string, StepState>,
-    agentMap: Map<string, AgentDefinition>,
-    runId: string,
-    errorHandling: ErrorHandlingConfig | undefined,
-    lifecycle: WorkflowStepLifecycleExecutor<StepState>
-  ): Promise<void> {
-    const repairRetries = errorHandling?.strategy === 'retry' ? (errorHandling.repairRetries ?? 0) : 0;
-    const repairAgent =
-      repairRetries > 0
-        ? this.resolveWorkflowRepairAgent(step, stepStates, agentMap, errorHandling)
-        : undefined;
-    const maxRetries = step.retries ?? errorHandling?.maxRetries ?? (repairAgent ? repairRetries : 0);
-    const retryDelay = errorHandling?.retryDelayMs ?? 1000;
-
-    // State of the most recent attempt, shared between the monitorStep hooks
-    // so the repair agent and the final result can report on it.
-    let lastError = 'Unknown error';
-    let lastCompletionReason: WorkflowStepCompletionReason | undefined;
-    let lastExitCode: number | undefined;
-    let lastExitSignal: string | undefined;
-    let lastResolvedCommand = step.command ?? '';
-    let lastStepCwd = this.cwd;
-    let lastCommandOutput = '';
-
-    const result = await lifecycle.monitorStep(step, state, {
-      maxRetries,
-      retryDelayMs: retryDelay,
-      startMessage: `**[${step.name}]** Started (deterministic)`,
-      onRetry: async (attempt, total) => {
-        this.emit({ type: 'step:retrying', runId, stepName: step.name, attempt });
-        this.postToChannel(`**[${step.name}]** Retrying (attempt ${attempt + 1}/${total + 1})`);
-        this.recordStepToolSideEffect(step.name, {
-          type: 'retry',
-          detail: `Retrying attempt ${attempt + 1}/${total + 1}`,
-          raw: { attempt, maxRetries: total },
-        });
-        if (repairAgent) {
-          await this.runDeterministicRepairAgent({
-            step,
-            agentDef: repairAgent,
-            attempt,
-            maxRetries: total,
-            command: lastResolvedCommand,
-            cwd: lastStepCwd,
-            error: lastError,
-            output: lastCommandOutput,
-            exitCode: lastExitCode,
-            exitSignal: lastExitSignal,
-          });
-        }
-      },
-      execute: async () => {
-        const stepOutputContext = this.buildStepOutputContext(stepStates, runId);
-        let resolvedCommand = this.interpolateStepTask(step.command ?? '', stepOutputContext);
-
-        // Second pass over remaining {{key}} placeholders: `steps.*` keys and
-        // keys that do not resolve are left in place untouched.
-        resolvedCommand = resolvedCommand.replace(/\{\{([\w][\w.\-]*)\}\}/g, (_match, key: string) => {
-          if (key.startsWith('steps.')) return _match;
-          const value = this.resolveDotPath(key, stepOutputContext);
-          return value !== undefined ? String(value) : _match;
-        });
-
-        const stepCwd = this.resolveEffectiveCwd(step);
-        lastResolvedCommand = resolvedCommand;
-        lastStepCwd = stepCwd;
-        this.beginStepEvidence(step.name, [stepCwd], state.row.startedAt);
-        this.log(
-          `[${step.name}] Running: ${resolvedCommand.slice(0, 200)}${resolvedCommand.length > 200 ? '...' : ''}`
-        );
-
-        // Delegate to the external executor when it can run shell steps.
-        if (this.executor?.executeDeterministicStep) {
-          const executorResult = await this.executor.executeDeterministicStep(step, resolvedCommand, stepCwd);
-          lastExitCode = executorResult.exitCode;
-          lastExitSignal = undefined;
-          lastCommandOutput = executorResult.output;
-          const failOnError = step.failOnError !== false;
-          if (failOnError && executorResult.exitCode !== 0) {
-            this.log(`[${step.name}] Command failed (exit code ${executorResult.exitCode})`);
-            if (executorResult.output) {
-              this.log(`[${step.name}] Output:\n${executorResult.output}`);
-            }
-            throw new Error(
-              `Command failed with exit code ${executorResult.exitCode}: ${executorResult.output.slice(0, 500)}`
-            );
-          }
-          const output =
-            step.captureOutput !== false
-              ? executorResult.output
-              : `Command completed (exit code ${executorResult.exitCode})`;
-          this.captureStepTerminalEvidence(
-            step.name,
-            { stdout: executorResult.output, combined: executorResult.output },
-            { exitCode: executorResult.exitCode }
-          );
-          const verificationResult = step.verification
-            ? this.runVerification(step.verification, output, step.name)
-            : undefined;
-          return {
-            output,
-            completionReason: verificationResult?.completionReason,
-          };
-        }
-
-        // Local execution through `sh -c`.
-        let commandStdout = '';
-        let commandStderr = '';
-        const output = await new Promise<string>((resolve, reject) => {
-          const child = cpSpawn('sh', ['-c', resolvedCommand], {
-            stdio: 'pipe',
-            cwd: stepCwd,
-            env: filteredEnv(),
-          });
-
-          const stdoutChunks: string[] = [];
-          const stderrChunks: string[] = [];
-
-          // SIGTERM first, escalating to SIGKILL after 5s. The escalation
-          // timer is cleared once the child closes so it cannot outlive the
-          // process and keep the event loop alive.
-          let killTimer: ReturnType<typeof setTimeout> | undefined;
-          const terminate = () => {
-            child.kill('SIGTERM');
-            if (!killTimer) {
-              killTimer = setTimeout(() => child.kill('SIGKILL'), 5000);
-            }
-          };
-
-          const abortSignal = this.abortController?.signal;
-          let abortHandler: (() => void) | undefined;
-          if (abortSignal && !abortSignal.aborted) {
-            abortHandler = terminate;
-            abortSignal.addEventListener('abort', abortHandler, { once: true });
-          }
-
-          let timedOut = false;
-          let timer: ReturnType<typeof setTimeout> | undefined;
-          if (step.timeoutMs) {
-            timer = setTimeout(() => {
-              timedOut = true;
-              terminate();
-            }, step.timeoutMs);
-          }
-
-          const releaseResources = () => {
-            if (timer) clearTimeout(timer);
-            if (killTimer) clearTimeout(killTimer);
-            if (abortHandler && abortSignal) {
-              abortSignal.removeEventListener('abort', abortHandler);
-            }
-          };
-
-          child.stdout?.on('data', (chunk: Buffer) => {
-            stdoutChunks.push(chunk.toString());
-          });
-
-          child.stderr?.on('data', (chunk: Buffer) => {
-            stderrChunks.push(chunk.toString());
-          });
-
-          child.on('close', (code, signal) => {
-            releaseResources();
-
-            if (abortSignal?.aborted) {
-              reject(new Error(`Step "${step.name}" aborted`));
-              return;
-            }
-
-            if (timedOut) {
-              // Only reachable when step.timeoutMs armed the timer above.
-              reject(new Error(`Step "${step.name}" timed out after ${step.timeoutMs}ms`));
-              return;
-            }
-
-            const stdout = stdoutChunks.join('');
-            const stderr = stderrChunks.join('');
-            commandStdout = stdout;
-            commandStderr = stderr;
-            lastExitCode = code ?? undefined;
-            lastExitSignal = signal ?? undefined;
-            lastCommandOutput = [stdout, stderr].filter(Boolean).join('\n');
-
-            // A null exit code means the process was terminated by a signal;
-            // that is a failure just like a non-zero exit code.
-            const failOnError = step.failOnError !== false;
-            if (failOnError && code !== 0) {
-              const how = code === null ? `signal ${signal ?? 'unknown'}` : `exit code ${code}`;
-              const reason = code === null ? `Command terminated by ${how}` : `Command failed with ${how}`;
-              this.log(`[${step.name}] Command failed (${how})`);
-              if (stdout) {
-                this.log(`[${step.name}] stdout:\n${stdout}`);
-              }
-              if (stderr) {
-                this.log(`[${step.name}] stderr:\n${stderr}`);
-              }
-              reject(new Error(`${reason}${stderr ? `: ${stderr.slice(0, 500)}` : ''}`));
-              return;
-            }
-
-            resolve(step.captureOutput !== false ? stdout : `Command completed (exit code ${code ?? 0})`);
-          });
-
-          child.on('error', (err) => {
-            releaseResources();
-            reject(new Error(`Failed to execute command: ${err.message}`));
-          });
-        });
-
-        this.captureStepTerminalEvidence(
-          step.name,
-          {
-            stdout: commandStdout || output,
-            stderr: commandStderr,
-            combined: [commandStdout || output, commandStderr].filter(Boolean).join('\n'),
-          },
-          { exitCode: lastExitCode, exitSignal: lastExitSignal }
-        );
-
-        const verificationResult = step.verification
-          ? this.runVerification(step.verification, output, step.name)
-          : undefined;
-        lastCommandOutput = [commandStdout || output, commandStderr].filter(Boolean).join('\n');
-
-        return {
-          output,
-          completionReason: verificationResult?.completionReason,
-        };
-      },
-      toCompletionResult: ({ output, completionReason }, attempt) => ({
-        status: 'completed',
-        output,
-        completionReason,
-        retries: attempt,
-        exitCode: lastExitCode,
-        exitSignal: lastExitSignal,
-      }),
-      onAttemptFailed: async (error) => {
-        lastError = error instanceof Error ? error.message : String(error);
-        lastCompletionReason = error instanceof WorkflowCompletionError ? error.completionReason : undefined;
-      },
-      getFailureResult: () => ({
-        status: 'failed',
-        output: '',
-        error: lastError,
-        retries: state.row.retryCount,
-        exitCode: lastExitCode,
-        exitSignal: lastExitSignal,
-        completionReason: lastCompletionReason,
-      }),
-    });
-
-    if (result.status === 'failed') {
-      this.postToChannel(`**[${step.name}]** Failed: ${result.error ?? 'Unknown error'}`);
-      throw new Error(`Step "${step.name}" failed: ${result.error ?? 'Unknown error'}`);
-    }
-  }
-
-  private resolveWorkflowRepairAgent(
-    step: WorkflowStep,
-    stepStates: Map<string, StepState>,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling: ErrorHandlingConfig | undefined
-  ): AgentDefinition | undefined {
-    const explicitName = errorHandling?.repairAgent?.trim();
-    if (explicitName) {
-      const explicitAgent = agentMap.get(explicitName);
-      if (explicitAgent) return WorkflowRunner.resolveAgentDef(explicitAgent);
-      this.log(`[${step.name}] repairAgent "${explicitName}" not found; falling back to workflow agents`);
-    }
-
-    if (step.agent) {
-      const stepAgent = agentMap.get(step.agent);
-      if (stepAgent) return WorkflowRunner.resolveAgentDef(stepAgent);
-    }
-
-    for (const dependency of [...(step.dependsOn ?? [])].reverse()) {
-      const dependencyAgent = stepStates.get(dependency)?.row.agentName;
-      if (!dependencyAgent) continue;
-      const agent = agentMap.get(dependencyAgent);
-      if (agent) return WorkflowRunner.resolveAgentDef(agent);
-    }
-
-    const candidates = [...agentMap.values()].map((agent) => WorkflowRunner.resolveAgentDef(agent));
-    candidates.sort((a, b) => this.scoreRepairAgent(b) - this.scoreRepairAgent(a));
-    return candidates[0];
-  }
-
-  private scoreRepairAgent(agent: AgentDefinition): number {
-    const text = `${agent.name} ${agent.role ?? ''} ${agent.preset ?? ''}`.toLowerCase();
-    let score = 0;
-    if (
-      /\b(repair|fix|implement|implementation|engineer|developer|coder|worker|owner|lead|coordinator)\b/.test(
-        text
-      )
-    ) {
-      score += 10;
-    }
-    if (agent.interactive === false || ['worker', 'analyst'].includes(agent.preset ?? '')) {
-      score += 2;
-    }
-    if (/\b(review|reviewer|audit|security|analyst)\b/.test(text)) {
-      score -= 4;
-    }
-    if (agent.permissions?.access === 'readonly') {
-      score -= 20;
-    }
-    return score;
-  }
-
-  private async runDeterministicRepairAgent(context: DeterministicRepairContext): Promise<void> {
-    const repairAgent: AgentDefinition = {
-      ...context.agentDef,
-      interactive: false,
-    };
-    const repairPrompt = this.buildDeterministicRepairPrompt(context);
-    const repairStep: WorkflowStep = {
-      name: `${context.step.name}-repair-${context.attempt}`,
-      type: 'agent',
-      agent: repairAgent.name,
-      task: repairPrompt,
-      cwd: context.cwd,
-      workdir: undefined,
-      retries: 0,
-    };
-    const timeoutMs =
-      repairAgent.constraints?.timeoutMs ?? context.step.timeoutMs ?? this.currentConfig?.swarm?.timeoutMs;
-
-    this.log(
-      `[${context.step.name}] Deterministic gate failed; asking "${repairAgent.name}" to repair before retry ${context.attempt + 1}/${context.maxRetries + 1}`
-    );
-    this.postToChannel(
-      `**[${context.step.name}]** Deterministic gate failed; assigning repair to \`${repairAgent.name}\``
-    );
-    this.recordStepToolSideEffect(context.step.name, {
-      type: 'custom',
-      detail: `Assigned deterministic gate repair to ${repairAgent.name}`,
-      raw: {
-        repairAgent: repairAgent.name,
-        attempt: context.attempt,
-        maxRetries: context.maxRetries,
-        exitCode: context.exitCode,
-        exitSignal: context.exitSignal,
-      },
-    });
-
-    try {
-      this.ensureBudgetAllowsSpawn(context.step.name, repairAgent.name);
-      let repairOutput: string;
-      if (this.executor) {
-        repairOutput = await this.executor.executeAgentStep(repairStep, repairAgent, repairPrompt, timeoutMs);
-      } else if (repairAgent.cli === 'api') {
-        repairOutput = await executeApiStep(
-          repairAgent.constraints?.model ?? 'claude-sonnet-4-20250514',
-          repairPrompt,
-          {
-            envSecrets: this.envSecrets,
-            skills: repairAgent.skills,
-            defaultMaxTokens: repairAgent.constraints?.maxTokens,
-          }
-        );
-      } else {
-        const result = await this.execNonInteractive(repairAgent, repairStep, timeoutMs);
-        repairOutput = result.output;
-      }
-
-      this.recordStepToolSideEffect(context.step.name, {
-        type: 'custom',
-        detail: `Repair agent ${repairAgent.name} completed before deterministic retry`,
-        raw: { repairAgent: repairAgent.name, output: repairOutput.slice(0, 1000) },
-      });
-    } catch (error) {
-      if (error instanceof BudgetExceededError || this.abortController?.signal.aborted) {
-        throw error;
-      }
-      const message = error instanceof Error ? error.message : String(error);
-      this.log(`[${context.step.name}] Repair agent "${repairAgent.name}" failed: ${message}`);
-      this.postToChannel(
-        `**[${context.step.name}]** Repair agent \`${repairAgent.name}\` failed; retrying gate anyway`
-      );
-      this.recordStepToolSideEffect(context.step.name, {
-        type: 'custom',
-        detail: `Repair agent ${repairAgent.name} failed before deterministic retry: ${message}`,
-        raw: { repairAgent: repairAgent.name, error: message },
-      });
-    }
-  }
-
-  private buildDeterministicRepairPrompt(context: DeterministicRepairContext): string {
-    const output = context.output.trim();
-    const clippedOutput = output.length > 4000 ? output.slice(-4000) : output;
-    return (
-      `A deterministic workflow gate failed after an agent/team step. Fix the repository or workflow state so the same gate passes on the next retry.\n\n` +
-      `Step: ${context.step.name}\n` +
-      `Working directory: ${context.cwd}\n` +
-      `Command:\n${context.command}\n\n` +
-      `Failure:\n${context.error}\n` +
-      `Exit code: ${context.exitCode ?? 'unknown'}\n` +
-      `Exit signal: ${context.exitSignal ?? 'none'}\n\n` +
-      `Command output:\n${clippedOutput || '(no output captured)'}\n\n` +
-      `Repair only what is needed for this gate to pass. Preserve unrelated user changes. ` +
-      `After making the fix, report the files changed and the reason the gate should pass.`
-    );
-  }
-
-  private async runAgentStepRepairAgent(context: AgentStepRepairContext): Promise<void> {
-    const repairAgent: AgentDefinition = {
-      ...context.agentDef,
-      interactive: false,
-    };
-    const repairPrompt = this.buildAgentStepRepairPrompt(context);
-    const repairStep: WorkflowStep = {
-      name: `${context.step.name}-repair-${context.attempt}`,
-      type: 'agent',
-      agent: repairAgent.name,
-      task: repairPrompt,
-      cwd: context.cwd,
-      workdir: undefined,
-      retries: 0,
-    };
-    const timeoutMs =
-      repairAgent.constraints?.timeoutMs ?? context.step.timeoutMs ?? this.currentConfig?.swarm?.timeoutMs;
-
-    this.log(
-      `[${context.step.name}] Agent step failed; asking "${repairAgent.name}" to repair before retry ${context.attempt + 1}/${context.maxRetries + 1}`
-    );
-    this.postToChannel(
-      `**[${context.step.name}]** Agent step failed; assigning repair to \`${repairAgent.name}\``
-    );
-    this.recordStepToolSideEffect(context.step.name, {
-      type: 'custom',
-      detail: `Assigned agent-step repair to ${repairAgent.name}`,
-      raw: {
-        repairAgent: repairAgent.name,
-        attempt: context.attempt,
-        maxRetries: context.maxRetries,
-        completionReason: context.completionReason,
-        exitCode: context.exitCode,
-        exitSignal: context.exitSignal,
-      },
-    });
-
-    try {
-      this.ensureBudgetAllowsSpawn(context.step.name, repairAgent.name);
-      let repairOutput: string;
-      if (this.executor) {
-        repairOutput = await this.executor.executeAgentStep(repairStep, repairAgent, repairPrompt, timeoutMs);
-      } else if (repairAgent.cli === 'api') {
-        repairOutput = await executeApiStep(
-          repairAgent.constraints?.model ?? 'claude-sonnet-4-20250514',
-          repairPrompt,
-          {
-            envSecrets: this.envSecrets,
-            skills: repairAgent.skills,
-            defaultMaxTokens: repairAgent.constraints?.maxTokens,
-          }
-        );
-      } else {
-        const result = await this.execNonInteractive(repairAgent, repairStep, timeoutMs);
-        repairOutput = result.output;
-      }
-
-      this.recordStepToolSideEffect(context.step.name, {
-        type: 'custom',
-        detail: `Repair agent ${repairAgent.name} completed before agent retry`,
-        raw: { repairAgent: repairAgent.name, output: repairOutput.slice(0, 1000) },
-      });
-    } catch (error) {
-      if (error instanceof BudgetExceededError || this.abortController?.signal.aborted) {
-        throw error;
-      }
-      const message = error instanceof Error ? error.message : String(error);
-      this.log(`[${context.step.name}] Repair agent "${repairAgent.name}" failed: ${message}`);
-      this.postToChannel(
-        `**[${context.step.name}]** Repair agent \`${repairAgent.name}\` failed; retrying agent step anyway`
-      );
-      this.recordStepToolSideEffect(context.step.name, {
-        type: 'custom',
-        detail: `Repair agent ${repairAgent.name} failed before agent retry: ${message}`,
-        raw: { repairAgent: repairAgent.name, error: message },
-      });
-    }
-  }
-
-  private buildAgentStepRepairPrompt(context: AgentStepRepairContext): string {
-    const output = context.output.trim();
-    const clippedOutput = output.length > 4000 ? output.slice(-4000) : output;
-    const task = (context.step.task ?? '').trim();
-    const clippedTask = task.length > 3000 ? task.slice(0, 3000) : task;
-    return (
-      `A workflow agent step failed or produced an invalid artifact. Repair the repository, workflow state, or step instructions so the step can succeed on the next retry.\n\n` +
-      `Step: ${context.step.name}\n` +
-      `Working directory: ${context.cwd}\n` +
-      `Completion reason: ${context.completionReason ?? 'unknown'}\n` +
-      `Failure:\n${context.error}\n` +
-      `Exit code: ${context.exitCode ?? 'unknown'}\n` +
-      `Exit signal: ${context.exitSignal ?? 'none'}\n\n` +
-      `Step task:\n${clippedTask || '(no task captured)'}\n\n` +
-      `Previous output:\n${clippedOutput || '(no output captured)'}\n\n` +
-      `Repair only what is needed for this step to produce the required artifact or evidence. ` +
-      `Preserve unrelated user changes. After making the fix, report the files changed and why the retry should pass.`
-    );
-  }
-
-  /**
-   * Execute a worktree step (git worktree setup).
-   * Fast, reliable, $0 LLM cost.
-   * Outputs the worktree path for downstream steps to use.
-   */
-  private async executeWorktreeStep(
-    step: WorkflowStep,
-    state: StepState,
-    stepStates: Map<string, StepState>,
-    runId: string,
-    lifecycle: WorkflowStepLifecycleExecutor<StepState>
-  ): Promise<void> {
-    let lastExitCode: number | undefined;
-    let lastExitSignal: string | undefined;
-    let worktreeBranch = '';
-    let createdBranch = false;
-
-    const result = await lifecycle.monitorStep(step, state, {
-      startMessage: `**[${step.name}]** Started (worktree setup)`,
-      execute: async () => {
-        const stepOutputContext = this.buildStepOutputContext(stepStates, runId);
-        const branch = this.interpolateStepTask(step.branch ?? '', stepOutputContext);
-        const baseBranch = step.baseBranch
-          ? this.interpolateStepTask(step.baseBranch, stepOutputContext)
-          : 'HEAD';
-        const worktreePath = step.path
-          ? this.interpolateStepTask(step.path, stepOutputContext)
-          : path.join('.worktrees', step.name);
-        const createBranch = step.createBranch !== false;
-        const stepCwd = this.resolveStepWorkdir(step) ?? this.cwd;
-
-        this.beginStepEvidence(step.name, [stepCwd], state.row.startedAt);
-
-        if (!branch) {
-          throw new Error('Worktree step missing required "branch" field');
-        }
-
-        const absoluteWorktreePath = path.resolve(stepCwd, worktreePath);
-        let branchExists = false;
-
-        await new Promise<void>((resolve) => {
-          const checkChild = cpSpawn('git', ['rev-parse', '--verify', '--quiet', branch], {
-            stdio: 'pipe',
-            cwd: stepCwd,
-            env: filteredEnv(),
-          });
-          checkChild.on('close', (code) => {
-            branchExists = code === 0;
-            resolve();
-          });
-          checkChild.on('error', () => resolve());
-        });
-
-        let worktreeArgs: string[];
-        if (branchExists) {
-          worktreeArgs = ['worktree', 'add', absoluteWorktreePath, branch];
-        } else if (createBranch) {
-          worktreeArgs = ['worktree', 'add', '-b', branch, absoluteWorktreePath, baseBranch];
-        } else {
-          throw new Error(`Branch "${branch}" does not exist and createBranch is false`);
-        }
-
-        let commandStdout = '';
-        let commandStderr = '';
-        const output = await new Promise<string>((resolve, reject) => {
-          const child = cpSpawn('git', worktreeArgs, {
-            stdio: 'pipe',
-            cwd: stepCwd,
-            env: filteredEnv(),
-          });
-
-          const stdoutChunks: string[] = [];
-          const stderrChunks: string[] = [];
-          const abortSignal = this.abortController?.signal;
-          let abortHandler: (() => void) | undefined;
-          if (abortSignal && !abortSignal.aborted) {
-            abortHandler = () => {
-              child.kill('SIGTERM');
-              setTimeout(() => child.kill('SIGKILL'), 5000);
-            };
-            abortSignal.addEventListener('abort', abortHandler, { once: true });
-          }
-
-          let timedOut = false;
-          let timer: ReturnType<typeof setTimeout> | undefined;
-          if (step.timeoutMs) {
-            timer = setTimeout(() => {
-              timedOut = true;
-              child.kill('SIGTERM');
-              setTimeout(() => child.kill('SIGKILL'), 5000);
-            }, step.timeoutMs);
-          }
-
-          child.stdout?.on('data', (chunk: Buffer) => {
-            stdoutChunks.push(chunk.toString());
-          });
-
-          child.stderr?.on('data', (chunk: Buffer) => {
-            stderrChunks.push(chunk.toString());
-          });
-
-          child.on('close', (code, signal) => {
-            if (timer) clearTimeout(timer);
-            if (abortHandler && abortSignal) {
-              abortSignal.removeEventListener('abort', abortHandler);
-            }
-
-            if (abortSignal?.aborted) {
-              reject(new Error(`Step "${step.name}" aborted`));
-              return;
-            }
-
-            if (timedOut) {
-              reject(
-                new Error(`Step "${step.name}" timed out (no step timeout set, check global swarm.timeoutMs)`)
-              );
-              return;
-            }
-
-            commandStdout = stdoutChunks.join('');
-            commandStderr = stderrChunks.join('');
-            lastExitCode = code ?? undefined;
-            lastExitSignal = signal ?? undefined;
-
-            if (code !== 0 && code !== null) {
-              reject(
-                new Error(
-                  `git worktree add failed with exit code ${code}${commandStderr ? `: ${commandStderr.slice(0, 500)}` : ''}`
-                )
-              );
-              return;
-            }
-
-            resolve(absoluteWorktreePath);
-          });
-
-          child.on('error', (err) => {
-            if (timer) clearTimeout(timer);
-            if (abortHandler && abortSignal) {
-              abortSignal.removeEventListener('abort', abortHandler);
-            }
-            reject(new Error(`Failed to execute git worktree command: ${err.message}`));
-          });
-        });
-
-        this.captureStepTerminalEvidence(
-          step.name,
-          {
-            stdout: commandStdout || output,
-            stderr: commandStderr,
-            combined: [commandStdout || output, commandStderr].filter(Boolean).join('\n'),
-          },
-          { exitCode: lastExitCode, exitSignal: lastExitSignal }
-        );
-
-        worktreeBranch = branch;
-        createdBranch = !branchExists && createBranch;
-        return { output };
-      },
-      toCompletionResult: ({ output }, attempt) => ({
-        status: 'completed',
-        output,
-        retries: attempt,
-        exitCode: lastExitCode,
-        exitSignal: lastExitSignal,
-      }),
-      getFailureResult: (error) => ({
-        status: 'failed',
-        output: '',
-        error: error instanceof Error ? error.message : String(error),
-        retries: state.row.retryCount,
-        exitCode: lastExitCode,
-        exitSignal: lastExitSignal,
-      }),
-    });
-
-    if (result.status === 'failed') {
-      this.postToChannel(`**[${step.name}]** Failed: ${result.error ?? 'Unknown error'}`);
-      throw new Error(`Step "${step.name}" failed: ${result.error ?? 'Unknown error'}`);
-    }
-
-    this.postToChannel(
-      `**[${step.name}]** Worktree created at: ${result.output}\n  Branch: ${worktreeBranch}${createdBranch ? ' (created)' : ''}`
-    );
-    this.recordStepToolSideEffect(step.name, {
-      type: 'worktree_created',
-      detail: `Worktree created at ${result.output}`,
-      raw: { branch: worktreeBranch, createdBranch },
-    });
-  }
-
-  /**
-   * Execute an integration step (external service interaction via executor).
-   */
-  private async executeIntegrationStep(
-    step: WorkflowStep,
-    state: StepState,
-    stepStates: Map<string, StepState>,
-    runId: string,
-    lifecycle: WorkflowStepLifecycleExecutor<StepState>
-  ): Promise<void> {
-    const result = await lifecycle.monitorStep(step, state, {
-      startMessage: `**[${step.name}]** Started (integration: ${step.integration}.${step.action})`,
-      execute: async () => {
-        const stepOutputContext = this.buildStepOutputContext(stepStates, runId);
-        const resolvedParams: Record<string, string> = {};
-        for (const [key, value] of Object.entries(step.params ?? {})) {
-          resolvedParams[key] = this.interpolateStepTask(value, stepOutputContext);
-        }
-
-        if (!this.executor?.executeIntegrationStep) {
-          throw new Error(
-            `Integration steps require a cloud executor. Step "${step.name}" cannot run locally. ` +
-              `Use "cloud run" to execute workflows with integration steps.`
-          );
-        }
-
-        const integrationResult = await this.executor.executeIntegrationStep(step, resolvedParams, {
-          workspaceId: this.workspaceId,
-        });
-
-        if (!integrationResult.success) {
-          throw new Error(`Integration step "${step.name}" failed: ${integrationResult.output}`);
-        }
-
-        return { output: integrationResult.output };
-      },
-      toCompletionResult: ({ output }, attempt) => ({
-        status: 'completed',
-        output,
-        retries: attempt,
-      }),
-      getFailureResult: (error) => ({
-        status: 'failed',
-        output: '',
-        error: error instanceof Error ? error.message : String(error),
-        retries: state.row.retryCount,
-      }),
-    });
-
-    if (result.status === 'failed') {
-      this.postToChannel(`**[${step.name}]** Failed: ${result.error ?? 'Unknown error'}`);
-      throw new Error(`Step "${step.name}" failed: ${result.error ?? 'Unknown error'}`);
-    }
-
-    this.postToChannel(`**[${step.name}]** Completed (integration: ${step.integration}.${step.action})`);
-  }
-
-  /**
-   * Execute an agent step (LLM-powered).
-   */
-  private async executeAgentStep(
-    step: WorkflowStep,
-    stepStates: Map<string, StepState>,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling: ErrorHandlingConfig | undefined,
-    runId: string
-  ): Promise<void> {
-    const state = stepStates.get(step.name);
-    if (!state) throw new Error(`Step state not found: ${step.name}`);
-
-    const agentName = step.agent;
-    if (!agentName) {
-      throw new Error(`Step "${step.name}" is missing required "agent" field`);
-    }
-    const rawAgentDef = agentMap.get(agentName);
-    if (!rawAgentDef) {
-      throw new Error(`Agent "${agentName}" not found in config`);
-    }
-    const specialistDef = WorkflowRunner.resolveAgentDef(rawAgentDef);
-
-    const usesOwnerFlow = specialistDef.cli !== 'api' && specialistDef.interactive !== false;
-    const currentPattern = this.currentConfig?.swarm?.pattern ?? '';
-    const isHubPattern = WorkflowRunner.HUB_PATTERNS.has(currentPattern);
-    const usesAutoHardening =
-      usesOwnerFlow && isHubPattern && !this.isExplicitInteractiveWorker(specialistDef);
-    const ownerDef = usesAutoHardening ? this.resolveAutoStepOwner(specialistDef, agentMap) : specialistDef;
-    // Reviewer resolution is deferred to just before the review gate runs (see below)
-    // so that activeReviewers is up-to-date for concurrent steps.
-    let reviewDef: ReturnType<typeof this.resolveAutoReviewAgent> | undefined;
-    const supervised: SupervisedStep = {
-      specialist: specialistDef,
-      owner: ownerDef,
-      reviewer: reviewDef,
-    };
-    const usesDedicatedOwner = usesOwnerFlow && ownerDef.name !== specialistDef.name;
-
-    const maxRetries =
-      step.retries ??
-      ownerDef.constraints?.retries ??
-      specialistDef.constraints?.retries ??
-      errorHandling?.maxRetries ??
-      0;
-    const retryDelay = errorHandling?.retryDelayMs ?? 1000;
-    const timeoutMs =
-      step.timeoutMs ??
-      ownerDef.constraints?.timeoutMs ??
-      specialistDef.constraints?.timeoutMs ??
-      this.currentConfig?.swarm?.timeoutMs;
-    const repairRetries = errorHandling?.strategy === 'retry' ? (errorHandling.repairRetries ?? 0) : 0;
-    const repairAgent =
-      repairRetries > 0
-        ? this.resolveWorkflowRepairAgent(step, stepStates, agentMap, errorHandling)
-        : undefined;
-
-    let lastError: string | undefined;
-    let lastExitCode: number | undefined;
-    let lastExitSignal: string | undefined;
-    let lastCompletionReason: WorkflowStepCompletionReason | undefined;
-    let lastAttemptStartedAt: number | undefined;
-    let lastEffectiveAgentDef: AgentDefinition | undefined;
-    let lastEffectiveCwd: string | undefined;
-    let lastAttemptReportCaptured = false;
-    let lastDiagnosticResult: DiagnosticResult | null = null;
-
-    // OWNER_DECISION: INCOMPLETE_RETRY is enforced here at the attempt-loop level so every
-    // interactive execution path shares the same contract:
-    // - retries remaining => throw back into the loop and retry
-    // - maxRetries = 0 => fail immediately after the first retry request
-    // - retry budget exhausted => fail with retry_requested_by_owner, never "completed"
-    for (let attempt = 0; attempt <= maxRetries; attempt++) {
-      this.checkAborted();
-
-      // Reset per-attempt exit info so stale values don't leak across retries
-      lastExitCode = undefined;
-      lastExitSignal = undefined;
-      lastAttemptStartedAt = undefined;
-      lastEffectiveAgentDef = undefined;
-      lastEffectiveCwd = undefined;
-      lastAttemptReportCaptured = false;
-      let stepOutputForDiagnostic = '';
-
-      if (attempt > 0) {
-        this.emit({ type: 'step:retrying', runId, stepName: step.name, attempt });
-        this.postToChannel(`**[${step.name}]** Retrying (attempt ${attempt + 1}/${maxRetries + 1})`);
-        this.recordStepToolSideEffect(step.name, {
-          type: 'retry',
-          detail: `Retrying attempt ${attempt + 1}/${maxRetries + 1}`,
-          raw: { attempt, maxRetries },
-        });
-        state.row.retryCount = attempt;
-        await this.db.updateStep(state.row.id, {
-          retryCount: attempt,
-          updatedAt: new Date().toISOString(),
-        });
-        await this.trajectory?.stepRetrying(step, attempt, maxRetries);
-        if (repairAgent && attempt <= repairRetries) {
-          await this.runAgentStepRepairAgent({
-            step,
-            agentDef: repairAgent,
-            attempt,
-            maxRetries,
-            cwd: lastEffectiveCwd ?? this.resolveEffectiveCwd(step, specialistDef),
-            error: lastError ?? 'Unknown error',
-            output: this.lastFailedStepOutput.get(step.name) ?? '',
-            exitCode: lastExitCode,
-            exitSignal: lastExitSignal,
-            completionReason: lastCompletionReason,
-          });
-        }
-        await this.delay(retryDelay);
-      }
-
-      try {
-        this.ensureBudgetAllowsSpawn(step.name, agentName);
-        lastAttemptStartedAt = Date.now();
-        // Mark step as running
-        state.row.status = 'running';
-        state.row.error = undefined;
-        state.row.completionReason = undefined;
-        state.row.startedAt = new Date().toISOString();
-        await this.db.updateStep(state.row.id, {
-          status: 'running',
-          error: undefined,
-          completionReason: undefined,
-          startedAt: state.row.startedAt,
-          updatedAt: new Date().toISOString(),
-        });
-        this.emit({ type: 'step:started', runId, stepName: step.name });
-        this.log(`[${step.name}] Started (owner: ${ownerDef.name}, specialist: ${specialistDef.name})`);
-        this.initializeStepSignalParticipants(step.name, ownerDef.name, specialistDef.name);
-        await this.trajectory?.stepStarted(step, ownerDef.name, {
-          role: usesDedicatedOwner ? 'owner' : 'specialist',
-          owner: ownerDef.name,
-          specialist: specialistDef.name,
-          reviewer: reviewDef?.name,
-        });
-        if (usesDedicatedOwner) {
-          await this.trajectory?.stepSupervisionAssigned(step, supervised);
-        }
-        this.emit({
-          type: 'step:owner-assigned',
-          runId,
-          stepName: step.name,
-          ownerName: ownerDef.name,
-          specialistName: specialistDef.name,
-        });
-
-        // Resolve step-output variables (e.g. {{steps.plan.output}}) at execution time
-        const stepOutputContext = this.buildStepOutputContext(stepStates, runId);
-        let resolvedTask = this.interpolateStepTask(step.task ?? '', stepOutputContext);
-
-        // On retry attempts, prepend failure context so the agent knows what went wrong
-        if (attempt > 0 && lastError) {
-          if (lastDiagnosticResult) {
-            resolvedTask =
-              `[RETRY — Attempt ${attempt + 1}/${maxRetries + 1}] Verification failed.\n` +
-              `Diagnostic analysis:\n${lastDiagnosticResult.analysis}\n\n` +
-              `Original error: ${lastError}\n---\n${resolvedTask}`;
-          } else {
-            const priorOutput = (this.lastFailedStepOutput.get(step.name) ?? '').slice(-2000);
-            const customVerificationFailure = this.lastCustomVerificationFailure.get(step.name);
-            const verificationFailurePrompt = customVerificationFailure
-              ? `[VERIFICATION FAILED] Your code did not pass the verification check.\n` +
-                `Command: ${customVerificationFailure.command}\n` +
-                `Output:\n` +
-                `${customVerificationFailure.output}\n\n` +
-                `Fix the issues above before proceeding.\n`
-              : '';
-            resolvedTask =
-              `[RETRY — Attempt ${attempt + 1}/${maxRetries + 1}]\n` +
-              `Previous attempt failed: ${lastError}\n` +
-              verificationFailurePrompt +
-              (priorOutput ? `Previous output (last 2000 chars):\n${priorOutput}\n` : '') +
-              `---\n${resolvedTask}`;
-          }
-        }
-
-        // If this is an interactive agent, append awareness of non-interactive workers
-        // so the lead knows not to message them and to use step output chaining instead
-        if (specialistDef.interactive !== false || ownerDef.interactive !== false) {
-          const nonInteractiveInfo = this.buildNonInteractiveAwareness(agentMap, stepStates);
-          if (nonInteractiveInfo) {
-            resolvedTask += nonInteractiveInfo;
-          }
-        }
-
-        // Apply step-level workdir override to agent definitions if present
-        const applyStepCwd = (def: AgentDefinition): AgentDefinition => {
-          if (step.cwd) {
-            return { ...def, cwd: step.cwd, workdir: undefined };
-          }
-          if (step.workdir) {
-            const stepWorkdir = this.resolveStepWorkdir(step);
-            if (stepWorkdir) {
-              return { ...def, cwd: stepWorkdir, workdir: undefined };
-            }
-          }
-          return def;
-        };
-        const effectiveSpecialist = applyStepCwd(specialistDef);
-        const effectiveOwner = applyStepCwd(ownerDef);
-        const effectiveReviewer = reviewDef ? applyStepCwd(reviewDef) : undefined;
-        lastEffectiveAgentDef = effectiveSpecialist;
-        lastEffectiveCwd = this.resolveAgentCwd(effectiveSpecialist);
-        this.beginStepEvidence(
-          step.name,
-          [
-            this.resolveAgentCwd(effectiveSpecialist),
-            this.resolveAgentCwd(effectiveOwner),
-            effectiveReviewer ? this.resolveAgentCwd(effectiveReviewer) : undefined,
-          ],
-          state.row.startedAt
-        );
-
-        let specialistOutput: string;
-        let ownerOutput: string;
-        let ownerElapsed: number;
-        let completionReason: WorkflowStepCompletionReason | undefined;
-        let promptTaskText: string | undefined;
-
-        if (usesDedicatedOwner) {
-          const result = await this.executeSupervisedAgentStep(
-            step,
-            { specialist: effectiveSpecialist, owner: effectiveOwner, reviewer: reviewDef },
-            resolvedTask,
-            timeoutMs,
-            attempt
-          );
-          specialistOutput = result.specialistOutput;
-          stepOutputForDiagnostic = result.specialistOutput;
-          ownerOutput = result.ownerOutput;
-          ownerElapsed = result.ownerElapsed;
-          completionReason = result.completionReason;
-        } else {
-          const ownerTask = this.injectStepOwnerContract(
-            step,
-            resolvedTask,
-            effectiveOwner,
-            effectiveSpecialist
-          );
-          const explicitInteractiveWorker = this.isExplicitInteractiveWorker(effectiveOwner);
-          let explicitWorkerHandle: Agent | undefined;
-          let explicitWorkerCompleted = false;
-          let explicitWorkerOutput = '';
-
-          this.log(
-            `[${step.name}] Spawning owner "${effectiveOwner.name}" (cli: ${effectiveOwner.cli})${step.workdir ? ` [workdir: ${step.workdir}]` : ''}`
-          );
-          const resolvedStep = { ...step, task: ownerTask };
-          const ownerStartTime = Date.now();
-          // When processBackend is set without an explicit executor, the runner
-          // constructor synthesizes a RunnerStepExecutor that calls
-          // processBackend.createEnvironment(step.name).exec(command). Explicit
-          // executors still take precedence. See process-backend-executor.ts.
-          const spawnResult = this.executor
-            ? await this.executor.executeAgentStep(resolvedStep, effectiveOwner, ownerTask, timeoutMs)
-            : effectiveOwner.cli === 'api'
-              ? {
-                  output: await executeApiStep(
-                    effectiveOwner.constraints?.model ?? 'claude-sonnet-4-20250514',
-                    ownerTask,
-                    {
-                      envSecrets: this.envSecrets,
-                      skills: effectiveOwner.skills,
-                      defaultMaxTokens: effectiveOwner.constraints?.maxTokens,
-                    }
-                  ),
-                  exitCode: 0,
-                  promptTaskText: ownerTask,
-                }
-              : await this.spawnAndWait(effectiveOwner, resolvedStep, timeoutMs, {
-                  retryAttempt: attempt,
-                  evidenceStepName: step.name,
-                  evidenceRole: usesOwnerFlow ? 'owner' : 'specialist',
-                  preserveOnIdle: !isHubPattern || !this.isLeadLikeAgent(effectiveOwner) ? false : undefined,
-                  logicalName: effectiveOwner.name,
-                  onSpawned: explicitInteractiveWorker
-                    ? ({ agent }) => {
-                        explicitWorkerHandle = agent;
-                      }
-                    : undefined,
-                  onChunk: explicitInteractiveWorker
-                    ? ({ chunk }) => {
-                        explicitWorkerOutput += WorkflowRunner.stripAnsi(chunk);
-                        if (
-                          !explicitWorkerCompleted &&
-                          this.hasExplicitInteractiveWorkerCompletionEvidence(
-                            step,
-                            explicitWorkerOutput,
-                            ownerTask,
-                            resolvedTask
-                          )
-                        ) {
-                          explicitWorkerCompleted = true;
-                          void explicitWorkerHandle?.release().catch(() => undefined);
-                        }
-                      }
-                    : undefined,
-                });
-          const output = typeof spawnResult === 'string' ? spawnResult : spawnResult.output;
-          promptTaskText =
-            typeof spawnResult === 'string'
-              ? effectiveOwner.interactive === false
-                ? undefined
-                : ownerTask
-              : (spawnResult.promptTaskText ?? ownerTask);
-          lastExitCode = typeof spawnResult === 'string' ? undefined : spawnResult.exitCode;
-          lastExitSignal = typeof spawnResult === 'string' ? undefined : spawnResult.exitSignal;
-          ownerElapsed = Date.now() - ownerStartTime;
-          this.log(`[${step.name}] Owner "${effectiveOwner.name}" exited`);
-          if (usesOwnerFlow) {
-            try {
-              const completionDecision = this.resolveOwnerCompletionDecision(
-                step,
-                output,
-                output,
-                promptTaskText ?? ownerTask,
-                promptTaskText ?? ownerTask
-              );
-              completionReason = completionDecision.completionReason;
-            } catch (error) {
-              const canUseVerificationFallback =
-                !usesDedicatedOwner &&
-                step.verification &&
-                error instanceof WorkflowCompletionError &&
-                error.completionReason === 'failed_no_evidence';
-              if (!canUseVerificationFallback) {
-                throw error;
-              }
-            }
-          }
-          specialistOutput = output;
-          stepOutputForDiagnostic = output;
-          ownerOutput = output;
-        }
-
-        // Even non-interactive steps can emit an explicit OWNER_DECISION contract.
-        // Honor retry/fail/clarification signals before verification-driven success so
-        // real runs stay consistent with interactive owner flows.
-        if (!usesOwnerFlow) {
-          const explicitOwnerDecision = this.parseOwnerDecision(step, ownerOutput, false);
-          if (explicitOwnerDecision?.decision === 'INCOMPLETE_RETRY') {
-            throw new WorkflowCompletionError(
-              `Step "${step.name}" owner requested retry${explicitOwnerDecision.reason ? `: ${explicitOwnerDecision.reason}` : ''}`,
-              'retry_requested_by_owner'
-            );
-          }
-          if (explicitOwnerDecision?.decision === 'INCOMPLETE_FAIL') {
-            throw new WorkflowCompletionError(
-              `Step "${step.name}" owner marked the step incomplete${explicitOwnerDecision.reason ? `: ${explicitOwnerDecision.reason}` : ''}`,
-              'failed_owner_decision'
-            );
-          }
-          if (explicitOwnerDecision?.decision === 'NEEDS_CLARIFICATION') {
-            throw new WorkflowCompletionError(
-              `Step "${step.name}" owner requested clarification before completion${explicitOwnerDecision.reason ? `: ${explicitOwnerDecision.reason}` : ''}`,
-              'retry_requested_by_owner'
-            );
-          }
-        }
-
-        // Run verification if configured.
-        // Self-owned interactive steps still need verification fallback so
-        // explicit OWNER_DECISION output is not mandatory for the happy path.
-        if (step.verification && (!usesOwnerFlow || !usesDedicatedOwner) && !completionReason) {
-          const verificationResult = this.runVerification(
-            step.verification,
-            specialistOutput,
-            step.name,
-            promptTaskText
-          );
-          completionReason = verificationResult.completionReason;
-        }
-
-        // Retry-style owner decisions are control-flow signals, not terminal success states.
-        // Guard here so they cannot accidentally fall through into review or completed-step
-        // persistence if a future branch returns a completionReason instead of throwing.
-        if (completionReason === 'retry_requested_by_owner') {
-          throw new WorkflowCompletionError(
-            `Step "${step.name}" owner requested another attempt`,
-            'retry_requested_by_owner'
-          );
-        }
-
-        // Every interactive step gets a review pass; pick a dedicated reviewer when available.
-        // Resolve reviewer JIT so activeReviewers reflects concurrent steps that started earlier.
-        if (usesAutoHardening && usesDedicatedOwner && !reviewDef) {
-          reviewDef = this.resolveAutoReviewAgent(ownerDef, agentMap);
-          supervised.reviewer = reviewDef;
-        }
-        let combinedOutput = specialistOutput;
-        if (usesOwnerFlow && reviewDef) {
-          this.activeReviewers.set(reviewDef.name, (this.activeReviewers.get(reviewDef.name) ?? 0) + 1);
-          try {
-            const remainingMs = timeoutMs ? Math.max(0, timeoutMs - ownerElapsed) : undefined;
-            const reviewOutput = await this.runStepReviewGate(
-              step,
-              resolvedTask,
-              specialistOutput,
-              ownerOutput,
-              ownerDef,
-              reviewDef,
-              remainingMs
-            );
-            combinedOutput = this.combineStepAndReviewOutput(specialistOutput, reviewOutput);
-          } finally {
-            const count = (this.activeReviewers.get(reviewDef.name) ?? 1) - 1;
-            if (count <= 0) this.activeReviewers.delete(reviewDef.name);
-            else this.activeReviewers.set(reviewDef.name, count);
-          }
-        }
-
-        await this.captureAgentReport(
-          runId,
-          step.name,
-          lastEffectiveAgentDef,
-          lastEffectiveCwd,
-          lastAttemptStartedAt,
-          Date.now()
-        );
-        lastAttemptReportCaptured = true;
-
-        // Mark completed
-        state.row.status = 'completed';
-        state.row.output = combinedOutput;
-        state.row.completionReason = completionReason;
-        state.row.completedAt = new Date().toISOString();
-        await this.db.updateStep(state.row.id, {
-          status: 'completed',
-          output: combinedOutput,
-          completionReason,
-          completedAt: state.row.completedAt,
-          updatedAt: new Date().toISOString(),
-        });
-
-        // Persist step output to disk so it survives restarts and is inspectable
-        await this.persistStepOutput(runId, step.name, combinedOutput);
-
-        this.emit({
-          type: 'step:completed',
-          runId,
-          stepName: step.name,
-          output: combinedOutput,
-          exitCode: lastExitCode,
-          exitSignal: lastExitSignal,
-        });
-        this.finalizeStepEvidence(step.name, 'completed', state.row.completedAt, completionReason);
-        await this.trajectory?.stepCompleted(step, combinedOutput, attempt + 1);
-        return;
-      } catch (err) {
-        lastError = err instanceof Error ? err.message : String(err);
-        lastCompletionReason = err instanceof WorkflowCompletionError ? err.completionReason : undefined;
-        if (stepOutputForDiagnostic) {
-          this.lastFailedStepOutput.set(step.name, stepOutputForDiagnostic);
-        }
-        const diagnosticVerification = step.verification as DiagnosticVerificationCheck | undefined;
-        if (
-          err instanceof WorkflowCompletionError &&
-          err.completionReason === 'failed_verification' &&
-          diagnosticVerification?.diagnosticAgent &&
-          attempt < maxRetries
-        ) {
-          lastDiagnosticResult = await this.runDiagnosticAgent(
-            step,
-            lastError,
-            stepOutputForDiagnostic || (this.lastFailedStepOutput.get(step.name) ?? ''),
-            agentMap,
-            runId
-          );
-        } else {
-          lastDiagnosticResult = null;
-        }
-        if (lastCompletionReason !== 'failed_verification') {
-          this.lastCustomVerificationFailure.delete(step.name);
-        }
-        if (!(err instanceof BudgetExceededError) && !lastAttemptReportCaptured) {
-          await this.captureAgentReport(
-            runId,
-            step.name,
-            lastEffectiveAgentDef,
-            lastEffectiveCwd,
-            lastAttemptStartedAt,
-            Date.now()
-          );
-          lastAttemptReportCaptured = true;
-        }
-        if (err instanceof BudgetExceededError) {
-          break;
-        }
-        if (lastCompletionReason === 'retry_requested_by_owner' && attempt >= maxRetries) {
-          lastError = this.buildOwnerRetryBudgetExceededMessage(step.name, maxRetries, lastError);
-        }
-        if (err instanceof SpawnExitError) {
-          lastExitCode = err.exitCode;
-          lastExitSignal = err.exitSignal;
-        }
-        const ownerTimedOut = usesDedicatedOwner
-          ? /\bowner timed out\b/i.test(lastError)
-          : /\btimed out\b/i.test(lastError) && !lastError.includes(`${step.name}-review`);
-        if (ownerTimedOut) {
-          this.emit({ type: 'step:owner-timeout', runId, stepName: step.name, ownerName: ownerDef.name });
-        }
-      }
-    }
-
-    // All retries exhausted — record root-cause diagnosis and mark failed
-    const nonInteractive =
-      ownerDef.interactive === false || ['worker', 'reviewer', 'analyst'].includes(ownerDef.preset ?? '');
-    const verificationValue =
-      typeof step.verification === 'object' && 'value' in step.verification
-        ? String(step.verification.value)
-        : undefined;
-    if (!lastAttemptReportCaptured) {
-      await this.captureAgentReport(
-        runId,
-        step.name,
-        lastEffectiveAgentDef,
-        lastEffectiveCwd,
-        lastAttemptStartedAt,
-        Date.now()
-      );
-    }
-    await this.trajectory?.stepFailed(step, lastError ?? 'Unknown error', maxRetries + 1, maxRetries, {
-      agent: agentName,
-      nonInteractive,
-      verificationValue,
-    });
-    this.postToChannel(`**[${step.name}]** Failed: ${lastError ?? 'Unknown error'}`);
-    await this.markStepFailed(
-      state,
-      lastError ?? 'Unknown error',
-      runId,
-      {
-        exitCode: lastExitCode,
-        exitSignal: lastExitSignal,
-      },
-      lastCompletionReason
-    );
-    throw new Error(
-      `Step "${step.name}" failed after ${maxRetries} retries: ${lastError ?? 'Unknown error'}`
-    );
-  }
-
-  private async runDiagnosticAgent(
-    step: WorkflowStep,
-    verificationError: string,
-    stepOutput: string,
-    agentMap: Map<string, AgentDefinition>,
-    runId: string
-  ): Promise<DiagnosticResult | null> {
-    const verification = step.verification as DiagnosticVerificationCheck | undefined;
-    const diagnosticAgentName = verification?.diagnosticAgent;
-    if (!verification || !diagnosticAgentName) {
-      return null;
-    }
-
-    const rawDiagnosticDef = agentMap.get(diagnosticAgentName);
-    if (!rawDiagnosticDef) {
-      this.log(
-        `[${step.name}] Diagnostic agent "${diagnosticAgentName}" not found — falling back to standard retry`
-      );
-      return null;
-    }
-
-    const diagnosticAgentDef: AgentDefinition = {
-      ...WorkflowRunner.resolveAgentDef(rawDiagnosticDef),
-      interactive: false,
-    };
-    const verificationCommand =
-      verification.type === 'custom' ? verification.value : `${verification.type}: ${verification.value}`;
-    const diagnosticTimeout = verification.diagnosticTimeout ?? 60_000;
-    const diagnosticPrompt =
-      `The following verification failed after step "${step.name}".\n\n` +
-      `Verification command: ${verificationCommand}\n` +
-      `Verification output:\n${verificationError}\n\n` +
-      `Step task was:\n${step.task ?? ''}\n\n` +
-      `Step output (last 2000 chars):\n${stepOutput.slice(-2000)}\n\n` +
-      `Analyze what went wrong. Be specific. Do NOT fix the code.`;
-    const diagnosticStep: WorkflowStep = {
-      ...step,
-      name: `${step.name}-diagnostic-${runId.slice(0, 8)}`,
-      agent: diagnosticAgentName,
-      task: diagnosticPrompt,
-      verification: undefined,
-      retries: 0,
-    };
-    const diagnosticCwd = this.resolveExecutionCwd(diagnosticStep, diagnosticAgentDef);
-    const startedAt = Date.now();
-
-    try {
-      this.ensureBudgetAllowsSpawn(step.name, diagnosticAgentName);
-      this.log(`[${step.name}] Verification failed — running diagnostic agent '${diagnosticAgentName}'...`);
-      const diagnosticResult = await this.execNonInteractive(
-        diagnosticAgentDef,
-        diagnosticStep,
-        diagnosticTimeout
-      );
-      const elapsedMs = Date.now() - startedAt;
-      await this.captureAgentReport(
-        runId,
-        step.name,
-        diagnosticAgentDef,
-        diagnosticCwd,
-        startedAt,
-        Date.now()
-      );
-      const analysis = diagnosticResult.output.trim();
-      const tokenCount = Math.max(1, Math.ceil(analysis.length / 4));
-      const firstLine =
-        analysis
-          .split(/\r?\n/)
-          .map((line) => line.trim())
-          .find(Boolean) ?? '(no analysis returned)';
-
-      this.log(`[${step.name}] Diagnostic complete (${elapsedMs}ms, ${tokenCount} tokens): ${firstLine}`);
-
-      return {
-        analysis,
-        metadata: {
-          agentName: diagnosticAgentName,
-          elapsedMs,
-          tokenCount,
-        },
-      };
-    } catch (error) {
-      await this.captureAgentReport(
-        runId,
-        step.name,
-        diagnosticAgentDef,
-        diagnosticCwd,
-        startedAt,
-        Date.now()
-      );
-      const message = error instanceof Error ? error.message : String(error);
-      if (/\btimed out\b/i.test(message)) {
-        this.log(`[${step.name}] Diagnostic timed out — falling back to standard retry`);
-      } else {
-        this.log(`[${step.name}] Diagnostic failed — falling back to standard retry: ${message}`);
-      }
-      return null;
-    }
-  }
-
-  private buildOwnerRetryBudgetExceededMessage(
-    stepName: string,
-    maxRetries: number,
-    ownerDecisionError?: string
-  ): string {
-    const attempts = maxRetries + 1;
-    const prefix = `Step "${stepName}" `;
-    const normalizedDecision = ownerDecisionError?.startsWith(prefix)
-      ? ownerDecisionError.slice(prefix.length).trim()
-      : ownerDecisionError?.trim();
-    const decisionSuffix = normalizedDecision ? ` Latest owner decision: ${normalizedDecision}` : '';
-
-    if (maxRetries === 0) {
-      return (
-        `Step "${stepName}" owner requested another attempt, but no retries are configured ` +
-        `(maxRetries=0). Configure retries > 0 to allow OWNER_DECISION: INCOMPLETE_RETRY.` +
-        decisionSuffix
-      );
-    }
-
-    return (
-      `Step "${stepName}" owner requested another attempt after ${attempts} total attempts, ` +
-      `but the retry budget is exhausted (maxRetries=${maxRetries}).` +
-      decisionSuffix
-    );
-  }
-
-  private injectStepOwnerContract(
-    step: WorkflowStep,
-    resolvedTask: string,
-    ownerDef: AgentDefinition,
-    specialistDef: AgentDefinition
-  ): string {
-    if (ownerDef.interactive === false) return resolvedTask;
-    const specialistNote =
-      ownerDef.name === specialistDef.name
-        ? ''
-        : `Specialist intended for this step: "${specialistDef.name}" (${specialistDef.role ?? specialistDef.cli}).`;
-    return (
-      resolvedTask +
-      '\n\n---\n' +
-      `STEP OWNER CONTRACT:\n` +
-      `- You are the accountable owner for step "${step.name}".\n` +
-      (specialistNote ? `- ${specialistNote}\n` : '') +
-      `- If you delegate, you must still verify completion yourself.\n` +
-      `- Preferred final decision format:\n` +
-      `  OWNER_DECISION: <one of COMPLETE, INCOMPLETE_RETRY, INCOMPLETE_FAIL, NEEDS_CLARIFICATION>\n` +
-      `  REASON: <one sentence>\n` +
-      `- Legacy completion marker still supported: STEP_COMPLETE:${step.name}\n` +
-      `- Then self-terminate immediately with /exit.`
-    );
-  }
-
-  private buildOwnerSupervisorTask(
-    step: WorkflowStep,
-    originalTask: string,
-    supervised: SupervisedStep,
-    workerRuntimeName: string
-  ): string {
-    const verificationGuide = this.buildSupervisorVerificationGuide(step.verification);
-    const channelLine = this.channel ? `#${this.channel}` : '(workflow channel unavailable)';
-    const channelContract = this.channel
-      ? `- Prefer Relaycast/group-chat handoff signals over terminal sentinels: wait for the worker to post \`WORKER_DONE: <brief summary>\` in ${channelLine}\n` +
-        `- When you have validated the handoff, post \`LEAD_DONE: <brief summary>\` to ${channelLine} before you exit\n`
-      : '';
-    return (
-      `You are the step owner/supervisor for step "${step.name}".\n\n` +
-      `Worker: ${supervised.specialist.name} (runtime: ${workerRuntimeName}) on ${channelLine}\n` +
-      `Task: ${originalTask}\n\n` +
-      `Your job: Monitor the worker and determine when the task is complete.\n\n` +
-      `How to verify completion:\n` +
-      `- Watch ${channelLine} for the worker's progress messages and mirrored PTY output\n` +
-      `- Check file changes: run \`git diff --stat\` or inspect expected files directly\n` +
-      `- Ask the worker directly on ${channelLine} if you need a status update\n` +
-      channelContract +
-      verificationGuide +
-      `\nWhen you have enough evidence, return:\n` +
-      `OWNER_DECISION: <one of COMPLETE, INCOMPLETE_RETRY, INCOMPLETE_FAIL, NEEDS_CLARIFICATION>\n` +
-      `REASON: <one sentence>\n` +
-      `Legacy completion marker still supported: STEP_COMPLETE:${step.name}`
-    );
-  }
-
-  private buildWorkerHandoffTask(
-    step: WorkflowStep,
-    originalTask: string,
-    supervised: SupervisedStep
-  ): string {
-    if (!this.channel) return originalTask;
-
-    return (
-      `${originalTask}\n\n---\n` +
-      `WORKER COMPLETION CONTRACT:\n` +
-      `- You are handing work off to owner "${supervised.owner.name}" for step "${step.name}".\n` +
-      `- When your work is ready for review, post to #${this.channel}: \`WORKER_DONE: <brief summary>\`\n` +
-      `- Do not rely on terminal output alone for handoff; use the workflow group chat signal above.\n` +
-      `- After posting your handoff signal, self-terminate with /exit unless the owner asks for follow-up.`
-    );
-  }
-
-  private buildWorkflowRuntimeAgentBaseName(stepName: string, options: SpawnAndWaitOptions): string {
-    return `${stepName}${options.agentNameSuffix ? `-${options.agentNameSuffix}` : ''}-${(this.currentRunId ?? this.generateShortId()).slice(0, 8)}`;
-  }
-
-  private async releaseStaleRetryAgents(baseRequestedName: string, stepName: string): Promise<void> {
-    if (!this.relay) {
-      return;
-    }
-
-    const staleAgents = (await this.relay.listAgents()).filter(
-      (agent) => agent.name === baseRequestedName || agent.name.startsWith(`${baseRequestedName}-r`)
-    );
-    if (staleAgents.length === 0) {
-      return;
-    }
-
-    const staleNames = [...new Set(staleAgents.map((agent) => agent.name))].sort();
-    this.log(`[${stepName}] Releasing stale retry agent(s): ${staleNames.join(', ')}`);
-
-    for (const agent of staleAgents) {
-      await agent.release(`workflow retry cleanup for step "${stepName}"`);
-    }
-
-    const deadline = Date.now() + 5_000;
-    while (Date.now() < deadline) {
-      const remaining = (await this.relay.listAgentsRaw())
-        .map((agent) => agent.name)
-        .filter((name) => staleNames.includes(name));
-      if (remaining.length === 0) {
-        return;
-      }
-      await this.delay(100);
-    }
-
-    throw new Error(`Failed to clear stale retry agent(s) before respawn: ${staleNames.join(', ')}`);
-  }
-
-  private buildSupervisorVerificationGuide(verification?: VerificationCheck): string {
-    if (!verification) return '';
-    switch (verification.type) {
-      case 'output_contains':
-        return `- Verification gate: confirm the worker output contains ${JSON.stringify(verification.value)}\n`;
-      case 'file_exists':
-        return `- Verification gate: confirm the file exists at ${JSON.stringify(verification.value)}\n`;
-      case 'exit_code':
-        return `- Verification gate: confirm the worker exits with code ${JSON.stringify(verification.value)}\n`;
-      case 'custom':
-        return `- Verification gate: apply the custom verification rule ${JSON.stringify(verification.value)}\n`;
-      default:
-        return '';
-    }
-  }
-
-  private async executeSupervisedAgentStep(
-    step: WorkflowStep,
-    supervised: SupervisedStep,
-    resolvedTask: string,
-    timeoutMs?: number,
-    retryAttempt = 0
-  ): Promise<{
-    specialistOutput: string;
-    ownerOutput: string;
-    ownerElapsed: number;
-    completionReason: WorkflowStepCompletionReason;
-  }> {
-    if (this.executor) {
-      const specialistTask = this.buildWorkerHandoffTask(step, resolvedTask, supervised);
-      const supervisorTask = this.buildOwnerSupervisorTask(
-        step,
-        resolvedTask,
-        supervised,
-        supervised.specialist.name
-      );
-      const specialistStep = { ...step, task: specialistTask };
-      const ownerStep: WorkflowStep = {
-        ...step,
-        name: `${step.name}-owner`,
-        agent: supervised.owner.name,
-        task: supervisorTask,
-      };
-
-      this.log(
-        `[${step.name}] Spawning specialist "${supervised.specialist.name}" and owner "${supervised.owner.name}"`
-      );
-      const specialistPromise = this.executor.executeAgentStep(
-        specialistStep,
-        supervised.specialist,
-        specialistTask,
-        timeoutMs
-      );
-      // Guard against unhandled rejection if owner fails before specialist settles
-      const specialistSettled = specialistPromise.catch(() => undefined);
-
-      try {
-        const ownerStartTime = Date.now();
-        const ownerOutput = await this.executor.executeAgentStep(
-          ownerStep,
-          supervised.owner,
-          supervisorTask,
-          timeoutMs
-        );
-        const ownerElapsed = Date.now() - ownerStartTime;
-        const specialistOutput = await specialistPromise;
-        const completionDecision = this.resolveOwnerCompletionDecision(
-          step,
-          ownerOutput,
-          specialistOutput,
-          supervisorTask,
-          resolvedTask
-        );
-        return {
-          specialistOutput,
-          ownerOutput,
-          ownerElapsed,
-          completionReason: completionDecision.completionReason,
-        };
-      } catch (error) {
-        await specialistSettled;
-        throw error;
-      }
-    }
-
-    let workerHandle: Agent | undefined;
-    let workerRuntimeName = supervised.specialist.name;
-    let workerSpawned = false;
-    let workerReleased = false;
-    let resolveWorkerSpawn!: () => void;
-    let rejectWorkerSpawn!: (error: unknown) => void;
-    const workerReady = new Promise<void>((resolve, reject) => {
-      resolveWorkerSpawn = resolve;
-      rejectWorkerSpawn = reject;
-    });
-
-    const specialistTask = this.buildWorkerHandoffTask(step, resolvedTask, supervised);
-    const specialistStep = { ...step, task: specialistTask };
-    this.log(
-      `[${step.name}] Spawning specialist "${supervised.specialist.name}" (cli: ${supervised.specialist.cli})`
-    );
-    const workerPromise = this.spawnAndWait(supervised.specialist, specialistStep, timeoutMs, {
-      agentNameSuffix: 'worker',
-      retryAttempt,
-      evidenceStepName: step.name,
-      evidenceRole: 'worker',
-      logicalName: supervised.specialist.name,
-      onSpawned: ({ actualName, agent }) => {
-        workerHandle = agent;
-        workerRuntimeName = actualName;
-        this.supervisedRuntimeAgents.set(actualName, {
-          stepName: step.name,
-          role: 'specialist',
-          logicalName: supervised.specialist.name,
-        });
-        if (!workerSpawned) {
-          workerSpawned = true;
-          resolveWorkerSpawn();
-        }
-      },
-      onChunk: ({ agentName, chunk }) => {
-        this.forwardAgentChunkToChannel(step.name, 'Worker', agentName, chunk, supervised.specialist.name);
-      },
-    }).catch((error) => {
-      if (!workerSpawned) {
-        workerSpawned = true;
-        rejectWorkerSpawn(error);
-      }
-      throw error;
-    });
-
-    const workerSettled = workerPromise.catch(() => undefined);
-    workerPromise
-      .then((result) => {
-        workerReleased = true;
-        this.log(`[${step.name}] Worker ${workerRuntimeName} exited`);
-        this.recordStepToolSideEffect(step.name, {
-          type: 'worker_exit',
-          detail: `Worker ${workerRuntimeName} exited`,
-          raw: { worker: workerRuntimeName, exitCode: result.exitCode, exitSignal: result.exitSignal },
-        });
-        if (
-          step.verification?.type === 'output_contains' &&
-          this.outputContainsVerificationToken(result.output, step.verification.value, result.promptTaskText)
-        ) {
-          this.log(
-            `[${step.name}] Verification gate observed: output contains ${JSON.stringify(step.verification.value)}`
-          );
-        }
-      })
-      .catch((error) => {
-        const message = error instanceof Error ? error.message : String(error);
-        this.postToChannel(
-          `**[${step.name}]** Worker \`${workerRuntimeName}\` exited with error: ${message}`
-        );
-        this.recordStepToolSideEffect(step.name, {
-          type: 'worker_error',
-          detail: `Worker ${workerRuntimeName} exited with error: ${message}`,
-          raw: { worker: workerRuntimeName, error: message },
-        });
-      });
-
-    await workerReady;
-
-    const supervisorTask = this.buildOwnerSupervisorTask(step, resolvedTask, supervised, workerRuntimeName);
-    const ownerStep: WorkflowStep = {
-      ...step,
-      name: `${step.name}-owner`,
-      agent: supervised.owner.name,
-      task: supervisorTask,
-    };
-
-    this.log(`[${step.name}] Spawning owner "${supervised.owner.name}" (cli: ${supervised.owner.cli})`);
-    const ownerStartTime = Date.now();
-
-    try {
-      const ownerResultObj =
-        supervised.owner.cli === 'api'
-          ? {
-              output: await executeApiStep(
-                supervised.owner.constraints?.model ?? 'claude-sonnet-4-20250514',
-                supervisorTask,
-                {
-                  envSecrets: this.envSecrets,
-                  skills: supervised.owner.skills,
-                  defaultMaxTokens: supervised.owner.constraints?.maxTokens,
-                }
-              ),
-              exitCode: 0,
-              promptTaskText: supervisorTask,
-            }
-          : await this.spawnAndWait(supervised.owner, ownerStep, timeoutMs, {
-              agentNameSuffix: 'owner',
-              retryAttempt,
-              evidenceStepName: step.name,
-              evidenceRole: 'owner',
-              logicalName: supervised.owner.name,
-              onSpawned: ({ actualName }) => {
-                this.supervisedRuntimeAgents.set(actualName, {
-                  stepName: step.name,
-                  role: 'owner',
-                  logicalName: supervised.owner.name,
-                });
-              },
-              onChunk: ({ chunk }) => {
-                void this.recordOwnerMonitoringChunk(step, supervised.owner, chunk);
-              },
-            });
-      const ownerElapsed = Date.now() - ownerStartTime;
-      const ownerOutput = ownerResultObj.output;
-      this.log(`[${step.name}] Owner "${supervised.owner.name}" exited`);
-      const workerResultObj = await workerPromise;
-      const specialistOutput = workerResultObj.output;
-      const completionDecision = this.resolveOwnerCompletionDecision(
-        step,
-        ownerOutput,
-        specialistOutput,
-        ownerResultObj.promptTaskText ?? supervisorTask,
-        workerResultObj.promptTaskText ?? specialistTask
-      );
-      return {
-        specialistOutput,
-        ownerOutput,
-        ownerElapsed,
-        completionReason: completionDecision.completionReason,
-      };
-    } catch (error) {
-      const message = error instanceof Error ? error.message : String(error);
-      if (!workerReleased && workerHandle) {
-        await workerHandle.release().catch(() => undefined);
-      }
-      await workerSettled;
-      if (/\btimed out\b/i.test(message)) {
-        throw new Error(`Step "${step.name}" owner timed out after ${timeoutMs ?? 'unknown'}ms`);
-      }
-      throw error;
-    }
-  }
-
-  private forwardAgentChunkToChannel(
-    stepName: string,
-    roleLabel: string,
-    agentName: string,
-    chunk: string,
-    sender?: string
-  ): void {
-    const lines = WorkflowRunner.scrubForChannel(chunk)
-      .split('\n')
-      .map((line) => line.trim())
-      .filter(Boolean)
-      .slice(0, 3);
-    for (const line of lines) {
-      this.postToChannel(`**[${stepName}]** ${roleLabel} \`${agentName}\`: ${line.slice(0, 280)}`, {
-        stepName,
-        sender,
-        actor: agentName,
-        role: roleLabel,
-        origin: 'forwarded_chunk',
-      });
-    }
-  }
-
-  private async recordOwnerMonitoringChunk(
-    step: WorkflowStep,
-    ownerDef: AgentDefinition,
-    chunk: string
-  ): Promise<void> {
-    const stripped = WorkflowRunner.stripAnsi(chunk);
-    const details: string[] = [];
-    if (/git diff --stat/i.test(stripped)) details.push('Checked git diff stats');
-    if (/\bls -la\b/i.test(stripped)) details.push('Listed files for verification');
-    if (/status update\?/i.test(stripped)) details.push('Asked the worker for a status update');
-    if (/STEP_COMPLETE:/i.test(stripped)) details.push('Declared the step complete');
-
-    for (const detail of details) {
-      this.recordStepToolSideEffect(step.name, {
-        type: 'owner_monitoring',
-        detail,
-        raw: { output: stripped.slice(0, 240), owner: ownerDef.name },
-      });
-      await this.trajectory?.ownerMonitoringEvent(step.name, ownerDef.name, detail, {
-        output: stripped.slice(0, 240),
-      });
-    }
-  }
-
-  private resolveAutoStepOwner(
-    specialistDef: AgentDefinition,
-    agentMap: Map<string, AgentDefinition>
-  ): AgentDefinition {
-    if (specialistDef.interactive === false) return specialistDef;
-
-    const allDefs = [...agentMap.values()].map((d) => WorkflowRunner.resolveAgentDef(d));
-    const candidates = allDefs.filter((d) => d.interactive !== false);
-    const matchesHubRole = (text: string): boolean =>
-      [...WorkflowRunner.HUB_ROLES].some((r) => new RegExp(`\\b${r}\\b`, 'i').test(text));
-    const ownerish = (def: AgentDefinition): boolean => {
-      const nameLC = def.name.toLowerCase();
-      const roleLC = def.role?.toLowerCase() ?? '';
-      return matchesHubRole(nameLC) || matchesHubRole(roleLC);
-    };
-    const ownerPriority = (def: AgentDefinition): number => {
-      const roleLC = def.role?.toLowerCase() ?? '';
-      const nameLC = def.name.toLowerCase();
-      if (/\blead\b/.test(roleLC) || /\blead\b/.test(nameLC)) return 6;
-      if (/\bcoordinator\b/.test(roleLC) || /\bcoordinator\b/.test(nameLC)) return 5;
-      if (/\bsupervisor\b/.test(roleLC) || /\bsupervisor\b/.test(nameLC)) return 4;
-      if (/\borchestrator\b/.test(roleLC) || /\borchestrator\b/.test(nameLC)) return 3;
-      if (/\bhub\b/.test(roleLC) || /\bhub\b/.test(nameLC)) return 2;
-      return ownerish(def) ? 1 : 0;
-    };
-    const dedicatedOwner = candidates
-      .filter((d) => d.name !== specialistDef.name && ownerish(d))
-      .sort((a, b) => ownerPriority(b) - ownerPriority(a) || a.name.localeCompare(b.name))[0];
-    if (dedicatedOwner) return dedicatedOwner;
-    return specialistDef;
-  }
-
-  private resolveAutoReviewAgent(
-    ownerDef: AgentDefinition,
-    agentMap: Map<string, AgentDefinition>
-  ): AgentDefinition {
-    const allDefs = [...agentMap.values()].map((d) => WorkflowRunner.resolveAgentDef(d));
-    const eligible = (def: AgentDefinition): boolean =>
-      def.name !== ownerDef.name && !this.isExplicitInteractiveWorker(def);
-    const isReviewer = (def: AgentDefinition): boolean => {
-      const roleLC = def.role?.toLowerCase() ?? '';
-      const nameLC = def.name.toLowerCase();
-      return (
-        def.preset === 'reviewer' ||
-        roleLC.includes('review') ||
-        roleLC.includes('critic') ||
-        roleLC.includes('verifier') ||
-        roleLC.includes('qa') ||
-        nameLC.includes('review')
-      );
-    };
-    const reviewerPriority = (def: AgentDefinition): number => {
-      if (def.preset === 'reviewer') return 5;
-      const roleLC = def.role?.toLowerCase() ?? '';
-      const nameLC = def.name.toLowerCase();
-      if (roleLC.includes('review') || nameLC.includes('review')) return 4;
-      if (roleLC.includes('verifier') || roleLC.includes('qa')) return 3;
-      if (roleLC.includes('critic')) return 2;
-      return isReviewer(def) ? 1 : 0;
-    };
-    // Prefer agents not currently assigned as reviewers to avoid double-booking
-    const notBusy = (def: AgentDefinition): boolean => !this.activeReviewers.has(def.name);
-
-    const dedicatedCandidates = allDefs
-      .filter((d) => eligible(d) && isReviewer(d))
-      .sort((a, b) => reviewerPriority(b) - reviewerPriority(a) || a.name.localeCompare(b.name));
-    const dedicated = dedicatedCandidates.find(notBusy) ?? dedicatedCandidates[0];
-    if (dedicated) return dedicated;
-
-    const alternateCandidates = allDefs.filter((d) => eligible(d) && d.interactive !== false);
-    const alternate = alternateCandidates.find(notBusy) ?? alternateCandidates[0];
-    if (alternate) return alternate;
-
-    // Self-review fallback — log a warning since owner reviewing itself is weak.
-    return ownerDef;
-  }
-
-  private isExplicitInteractiveWorker(agentDef: AgentDefinition): boolean {
-    return agentDef.preset === 'worker' && agentDef.interactive !== false;
-  }
-
-  private resolveOwnerCompletionDecision(
-    step: WorkflowStep,
-    ownerOutput: string,
-    specialistOutput: string,
-    injectedTaskText: string,
-    verificationTaskText?: string
-  ): CompletionDecisionResult {
-    const hasMarker = this.hasOwnerCompletionMarker(step, ownerOutput, injectedTaskText);
-    const explicitOwnerDecision = this.parseOwnerDecision(step, ownerOutput, false);
-
-    // INCOMPLETE_RETRY / NEEDS_CLARIFICATION are non-terminal owner outcomes. They never mark
-    // the step complete here; instead they throw back to executeAgentStep(), which decides
-    // whether to retry or fail based on the remaining retry budget for this step.
-    if (explicitOwnerDecision?.decision === 'INCOMPLETE_RETRY') {
-      throw new WorkflowCompletionError(
-        `Step "${step.name}" owner requested retry${explicitOwnerDecision.reason ? `: ${explicitOwnerDecision.reason}` : ''}`,
-        'retry_requested_by_owner'
-      );
-    }
-    if (explicitOwnerDecision?.decision === 'INCOMPLETE_FAIL') {
-      throw new WorkflowCompletionError(
-        `Step "${step.name}" owner marked the step incomplete${explicitOwnerDecision.reason ? `: ${explicitOwnerDecision.reason}` : ''}`,
-        'failed_owner_decision'
-      );
-    }
-    if (explicitOwnerDecision?.decision === 'NEEDS_CLARIFICATION') {
-      throw new WorkflowCompletionError(
-        `Step "${step.name}" owner requested clarification before completion${explicitOwnerDecision.reason ? `: ${explicitOwnerDecision.reason}` : ''}`,
-        'retry_requested_by_owner'
-      );
-    }
-
-    const verificationResult = step.verification
-      ? this.runVerification(step.verification, specialistOutput, step.name, verificationTaskText, {
-          allowFailure: true,
-          completionMarkerFound: hasMarker,
-        })
-      : { passed: false };
-
-    if (verificationResult.error) {
-      throw new WorkflowCompletionError(
-        `Step "${step.name}" verification failed and no owner decision or evidence established completion: ${verificationResult.error}`,
-        'failed_verification'
-      );
-    }
-
-    if (explicitOwnerDecision?.decision === 'COMPLETE') {
-      if (!hasMarker) {
-        this.log(
-          `[${step.name}] Structured OWNER_DECISION completed the step without legacy STEP_COMPLETE marker`
-        );
-      }
-      return {
-        completionReason: 'completed_by_owner_decision',
-        ownerDecision: explicitOwnerDecision.decision,
-        reason: explicitOwnerDecision.reason,
-      };
-    }
-    if (verificationResult.passed) {
-      return { completionReason: 'completed_verified' };
-    }
-
-    const ownerDecision = this.parseOwnerDecision(step, ownerOutput, hasMarker);
-    if (ownerDecision?.decision === 'COMPLETE') {
-      return {
-        completionReason: 'completed_by_owner_decision',
-        ownerDecision: ownerDecision.decision,
-        reason: ownerDecision.reason,
-      };
-    }
-
-    if (!explicitOwnerDecision) {
-      const evidenceReason = this.judgeOwnerCompletionByEvidence(step.name, ownerOutput);
-      if (evidenceReason) {
-        if (!hasMarker) {
-          this.log(`[${step.name}] Evidence-based completion resolved without legacy STEP_COMPLETE marker`);
-        }
-        return {
-          completionReason: 'completed_by_evidence',
-          reason: evidenceReason,
-        };
-      }
-    }
-
-    // Process-exit fallback: if the agent exited cleanly (code 0) and verification
-    // passes (or no verification is configured), infer completion rather than failing.
-    // This reduces dependence on agents posting exact coordination signals.
-    const processExitFallback = this.tryProcessExitFallback(
-      step,
-      specialistOutput,
-      verificationTaskText,
-      ownerOutput
-    );
-    if (processExitFallback) {
-      this.log(
-        `[${step.name}] Completion inferred from clean process exit (code 0)` +
-          (step.verification ? ' + verification passed' : '') +
-          ' — no coordination signal was required'
-      );
-      return processExitFallback;
-    }
-
-    throw new WorkflowCompletionError(
-      `Step "${step.name}" owner completion decision missing: no OWNER_DECISION, legacy STEP_COMPLETE marker, or evidence-backed completion signal`,
-      'failed_no_evidence'
-    );
-  }
-
-  private hasExplicitInteractiveWorkerCompletionEvidence(
-    step: WorkflowStep,
-    output: string,
-    injectedTaskText: string,
-    verificationTaskText: string
-  ): boolean {
-    try {
-      this.resolveOwnerCompletionDecision(step, output, output, injectedTaskText, verificationTaskText);
-      return true;
-    } catch {
-      return false;
-    }
-  }
-
-  private hasOwnerCompletionMarker(step: WorkflowStep, output: string, injectedTaskText: string): boolean {
-    const marker = `STEP_COMPLETE:${step.name}`;
-    const strippedOutput = stripInjectedTaskEcho(output, injectedTaskText);
-    if (strippedOutput.includes(marker)) {
-      return true;
-    }
-    const taskHasMarker = injectedTaskText.includes(marker);
-    const first = output.indexOf(marker);
-    if (first === -1) {
-      return false;
-    }
-    // PTY output often includes echoed prompt text, so when the injected task
-    // itself contains the legacy marker require a second occurrence from the
-    // agent response.
-    const outputLikelyContainsInjectedPrompt =
-      output.includes('STEP OWNER CONTRACT') ||
-      output.includes('Preferred final decision format') ||
-      output.includes('Legacy completion marker still supported') ||
-      output.includes('Output exactly: STEP_COMPLETE:');
-    if (taskHasMarker && outputLikelyContainsInjectedPrompt) {
-      return output.includes(marker, first + marker.length);
-    }
-    return true;
-  }
-
-  private parseOwnerDecision(
-    step: WorkflowStep,
-    ownerOutput: string,
-    hasMarker: boolean
-  ): { decision: WorkflowOwnerDecision; reason?: string } | null {
-    const decisionPattern =
-      /OWNER_DECISION:\s*(COMPLETE|INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION)\b/gi;
-    const decisionMatches = [...ownerOutput.matchAll(decisionPattern)];
-    const outputLikelyContainsEchoedPrompt =
-      ownerOutput.includes('STEP OWNER CONTRACT') ||
-      ownerOutput.includes('Preferred final decision format') ||
-      ownerOutput.includes('one of COMPLETE, INCOMPLETE_RETRY') ||
-      ownerOutput.includes('COMPLETE|INCOMPLETE_RETRY');
-
-    if (decisionMatches.length === 0) {
-      if (!hasMarker) return null;
-      return {
-        decision: 'COMPLETE',
-        reason: `Legacy completion marker observed: STEP_COMPLETE:${step.name}`,
-      };
-    }
-
-    // Filter out matches that appear on a template/instruction line (e.g.
-    // "COMPLETE|INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION") to avoid
-    // picking up the template format as the agent's actual decision.
-    const realMatches = outputLikelyContainsEchoedPrompt
-      ? decisionMatches.filter((m) => {
-          const lineStart = ownerOutput.lastIndexOf('\n', m.index!) + 1;
-          const lineEnd = ownerOutput.indexOf('\n', m.index!);
-          const line = ownerOutput.slice(lineStart, lineEnd === -1 ? undefined : lineEnd);
-          return !line.includes('COMPLETE|INCOMPLETE_RETRY');
-        })
-      : decisionMatches;
-    const decisionMatch =
-      realMatches.length > 0
-        ? realMatches[realMatches.length - 1]
-        : decisionMatches[decisionMatches.length - 1];
-    const decision = decisionMatch?.[1]?.toUpperCase() as WorkflowOwnerDecision | undefined;
-    if (
-      decision !== 'COMPLETE' &&
-      decision !== 'INCOMPLETE_RETRY' &&
-      decision !== 'INCOMPLETE_FAIL' &&
-      decision !== 'NEEDS_CLARIFICATION'
-    ) {
-      return null;
-    }
-
-    const reasonPattern = /(?:^|\n)REASON:\s*(.+)/gi;
-    const reasonMatches = [...ownerOutput.matchAll(reasonPattern)];
-    const reasonMatch =
-      outputLikelyContainsEchoedPrompt && reasonMatches.length > 1
-        ? reasonMatches[reasonMatches.length - 1]
-        : reasonMatches[0];
-    const reason = reasonMatch?.[1]?.trim();
-
-    return {
-      decision,
-      reason: reason && reason !== '<one sentence>' ? reason : undefined,
-    };
-  }
-
-  private stripEchoedPromptLines(output: string, patterns: RegExp[]): string {
-    return output
-      .split('\n')
-      .map((line) => line.trim())
-      .filter(Boolean)
-      .filter((line) => patterns.every((pattern) => !pattern.test(line)))
-      .join('\n');
-  }
-
-  private outputContainsVerificationToken(output: string, token: string, injectedTaskText?: string): boolean {
-    if (!token) {
-      return false;
-    }
-    return stripInjectedTaskEcho(output, injectedTaskText).includes(token);
-  }
-
-  private prepareInteractiveSpawnTask(
-    agentName: string,
-    taskText: string
-  ): { spawnTaskText: string; promptTaskText: string; taskTmpFile?: string } {
-    if (Buffer.byteLength(taskText, 'utf8') <= WorkflowRunner.PTY_TASK_ARG_SIZE_LIMIT) {
-      return {
-        spawnTaskText: taskText,
-        promptTaskText: taskText,
-      };
-    }
-
-    const taskTmpDir = mkdtempSync(path.join(tmpdir(), 'relay-pty-task-'));
-    const taskTmpFile = path.join(taskTmpDir, `${agentName}-${Date.now()}.txt`);
-    writeFileSync(taskTmpFile, taskText, { encoding: 'utf8', mode: 0o600, flag: 'wx' });
-    const promptTaskText =
-      `TASK_FILE:${taskTmpFile}\n` +
-      'Read that file completely before taking any action.\n' +
-      'Treat the file contents as the full workflow task and follow them exactly.\n' +
-      'Do not ask for the task again.';
-
-    return {
-      spawnTaskText: promptTaskText,
-      promptTaskText,
-      taskTmpFile,
-    };
-  }
-
-  private firstMeaningfulLine(output: string): string | undefined {
-    return output
-      .split('\n')
-      .map((line) => line.trim())
-      .find(Boolean);
-  }
-
-  private judgeOwnerCompletionByEvidence(stepName: string, ownerOutput: string): string | null {
-    // Never infer completion when the raw output contains an explicit retry/fail/clarification signal.
-    if (/OWNER_DECISION:\s*(?:INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION)\b/i.test(ownerOutput)) {
-      return null;
-    }
-    const sanitized = this.stripEchoedPromptLines(ownerOutput, [
-      /^STEP OWNER CONTRACT:?$/i,
-      /^Preferred final decision format:?$/i,
-      /^OWNER_DECISION:\s*(?:COMPLETE\|INCOMPLETE_RETRY|<one of COMPLETE, INCOMPLETE_RETRY)/i,
-      /^REASON:\s*<one sentence>$/i,
-      /^Legacy completion marker still supported:/i,
-      /^STEP_COMPLETE:/i,
-    ]);
-    if (!sanitized) return null;
-
-    const hasExplicitSelfRelease =
-      /Calling\s+(?:[\w.-]+\.)?remove_agent\(\{[^<\n]*"reason":"task completed"/i.test(sanitized);
-    const hasPositiveConclusion =
-      /\b(complete(?:d)?|done|verified|looks correct|safe handoff|artifact verified)\b/i.test(sanitized) ||
-      /\bartifacts?\b.*\b(correct|verified|complete)\b/i.test(sanitized) ||
-      hasExplicitSelfRelease;
-    const evidence = this.getStepCompletionEvidence(stepName);
-    const hasValidatedCoordinationSignal =
-      evidence?.coordinationSignals.some(
-        (signal) =>
-          signal.kind === 'worker_done' ||
-          signal.kind === 'lead_done' ||
-          signal.kind === 'verification_passed' ||
-          (signal.kind === 'process_exit' && signal.value === '0')
-      ) ?? false;
-    const hasValidatedInspectionSignal =
-      evidence?.toolSideEffects.some(
-        (effect) =>
-          effect.type === 'owner_monitoring' &&
-          (/Checked git diff stats/i.test(effect.detail) ||
-            /Listed files for verification/i.test(effect.detail))
-      ) ?? false;
-    const hasEvidenceSignal = hasValidatedCoordinationSignal || hasValidatedInspectionSignal;
-
-    if (!hasPositiveConclusion || !hasEvidenceSignal) {
-      return null;
-    }
-
-    return this.firstMeaningfulLine(sanitized) ?? 'Evidence-backed completion';
-  }
-
-  /**
-   * Process-exit fallback: when agent exits with code 0 but posts no coordination
-   * signal, check if verification passes (or no verification is configured) and
-   * infer completion. This is the key mechanism for reducing agent compliance
-   * dependence — the runner trusts a clean exit + passing verification over
-   * requiring exact signal text.
-   */
-  private tryProcessExitFallback(
-    step: WorkflowStep,
-    specialistOutput: string,
-    verificationTaskText?: string,
-    ownerOutput?: string
-  ): CompletionDecisionResult | null {
-    const gracePeriodMs = this.currentConfig?.swarm.completionGracePeriodMs ?? 5000;
-    if (gracePeriodMs === 0) return null;
-
-    // Never infer completion when the owner explicitly requested retry/fail/clarification.
-    if (
-      ownerOutput &&
-      /OWNER_DECISION:\s*(?:INCOMPLETE_RETRY|INCOMPLETE_FAIL|NEEDS_CLARIFICATION)\b/i.test(ownerOutput)
-    ) {
-      return null;
-    }
-
-    const evidence = this.getStepCompletionEvidence(step.name);
-    const hasCleanExit =
-      evidence?.coordinationSignals.some(
-        (signal) => signal.kind === 'process_exit' && signal.value === '0'
-      ) ?? false;
-
-    if (!hasCleanExit) return null;
-
-    // If verification is configured, it must pass for the fallback to succeed.
-    if (step.verification) {
-      const verificationResult = this.runVerification(
-        step.verification,
-        specialistOutput,
-        step.name,
-        verificationTaskText,
-        { allowFailure: true }
-      );
-      if (!verificationResult.passed) return null;
-    }
-
-    return {
-      completionReason: 'completed_by_process_exit',
-      reason: `Process exited with code 0${step.verification ? ' and verification passed' : ''} — coordination signal not required`,
-    };
-  }
-
-  private async runStepReviewGate(
-    step: WorkflowStep,
-    resolvedTask: string,
-    specialistOutput: string,
-    ownerOutput: string,
-    ownerDef: AgentDefinition,
-    reviewerDef: AgentDefinition,
-    timeoutMs?: number
-  ): Promise<string> {
-    const reviewSnippetMax = 12_000;
-    let specialistSnippet = specialistOutput;
-    if (specialistOutput.length > reviewSnippetMax) {
-      const head = Math.floor(reviewSnippetMax / 2);
-      const tail = reviewSnippetMax - head;
-      const omitted = specialistOutput.length - head - tail;
-      specialistSnippet =
-        `${specialistOutput.slice(0, head)}\n` +
-        `...[truncated ${omitted} chars for review]...\n` +
-        `${specialistOutput.slice(specialistOutput.length - tail)}`;
-    }
-
-    let ownerSnippet = ownerOutput;
-    if (ownerOutput.length > reviewSnippetMax) {
-      const head = Math.floor(reviewSnippetMax / 2);
-      const tail = reviewSnippetMax - head;
-      const omitted = ownerOutput.length - head - tail;
-      ownerSnippet =
-        `${ownerOutput.slice(0, head)}\n` +
-        `...[truncated ${omitted} chars for review]...\n` +
-        `${ownerOutput.slice(ownerOutput.length - tail)}`;
-    }
-
-    const reviewTask =
-      `Review workflow step "${step.name}" for completion and safe handoff.\n` +
-      `Step owner: ${ownerDef.name}\n` +
-      `Original objective:\n${resolvedTask}\n\n` +
-      `Specialist output:\n${specialistSnippet}\n\n` +
-      `Owner verification notes:\n${ownerSnippet}\n\n` +
-      `Return exactly:\n` +
-      `REVIEW_DECISION: APPROVE or REJECT\n` +
-      `REVIEW_REASON: <one sentence>\n` +
-      `Then output /exit.`;
-
-    const safetyTimeoutMs = timeoutMs ?? 600_000;
-    const reviewStep: WorkflowStep = {
-      name: `${step.name}-review`,
-      type: 'agent',
-      agent: reviewerDef.name,
-      task: reviewTask,
-    };
-
-    await this.trajectory?.registerAgent(reviewerDef.name, 'reviewer');
-    this.postToChannel(`**[${step.name}]** Review started (reviewer: ${reviewerDef.name})`);
-    this.recordStepToolSideEffect(step.name, {
-      type: 'review_started',
-      detail: `Review started with ${reviewerDef.name}`,
-      raw: { reviewer: reviewerDef.name },
-    });
-    const emitReviewCompleted = async (decision: 'approved' | 'rejected', reason?: string) => {
-      this.recordStepToolSideEffect(step.name, {
-        type: 'review_completed',
-        detail: `Review ${decision} by ${reviewerDef.name}${reason ? `: ${reason}` : ''}`,
-        raw: { reviewer: reviewerDef.name, decision, reason },
-      });
-      await this.trajectory?.reviewCompleted(step.name, reviewerDef.name, decision, reason);
-      this.emit({
-        type: 'step:review-completed',
-        runId: this.currentRunId ?? '',
-        stepName: step.name,
-        reviewerName: reviewerDef.name,
-        decision,
-      });
-    };
-
-    if (this.executor) {
-      const reviewOutput = await this.executor.executeAgentStep(
-        reviewStep,
-        reviewerDef,
-        reviewTask,
-        safetyTimeoutMs
-      );
-      const parsed = this.parseReviewDecision(reviewOutput);
-      if (!parsed) {
-        throw new Error(
-          `Step "${step.name}" review response malformed from "${reviewerDef.name}" (missing REVIEW_DECISION)`
-        );
-      }
-      await emitReviewCompleted(parsed.decision, parsed.reason);
-      if (parsed.decision === 'rejected') {
-        throw new Error(`Step "${step.name}" review rejected by "${reviewerDef.name}"`);
-      }
-      this.postToChannel(`**[${step.name}]** Review approved by \`${reviewerDef.name}\``);
-      return reviewOutput;
-    }
-
-    let reviewerHandle: Agent | undefined;
-    let reviewerReleased = false;
-    let reviewOutput = '';
-    let completedReview: { decision: 'approved' | 'rejected'; reason?: string } | undefined;
-    let reviewCompletionPromise: Promise<void> | undefined;
-    const reviewCompletionStarted = { value: false };
-
-    const startReviewCompletion = (parsed: { decision: 'approved' | 'rejected'; reason?: string }) => {
-      if (reviewCompletionStarted.value) return;
-      reviewCompletionStarted.value = true;
-      completedReview = parsed;
-      reviewCompletionPromise = (async () => {
-        await emitReviewCompleted(parsed.decision, parsed.reason);
-        if (reviewerHandle && !reviewerReleased) {
-          reviewerReleased = true;
-          await reviewerHandle.release().catch(() => undefined);
-        }
-      })();
-    };
-
-    try {
-      await this.spawnAndWait(reviewerDef, reviewStep, safetyTimeoutMs, {
-        evidenceStepName: step.name,
-        evidenceRole: 'reviewer',
-        logicalName: reviewerDef.name,
-        onSpawned: ({ agent }) => {
-          reviewerHandle = agent;
-        },
-        onChunk: ({ chunk }) => {
-          const nextOutput = reviewOutput + WorkflowRunner.stripAnsi(chunk);
-          reviewOutput = nextOutput;
-          const parsed = this.parseReviewDecision(nextOutput);
-          if (parsed) {
-            startReviewCompletion(parsed);
-          }
-        },
-      });
-      await reviewCompletionPromise;
-    } catch (error) {
-      const message = error instanceof Error ? error.message : String(error);
-      if (/\btimed out\b/i.test(message)) {
-        this.log(`[${step.name}] Review safety backstop timeout fired after ${safetyTimeoutMs}ms`);
-        throw new Error(`Step "${step.name}" review safety backstop timed out after ${safetyTimeoutMs}ms`);
-      }
-      throw error;
-    }
-
-    if (!completedReview) {
-      const parsed = this.parseReviewDecision(reviewOutput);
-      if (!parsed) {
-        throw new Error(
-          `Step "${step.name}" review response malformed from "${reviewerDef.name}" (missing REVIEW_DECISION)`
-        );
-      }
-      completedReview = parsed;
-      await emitReviewCompleted(parsed.decision, parsed.reason);
-    }
-
-    if (completedReview.decision === 'rejected') {
-      throw new Error(`Step "${step.name}" review rejected by "${reviewerDef.name}"`);
-    }
-
-    this.postToChannel(`**[${step.name}]** Review approved by \`${reviewerDef.name}\``);
-    return reviewOutput;
-  }
-
-  private parseReviewDecision(
-    reviewOutput: string
-  ): { decision: 'approved' | 'rejected'; reason?: string } | null {
-    const strict = this.parseStrictReviewDecision(reviewOutput);
-    if (strict) {
-      return strict;
-    }
-
-    const tolerant = this.parseTolerantReviewDecision(reviewOutput);
-    if (tolerant) {
-      return tolerant;
-    }
-
-    return this.judgeReviewDecisionFromEvidence(reviewOutput);
-  }
-
-  private parseStrictReviewDecision(
-    reviewOutput: string
-  ): { decision: 'approved' | 'rejected'; reason?: string } | null {
-    const decisionPattern = /REVIEW_DECISION:\s*(APPROVE|REJECT)/gi;
-    const decisionMatches = [...reviewOutput.matchAll(decisionPattern)];
-    if (decisionMatches.length === 0) {
-      return null;
-    }
-
-    const outputLikelyContainsEchoedPrompt =
-      reviewOutput.includes('Return exactly') || reviewOutput.includes('REVIEW_DECISION: APPROVE or REJECT');
-    const realReviewMatches = outputLikelyContainsEchoedPrompt
-      ? decisionMatches.filter((m) => {
-          const lineStart = reviewOutput.lastIndexOf('\n', m.index!) + 1;
-          const lineEnd = reviewOutput.indexOf('\n', m.index!);
-          const line = reviewOutput.slice(lineStart, lineEnd === -1 ? undefined : lineEnd);
-          return !line.includes('APPROVE or REJECT');
-        })
-      : decisionMatches;
-    const decisionMatch =
-      realReviewMatches.length > 0
-        ? realReviewMatches[realReviewMatches.length - 1]
-        : decisionMatches[decisionMatches.length - 1];
-    const decision = decisionMatch?.[1]?.toUpperCase();
-    if (decision !== 'APPROVE' && decision !== 'REJECT') {
-      return null;
-    }
-
-    const reasonPattern = /REVIEW_REASON:\s*(.+)/gi;
-    const reasonMatches = [...reviewOutput.matchAll(reasonPattern)];
-    const reasonMatch =
-      outputLikelyContainsEchoedPrompt && reasonMatches.length > 1
-        ? reasonMatches[reasonMatches.length - 1]
-        : reasonMatches[0];
-    const reason = reasonMatch?.[1]?.trim();
-
-    return {
-      decision: decision === 'APPROVE' ? 'approved' : 'rejected',
-      reason: reason && reason !== '<one sentence>' ? reason : undefined,
-    };
-  }
-
-  private parseTolerantReviewDecision(
-    reviewOutput: string
-  ): { decision: 'approved' | 'rejected'; reason?: string } | null {
-    const sanitized = this.stripEchoedPromptLines(reviewOutput, [
-      /^Return exactly:?$/i,
-      /^REVIEW_DECISION:\s*APPROVE\s+or\s+REJECT$/i,
-      /^REVIEW_REASON:\s*<one sentence>$/i,
-    ]);
-    if (!sanitized) {
-      return null;
-    }
-
-    const lines = sanitized
-      .split('\n')
-      .map((line) => line.trim())
-      .filter(Boolean);
-    for (const line of lines) {
-      const candidate = line.replace(/^REVIEW_DECISION:\s*/i, '').trim();
-      const decision = this.normalizeReviewDecisionCandidate(candidate);
-      if (decision) {
-        return {
-          decision,
-          reason: this.parseReviewReason(sanitized) ?? this.firstMeaningfulLine(sanitized),
-        };
-      }
-    }
-
-    const decision = this.normalizeReviewDecisionCandidate(lines.join(' '));
-    if (!decision) {
-      return null;
-    }
-
-    return {
-      decision,
-      reason: this.parseReviewReason(sanitized) ?? this.firstMeaningfulLine(sanitized),
-    };
-  }
-
-  private normalizeReviewDecisionCandidate(candidate: string): 'approved' | 'rejected' | null {
-    const value = candidate.trim().toLowerCase();
-    if (!value) return null;
-
-    if (
-      /^(approve|approved|complete|completed|pass|passed|accept|accepted|lgtm|ship it|looks good|looks fine)\b/i.test(
-        value
-      )
-    ) {
-      return 'approved';
-    }
-    if (
-      /^(reject|rejected|retry|retry requested|fail|failed|incomplete|needs clarification|not complete|not ready|insufficient evidence)\b/i.test(
-        value
-      )
-    ) {
-      return 'rejected';
-    }
-    return null;
-  }
-
-  private parseReviewReason(reviewOutput: string): string | undefined {
-    const reasonPattern = /REVIEW_REASON:\s*(.+)/gi;
-    const reasonMatches = [...reviewOutput.matchAll(reasonPattern)];
-    const outputLikelyContainsEchoedPrompt =
-      reviewOutput.includes('Return exactly') || reviewOutput.includes('REVIEW_DECISION: APPROVE or REJECT');
-    const reasonMatch =
-      outputLikelyContainsEchoedPrompt && reasonMatches.length > 1
-        ? reasonMatches[reasonMatches.length - 1]
-        : reasonMatches[0];
-    const reason = reasonMatch?.[1]?.trim();
-    return reason && reason !== '<one sentence>' ? reason : undefined;
-  }
-
-  private judgeReviewDecisionFromEvidence(
-    reviewOutput: string
-  ): { decision: 'approved' | 'rejected'; reason?: string } | null {
-    const sanitized = this.stripEchoedPromptLines(reviewOutput, [
-      /^Return exactly:?$/i,
-      /^REVIEW_DECISION:\s*APPROVE\s+or\s+REJECT$/i,
-      /^REVIEW_REASON:\s*<one sentence>$/i,
-    ]);
-    if (!sanitized) {
-      return null;
-    }
-
-    const hasPositiveEvidence =
-      /\b(approved?|complete(?:d)?|verified|looks good|looks fine|safe handoff|pass(?:ed)?)\b/i.test(
-        sanitized
-      );
-    const hasNegativeEvidence =
-      /\b(reject(?:ed)?|retry|fail(?:ed)?|incomplete|missing checks|insufficient evidence|not safe)\b/i.test(
-        sanitized
-      );
-
-    if (hasNegativeEvidence) {
-      return {
-        decision: 'rejected',
-        reason: this.parseReviewReason(sanitized) ?? this.firstMeaningfulLine(sanitized),
-      };
-    }
-    if (!hasPositiveEvidence) {
-      return null;
-    }
-
-    return {
-      decision: 'approved',
-      reason: this.parseReviewReason(sanitized) ?? this.firstMeaningfulLine(sanitized),
-    };
-  }
-
-  private combineStepAndReviewOutput(stepOutput: string, reviewOutput: string): string {
-    const primary = stepOutput.trimEnd();
-    const review = reviewOutput.trim();
-    if (!review) return primary;
-    if (!primary) return `REVIEW_OUTPUT\n${review}\n`;
-    return `${primary}\n\n---\nREVIEW_OUTPUT\n${review}\n`;
-  }
-
-  /**
-   * Build the CLI command and arguments for a non-interactive agent execution.
-   * Delegates to the consolidated CLI registry for per-CLI arg formats.
-   */
-  static buildNonInteractiveCommand(
-    cli: AgentCli,
-    task: string,
-    extraArgs: string[] = []
-  ): { cmd: string; args: string[] } {
-    const [cmd, ...args] = buildProcessCommand(cli, extraArgs, task);
-    return {
-      cmd,
-      args,
-    };
-  }
-
-  /**
-   * Apply preset defaults to an agent definition.
-   * Explicit fields on the definition always win over preset-inferred defaults.
-   */
-  private static resolveAgentDef(def: AgentDefinition): AgentDefinition {
-    // Resolve "cursor" alias to whichever cursor agent binary is in PATH
-    const resolvedCli: AgentCli = def.cli === 'cursor' ? resolveCursorCli() : def.cli;
-
-    if (!def.preset) return resolvedCli !== def.cli ? { ...def, cli: resolvedCli } : def;
-    const nonInteractivePresets: AgentPreset[] = ['worker', 'reviewer', 'analyst'];
-    const defaults: Partial<AgentDefinition> = nonInteractivePresets.includes(def.preset)
-      ? { interactive: false }
-      : {};
-    // Explicit fields on the def always win
-    return { ...defaults, ...def, cli: resolvedCli } as AgentDefinition;
-  }
-
-  /**
-   * Returns a preset-specific prefix that is prepended to the non-interactive
-   * enforcement block in execNonInteractive.
-   */
-  /**
-   * Returns a prefix injected into the task prompt for non-interactive agents.
-   * Lead agents are always interactive (PTY), so they never reach execNonInteractive
-   * and there is no 'lead' case here.
-   */
-  private buildPresetInjection(preset: AgentPreset | undefined): string {
-    switch (preset) {
-      case 'worker':
-        return (
-          'You are a non-interactive worker agent. Produce clean, structured output to stdout.\n' +
-          'Do NOT use mcp__relaycast__add_agent, add_agent, or any MCP tool to spawn sub-agents.\n' +
-          'Do NOT use mcp__relaycast__send_dm or any Relaycast messaging tools — you have no relay connection.\n\n'
-        );
-      case 'reviewer':
-        return (
-          'You are a non-interactive reviewer agent. Read the specified files/artifacts and produce a clear verdict.\n' +
-          'Do NOT spawn sub-agents or use any Relaycast messaging tools.\n\n'
-        );
-      case 'analyst':
-        return (
-          'You are a non-interactive analyst agent. Read the specified code/files and write your findings.\n' +
-          'Do NOT spawn sub-agents or use any Relaycast messaging tools.\n\n'
-        );
-      default:
-        return '';
-    }
-  }
-
-  /**
-   * Execute an agent as a non-interactive subprocess.
-   * No PTY, no relay messaging, no /exit injection. The process receives its task
-   * as a CLI argument and stdout is captured as the step output.
-   */
-  private async execNonInteractive(
-    agentDef: AgentDefinition,
-    step: WorkflowStep,
-    timeoutMs?: number
-  ): Promise<SpawnResult> {
-    const agentName = `${step.name}-${this.generateShortId()}`;
-    const modelArgs = agentDef.constraints?.model ? ['--model', agentDef.constraints.model] : [];
-
-    // Append strict deliverable enforcement — non-interactive agents MUST produce
-    // clear, structured output since there's no opportunity for follow-up or clarification.
-    const presetPrefix = this.buildPresetInjection(agentDef.preset);
-    const taskWithDeliverable =
-      presetPrefix +
-      step.task +
-      '\n\n---\n' +
-      'IMPORTANT: You are running as a non-interactive subprocess. ' +
-      'Do NOT call mcp__relaycast__add_agent, add_agent, or any MCP tool to spawn or manage other agents.\n\n' +
-      'CRITICAL REQUIREMENT — YOU MUST FOLLOW THIS EXACTLY:\n' +
-      'You are running in non-interactive mode. There is NO opportunity for follow-up, ' +
-      'clarification, or additional input. Your stdout output is your ONLY deliverable.\n\n' +
-      'You MUST:\n' +
-      '1. Complete the ENTIRE task in a single pass — no partial work, no "I\'ll continue later"\n' +
-      '2. Print your COMPLETE deliverable to stdout — this is the ONLY output that will be captured\n' +
-      '3. Be thorough and self-contained — another agent will consume your output with zero context about your process\n' +
-      '4. End with a clear summary of what was accomplished and any artifacts produced\n\n' +
-      'DO NOT:\n' +
-      '- Ask questions or request clarification (there is no one to answer)\n' +
-      '- Output partial results expecting a follow-up (there will be none)\n' +
-      '- Skip steps or leave work incomplete\n' +
-      '- Output only status messages without the actual deliverable content';
-
-    const { cmd, args } = WorkflowRunner.buildNonInteractiveCommand(
-      agentDef.cli,
-      taskWithDeliverable,
-      modelArgs
-    );
-
-    // Open a log file for dashboard observability
-    const logsDir = this.getWorkerLogsDir();
-    const logPath = path.join(logsDir, `${agentName}.log`);
-    const logStream = createWriteStream(logPath, { flags: 'a' });
-
-    // Register in workers.json with interactive: false metadata
-    this.registerWorker(agentName, agentDef.cli, step.task ?? '', undefined, false);
-
-    // Register agent in Relaycast for observability
-    let stopHeartbeat: (() => void) | undefined;
-    if (this.relayApiKey) {
-      const agentClient = await this.registerRelaycastExternalAgent(
-        agentName,
-        `Non-interactive workflow agent for step "${step.name}" (${agentDef.cli})`
-      ).catch((err) => {
-        console.warn(`[WorkflowRunner] Failed to register ${agentName} in Relaycast:`, err?.message ?? err);
-        return null;
-      });
-      if (agentClient) {
-        stopHeartbeat = this.startRelaycastHeartbeat(agentClient);
-      }
-    }
-
-    // Post assignment notification (no task content — task arrives via direct broker injection)
-    this.postToChannel(`**[${step.name}]** Assigned to \`${agentName}\` (non-interactive)`);
-
-    const stdoutChunks: string[] = [];
-    const stderrChunks: string[] = [];
-    const proxyMode = await this.resolveAgentProxyMode(agentDef, this.currentConfig);
-    const env = { ...(this.getRelayEnv(proxyMode) ?? filteredEnv()) };
-    if (proxyMode?.url && proxyMode.token) {
-      Object.assign(env, resolveProxyEnv(agentDef.cli, proxyMode.url, proxyMode.token));
-    }
-    const agentToken = this.agentTokens.get(agentDef.name);
-    const mount = this.agentMounts.get(agentDef.name);
-    if (agentToken) {
-      env.RELAY_AGENT_TOKEN = agentToken;
-      env.RELAYFILE_TOKEN = agentToken;
-    }
-    if (mount) {
-      env.RELAY_WORKSPACE = mount.mountPoint;
-      env.RELAY_AGENT_NAME = agentName;
-      env.RELAYFILE_WORKSPACE = this.workspaceId;
-      env.RELAY_WORKSPACE_ID = this.workspaceId;
-      env.RELAY_DEFAULT_WORKSPACE = this.workspaceId;
-    }
-    env.RELAYFILE_BASE_URL =
-      env.RELAYFILE_BASE_URL ??
-      this.getRelayEnv(proxyMode)?.RELAYFILE_BASE_URL ??
-      process.env.RELAYFILE_BASE_URL ??
-      'http://127.0.0.1:8080';
-
-    try {
-      const {
-        stdout: output,
-        exitCode,
-        exitSignal,
-      } = await new Promise<{ stdout: string; exitCode?: number; exitSignal?: string }>((resolve, reject) => {
-        const spawnEnv =
-          agentDef.cli === 'opencode'
-            ? {
-                ...env,
-                OPENCODE_PERMISSION: JSON.stringify({ '*': 'allow', external_directory: { '*': 'allow' } }),
-              }
-            : env;
-        const child = spawnProcess([cmd, ...args], {
-          stdio: ['ignore', 'pipe', 'pipe'],
-          cwd: this.resolveExecutionCwd(step, agentDef),
-          env: spawnEnv,
-        });
-
-        // Update workers.json with PID now that we have it
-        this.registerWorker(agentName, agentDef.cli, step.task ?? '', child.pid, false);
-
-        // Wire abort signal so runner.abort() kills the child process
-        const abortSignal = this.abortController?.signal;
-        let abortHandler: (() => void) | undefined;
-        if (abortSignal && !abortSignal.aborted) {
-          abortHandler = () => {
-            child.kill('SIGTERM');
-            setTimeout(() => child.kill('SIGKILL'), 5000);
-          };
-          abortSignal.addEventListener('abort', abortHandler, { once: true });
-        }
-
-        // Heartbeat so a slow non-interactive agent doesn't look frozen.
-        // Each tick shows the last substantive line received — gives insight
-        // without flooding the log with raw model output.
-        const startedAt = Date.now();
-        let lastHeartbeatLine = '';
-        const heartbeat = setInterval(() => {
-          const elapsed = Math.round((Date.now() - startedAt) / 1000);
-          const suffix = lastHeartbeatLine ? ` — ${lastHeartbeatLine.slice(0, 80)}` : '';
-          this.log(`[${step.name}] still running (${elapsed}s)${suffix}`);
-          lastHeartbeatLine = '';
-        }, 30_000);
-
-        child.stdout?.on('data', (chunk: Buffer) => {
-          const text = chunk.toString();
-          stdoutChunks.push(text);
-          logStream.write(text);
-          // Track last substantive line for the next heartbeat
-          const line =
-            text
-              .split('\n')
-              .map((l) => l.trim())
-              .filter(Boolean)
-              .at(-1) ?? '';
-          if (line) lastHeartbeatLine = line;
-        });
-
-        child.stderr?.on('data', (chunk: Buffer) => {
-          const text = chunk.toString();
-          stderrChunks.push(text);
-          logStream.write(`[stderr] ${text}`);
-        });
-
-        // Handle timeout
-        let timedOut = false;
-        let timer: ReturnType<typeof setTimeout> | undefined;
-        if (timeoutMs) {
-          timer = setTimeout(() => {
-            timedOut = true;
-            child.kill('SIGTERM');
-            // Give process time to clean up, then force kill
-            setTimeout(() => child.kill('SIGKILL'), 5000);
-          }, timeoutMs);
-        }
-
-        child.on('close', (code, signal) => {
-          clearInterval(heartbeat);
-          if (timer) clearTimeout(timer);
-          if (abortHandler && abortSignal) {
-            abortSignal.removeEventListener('abort', abortHandler);
-          }
-          const stdout = stdoutChunks.join('');
-
-          if (abortSignal?.aborted) {
-            reject(new Error(`Step "${step.name}" aborted`));
-            return;
-          }
-
-          if (timedOut) {
-            reject(new Error(`Step "${step.name}" timed out after ${timeoutMs ?? 'unknown'}ms`));
-            return;
-          }
-
-          const cliDef = getCliDefinition(agentDef.cli);
-          if (code !== 0 && code !== null && !cliDef?.ignoreExitCode) {
-            const stderr = stderrChunks.join('');
-            reject(
-              new SpawnExitError(
-                `Step "${step.name}" exited with code ${code}${stderr ? `: ${stderr.slice(0, 500)}` : ''}`,
-                code,
-                signal
-              )
-            );
-            return;
-          }
-
-          resolve({
-            stdout,
-            exitCode: code ?? undefined,
-            exitSignal: signal ?? undefined,
-          });
-        });
-
-        child.on('error', (err) => {
-          clearInterval(heartbeat);
-          if (timer) clearTimeout(timer);
-          if (abortHandler && abortSignal) {
-            abortSignal.removeEventListener('abort', abortHandler);
-          }
-          reject(new Error(`Failed to spawn ${cmd}: ${err.message}`));
-        });
-      });
-
-      this.captureStepTerminalEvidence(step.name, {}, { exitCode, exitSignal });
-      return { output, exitCode, exitSignal };
-    } finally {
-      const stdout = stdoutChunks.join('');
-      const stderr = stderrChunks.join('');
-      const combinedOutput = stdout + stderr;
-      this.lastFailedStepOutput.set(step.name, combinedOutput);
-      this.captureStepTerminalEvidence(step.name, {
-        stdout,
-        stderr,
-        combined: combinedOutput,
-      });
-      stopHeartbeat?.();
-      logStream.end();
-      this.unregisterWorker(agentName);
-    }
-  }
-
-  private async spawnAndWait(
-    agentDef: AgentDefinition,
-    step: WorkflowStep,
-    timeoutMs?: number,
-    options: SpawnAndWaitOptions = {}
-  ): Promise<SpawnResult> {
-    // Branch: non-interactive agents run as simple subprocesses
-    if (agentDef.interactive === false) {
-      return this.execNonInteractive(agentDef, step, timeoutMs);
-    }
-
-    if (!this.relay) {
-      throw new Error('AgentRelay not initialized');
-    }
-
-    const evidenceStepName = options.evidenceStepName ?? step.name;
-
-    const baseRequestedName = this.buildWorkflowRuntimeAgentBaseName(step.name, options);
-    const requestedName =
-      (options.retryAttempt ?? 0) > 0
-        ? `${baseRequestedName}-r${(options.retryAttempt ?? 0) + 1}`
-        : baseRequestedName;
-    let agentName = requestedName;
-
-    if ((options.retryAttempt ?? 0) > 0) {
-      await this.releaseStaleRetryAgents(baseRequestedName, step.name);
-    }
-
-    // Only inject delegation guidance for lead/coordinator agents, not spokes/workers.
-    // In non-hub patterns (pipeline, dag, etc.) every agent is autonomous so they all get it.
-    const role = agentDef.role?.toLowerCase() ?? '';
-    const nameLC = agentDef.name.toLowerCase();
-    const isHub =
-      WorkflowRunner.HUB_ROLES.has(nameLC) ||
-      [...WorkflowRunner.HUB_ROLES].some((r) => new RegExp(`\\b${r}\\b`).test(role));
-    const pattern = this.currentConfig?.swarm.pattern;
-    const isHubPattern = pattern && WorkflowRunner.HUB_PATTERNS.has(pattern);
-    const usesHeadlessWorkflowSpawner = agentDef.cli === 'opencode';
-    const delegationGuidance =
-      usesHeadlessWorkflowSpawner || (!isHub && isHubPattern)
-        ? ''
-        : this.buildDelegationGuidance(agentDef.cli, timeoutMs);
-
-    // Non-claude CLIs (codex, gemini, etc.) don't auto-register with Relaycast
-    // via the MCP system prompt the way claude does. Inject an explicit preamble
-    // so they call register_agent() before any other relay tool.
-    const relayRegistrationNote = usesHeadlessWorkflowSpawner
-      ? ''
-      : this.buildRelayRegistrationNote(agentDef.cli, agentName);
-
-    const interactiveTaskBase = step.task ?? '';
-    const taskWithExit = usesHeadlessWorkflowSpawner
-      ? interactiveTaskBase
-      : interactiveTaskBase +
-        (relayRegistrationNote ? '\n\n' + relayRegistrationNote : '') +
-        (delegationGuidance ? '\n\n' + delegationGuidance + '\n' : '') +
-        '\n\n---\n' +
-        'IMPORTANT: When you have fully completed this task, you MUST self-terminate by either: ' +
-        '(a) calling remove_agent(name: "<your-agent-name>", reason: "task completed") — preferred, or ' +
-        '(b) outputting the exact text "/exit" on its own line as a fallback. ' +
-        'Do not wait for further input — terminate immediately after finishing. ' +
-        'Do NOT spawn sub-agents unless the task explicitly requires it.';
-    const preparedTask = this.prepareInteractiveSpawnTask(agentName, taskWithExit);
-
-    // Register PTY output listener before spawning so we capture everything
-    this.ptyOutputBuffers.set(agentName, []);
-
-    // Open a log file so `agents:logs <name>` works for workflow-spawned agents
-    const logsDir = this.getWorkerLogsDir();
-    const logStream = createWriteStream(path.join(logsDir, `${agentName}.log`), { flags: 'a' });
-    this.ptyLogStreams.set(agentName, logStream);
-
-    this.ptyListeners.set(agentName, (chunk: string) => {
-      const stripped = WorkflowRunner.stripAnsi(chunk);
-      this.ptyOutputBuffers.get(agentName)?.push(stripped);
-      // Write raw output (with ANSI codes) to log file so dashboard's
-      // XTermLogViewer can render colors/formatting natively via xterm.js
-      logStream.write(chunk);
-      options.onChunk?.({ agentName, chunk });
-    });
-
-    const agentChannels = this.channel ? [this.channel] : agentDef.channels;
-
-    let agent: Agent | undefined;
-    let exitResult: string = 'unknown';
-    let stopHeartbeat: (() => void) | undefined;
-    let ptyChunks: string[] = [];
-
-    try {
-      const agentCwd = this.resolveExecutionCwd(step, agentDef);
-      const interactiveSpawnPolicy = resolveSpawnPolicy({
-        AGENT_NAME: agentName,
-        AGENT_CLI: agentDef.cli,
-        RELAY_API_KEY: this.relayApiKey ?? 'workflow-runner',
-        AGENT_CHANNELS: (agentChannels ?? []).join(','),
-      });
-      const proxyMode = await this.resolveAgentProxyMode(agentDef, this.currentConfig);
-      const baseEnv = this.getRelayEnv(proxyMode);
-      const proxyEnvOverrides =
-        proxyMode?.url && proxyMode.token
-          ? resolveProxyEnv(agentDef.cli, proxyMode.url, proxyMode.token)
-          : undefined;
-      const spawnOptions = {
-        name: agentName,
-        model: agentDef.constraints?.model,
-        args: interactiveSpawnPolicy.args,
-        channels: agentChannels,
-        task: preparedTask.spawnTaskText,
-        idleThresholdSecs: agentDef.constraints?.idleThresholdSecs,
-        cwd: agentCwd,
-        agentToken: this.agentTokens.get(agentDef.name),
-        env: proxyEnvOverrides ? { ...baseEnv, ...proxyEnvOverrides } : baseEnv,
-      };
-      const sdkSpawner = getWorkflowSdkSpawner(this.relay, agentDef.cli);
-      if (sdkSpawner) {
-        this.log(
-          `[${step.name}] Using SDK spawner for ${agentDef.cli} (requested runtime: ${agentDef.cli === 'opencode' ? 'headless' : 'pty'})`
-        );
-        agent = await sdkSpawner.spawn(spawnOptions as Parameters<AgentSpawner['spawn']>[0]);
-      } else {
-        this.log(`[${step.name}] Using PTY fallback for ${agentDef.cli}`);
-        agent = await this.relay.spawnPty({
-          ...(spawnOptions as Record<string, unknown>),
-          cli: agentDef.cli,
-        } as Parameters<AgentRelay['spawnPty']>[0]);
-      }
-
-      // Re-key PTY maps if broker assigned a different name than requested
-      if (agent.name !== agentName) {
-        const oldName = agentName;
-        this.ptyOutputBuffers.set(agent.name, this.ptyOutputBuffers.get(oldName) ?? []);
-        this.ptyOutputBuffers.delete(oldName);
-
-        // Close old log stream and rename the file to match the new agent name
-        const oldLogPath = path.join(logsDir, `${oldName}.log`);
-        const newLogPath = path.join(logsDir, `${agent.name}.log`);
-        const oldLogStream = this.ptyLogStreams.get(oldName);
-        if (oldLogStream) {
-          oldLogStream.end();
-          this.ptyLogStreams.delete(oldName);
-          try {
-            renameSync(oldLogPath, newLogPath);
-          } catch {
-            // File may not exist yet if no output was written
-          }
-        }
-
-        // Open new log stream with the correct name
-        const newLogStream = createWriteStream(newLogPath, { flags: 'a' });
-        this.ptyLogStreams.set(agent.name, newLogStream);
-
-        // Update listener to use the new log stream
-        const oldListener = this.ptyListeners.get(oldName);
-        if (oldListener) {
-          this.ptyListeners.delete(oldName);
-          const resolvedAgentName = agent.name;
-          this.ptyListeners.set(resolvedAgentName, (chunk: string) => {
-            const stripped = WorkflowRunner.stripAnsi(chunk);
-            this.ptyOutputBuffers.get(resolvedAgentName)?.push(stripped);
-            newLogStream.write(chunk);
-            options.onChunk?.({ agentName: resolvedAgentName, chunk });
-          });
-        }
-
-        agentName = agent.name;
-      }
-
-      const liveAgent = agent;
-      await options.onSpawned?.({ requestedName, actualName: liveAgent.name, agent: liveAgent });
-      this.runtimeStepAgents.set(liveAgent.name, {
-        stepName: evidenceStepName,
-        role: options.evidenceRole ?? agentDef.role ?? 'agent',
-        logicalName: options.logicalName ?? agentDef.name,
-      });
-      const signalParticipant = this.resolveSignalParticipantKind(
-        options.evidenceRole ?? agentDef.role ?? 'agent'
-      );
-      if (signalParticipant) {
-        this.rememberStepSignalSender(
-          evidenceStepName,
-          signalParticipant,
-          liveAgent.name,
-          options.logicalName ?? agentDef.name
-        );
-      }
-
-      // Register in workers.json so `agents:kill` can find this agent
-      let workerPid: number | undefined;
-      try {
-        const rawAgents = await this.relay!.listAgentsRaw();
-        workerPid = rawAgents.find((a) => a.name === agentName)?.pid ?? undefined;
-      } catch {
-        // Best-effort PID lookup
-      }
-      this.registerWorker(agentName, agentDef.cli, step.task ?? '', workerPid);
-
-      // Register the spawned agent in Relaycast for observability + start heartbeat
-      if (this.relayApiKey) {
-        const agentClient = await this.registerRelaycastExternalAgent(
-          liveAgent.name,
-          `Workflow agent for step "${step.name}" (${agentDef.cli})`
-        ).catch((err) => {
-          console.warn(
-            `[WorkflowRunner] Failed to register ${liveAgent.name} in Relaycast:`,
-            err?.message ?? err
-          );
-          return null;
-        });
-
-        // Keep the agent online in the dashboard while it's working
-        if (agentClient) {
-          stopHeartbeat = this.startRelaycastHeartbeat(agentClient);
-        }
-      }
-
-      // Invite the spawned agent to the workflow channel
-      if (this.channel && this.relayApiKey) {
-        const channelAgent = await this.ensureRelaycastRunnerAgent().catch(() => null);
-        await channelAgent?.channels.invite(this.channel, agent.name).catch(() => {});
-      }
-
-      // Keep operational assignment chatter out of the agent coordination channel.
-      this.log(`[${step.name}] Assigned to ${agent.name}`);
-
-      // Register agent handle for hub-mediated nudging
-      this.activeAgentHandles.set(agentName, agent);
-
-      // Wait for agent to exit, with idle nudging if configured
-      exitResult = await this.waitForExitWithIdleNudging(
-        agent,
-        agentDef,
-        step,
-        timeoutMs,
-        preparedTask.promptTaskText,
-        options.preserveOnIdle ?? this.shouldPreserveIdleSupervisor(agentDef, step, options.evidenceRole)
-      );
-
-      // Stop heartbeat now that agent has exited
-      stopHeartbeat?.();
-
-      if (exitResult === 'timeout') {
-        // Grace-period fallback: before failing, check if the agent completed
-        // its work but just failed to self-terminate. Run verification if
-        // configured — a passing gate + timeout is better than a hard failure.
-        let timeoutRecovered = false;
-        if (step.verification) {
-          const ptyOutput = (this.ptyOutputBuffers.get(agentName) ?? []).join('');
-          const verificationResult = this.runVerification(
-            step.verification,
-            ptyOutput,
-            step.name,
-            preparedTask.promptTaskText,
-            { allowFailure: true }
-          );
-          if (verificationResult.passed) {
-            this.log(`[${step.name}] Agent timed out but verification passed — treating as complete`);
-            this.postToChannel(
-              `**[${step.name}]** Agent idle after completing work — verification passed, releasing`
-            );
-            await agent.release().catch(() => undefined);
-            timeoutRecovered = true;
-          }
-        }
-        if (!timeoutRecovered) {
-          await agent.release().catch(() => undefined);
-          throw new Error(`Step "${step.name}" timed out after ${timeoutMs ?? 'unknown'}ms`);
-        }
-      }
-
-      if (exitResult === 'force-released') {
-        throw new Error(
-          `Step "${step.name}" failed — agent was force-released after exhausting idle nudges without completing`
-        );
-      }
-    } finally {
-      // Snapshot PTY chunks before cleanup — we need them for output reading below
-      ptyChunks = this.ptyOutputBuffers.get(agentName) ?? [];
-      this.lastFailedStepOutput.set(step.name, ptyChunks.join(''));
-      if (ptyChunks.length > 0 || agent?.exitCode !== undefined || agent?.exitSignal !== undefined) {
-        this.captureStepTerminalEvidence(
-          evidenceStepName,
-          {
-            stdout: ptyChunks.length > 0 ? ptyChunks.join('') : undefined,
-            combined: ptyChunks.length > 0 ? ptyChunks.join('') : undefined,
-          },
-          {
-            exitCode: agent?.exitCode,
-            exitSignal: agent?.exitSignal,
-          },
-          {
-            sender: options.logicalName ?? agentDef.name,
-            actor: agent?.name ?? agentName,
-            role: options.evidenceRole ?? agentDef.role ?? 'agent',
-          }
-        );
-      }
-
-      // Always clean up PTY resources — prevents fd leaks if spawnPty or waitForExit throws
-      stopHeartbeat?.();
-      this.activeAgentHandles.delete(agentName);
-      this.ptyOutputBuffers.delete(agentName);
-      this.ptyListeners.delete(agentName);
-      const stream = this.ptyLogStreams.get(agentName);
-      if (stream) {
-        stream.end();
-        this.ptyLogStreams.delete(agentName);
-      }
-      this.unregisterWorker(agentName);
-      this.supervisedRuntimeAgents.delete(agentName);
-      this.runtimeStepAgents.delete(agentName);
-      if (preparedTask.taskTmpFile) {
-        await unlink(preparedTask.taskTmpFile).catch(() => undefined);
-      }
-    }
-
-    let output: string;
-    if (ptyChunks.length > 0) {
-      output = ptyChunks.join('');
-    } else {
-      // Legacy fallback: summary file
-      const summaryPath = path.join(this.summaryDir, `${step.name}.md`);
-      output = existsSync(summaryPath)
-        ? await readFile(summaryPath, 'utf-8')
-        : exitResult === 'timeout'
-          ? 'Agent completed (released after idle timeout)'
-          : exitResult === 'released'
-            ? 'Agent completed (idle — treated as done)'
-            : `Agent exited (${exitResult})`;
-    }
-
-    if (ptyChunks.length === 0) {
-      this.captureStepTerminalEvidence(
-        evidenceStepName,
-        { stdout: output, combined: output },
-        { exitCode: agent?.exitCode, exitSignal: agent?.exitSignal },
-        {
-          sender: options.logicalName ?? agentDef.name,
-          actor: agent?.name ?? agentName,
-          role: options.evidenceRole ?? agentDef.role ?? 'agent',
-        }
-      );
-    }
-
-    return {
-      output,
-      exitCode: agent?.exitCode,
-      exitSignal: agent?.exitSignal,
-      promptTaskText: preparedTask.promptTaskText,
-    };
-  }
-
-  // ── Idle nudging ────────────────────────────────────────────────────────
-
-  /** Patterns where a hub agent coordinates spoke agents. */
-  private static readonly HUB_PATTERNS = new Set<string>([
-    'fan-out',
-    'hub-spoke',
-    'hierarchical',
-    'map-reduce',
-    'scatter-gather',
-    'supervisor',
-    'saga',
-    'auction',
-  ]);
-
-  /** Roles that indicate a coordinator/lead agent (eligible for delegation guidance). */
-  private static readonly HUB_ROLES = new Set([
-    'lead',
-    'hub',
-    'coordinator',
-    'supervisor',
-    'orchestrator',
-    'auctioneer',
-  ]);
-
-  private isLeadLikeAgent(agentDef: AgentDefinition, roleOverride?: string): boolean {
-    if (agentDef.preset === 'lead') return true;
-
-    const role = (roleOverride ?? agentDef.role ?? '').toLowerCase();
-    const nameLC = agentDef.name.toLowerCase();
-    return [...WorkflowRunner.HUB_ROLES].some(
-      (hubRole) =>
-        new RegExp(`\\b${hubRole}\\b`, 'i').test(nameLC) || new RegExp(`\\b${hubRole}\\b`, 'i').test(role)
-    );
-  }
-
-  private shouldPreserveIdleSupervisor(
-    agentDef: AgentDefinition,
-    step: WorkflowStep,
-    evidenceRole?: string
-  ): boolean {
-    if (evidenceRole && /\bowner\b/i.test(evidenceRole)) {
-      return true;
-    }
-
-    if (!this.isLeadLikeAgent(agentDef, evidenceRole)) {
-      return false;
-    }
-
-    const task = step.task ?? '';
-    return /\b(wait|waiting|monitor|supervis|check inbox|check.*channel|poll|DONE|_DONE|signal|handoff)\b/i.test(
-      task
-    );
-  }
-
-  /**
-   * Wait for agent exit with idle detection and nudging.
-   * If no idle nudge config is set, falls through to simple waitForExit.
-   */
-  private async waitForExitWithIdleNudging(
-    agent: Agent,
-    agentDef: AgentDefinition,
-    step: WorkflowStep,
-    timeoutMs?: number,
-    promptTaskText?: string,
-    preserveIdleSupervisor = false
-  ): Promise<'exited' | 'timeout' | 'released' | 'force-released'> {
-    const nudgeConfig = this.currentConfig?.swarm.idleNudge;
-    if (!nudgeConfig) {
-      if (preserveIdleSupervisor) {
-        this.log(
-          `[${step.name}] Supervising agent "${agent.name}" may idle while waiting — using exit-only completion`
-        );
-        return agent.waitForExit(timeoutMs);
-      }
-
-      // Idle = done: race exit against idle, but only accept idle if verification passes.
-      const idleLoopStart = Date.now();
-      while (true) {
-        const elapsed = Date.now() - idleLoopStart;
-        const remaining = timeoutMs != null ? Math.max(0, timeoutMs - elapsed) : undefined;
-        if (remaining != null && remaining <= 0) {
-          return 'timeout';
-        }
-        const result = await Promise.race([
-          agent.waitForExit(remaining).then((r) => ({ kind: 'exit' as const, result: r })),
-          agent.waitForIdle(remaining).then((r) => ({ kind: 'idle' as const, result: r })),
-        ]);
-        if (result.kind === 'idle' && result.result === 'idle') {
-          // Check verification before treating idle as complete.
-          if (step.verification && step.verification.type === 'output_contains') {
-            const token = step.verification.value;
-            const ptyOutput = (this.ptyOutputBuffers.get(agent.name) ?? []).join('');
-            const verificationPassed = this.outputContainsVerificationToken(ptyOutput, token, promptTaskText);
-            if (!verificationPassed) {
-              // The broker fires agent_idle only once per idle transition.
-              // If the agent is still working (will produce output then idle again),
-              // continuing the loop works. But if the agent is permanently idle,
-              // waitForIdle won't resolve again. Wait briefly for new output,
-              // then release and let upstream verification handle the result.
-              this.log(
-                `[${step.name}] Agent "${agent.name}" went idle but verification not yet passed — waiting for more output`
-              );
-              const idleGraceSecs = 15;
-              const graceResult = await Promise.race([
-                agent.waitForExit(idleGraceSecs * 1000).then((r) => ({ kind: 'exit' as const, result: r })),
-                agent.waitForIdle(idleGraceSecs * 1000).then((r) => ({ kind: 'idle' as const, result: r })),
-              ]);
-              if (graceResult.kind === 'idle' && graceResult.result === 'idle') {
-                // Agent went idle again after producing output — re-check verification
-                continue;
-              }
-              if (graceResult.kind === 'exit') {
-                return graceResult.result as 'exited' | 'timeout' | 'released';
-              }
-              // Grace period timed out — agent is permanently idle without verification.
-              // Release and let upstream executeAgentStep handle verification.
-              this.log(
-                `[${step.name}] Agent "${agent.name}" still idle after ${idleGraceSecs}s grace — releasing`
-              );
-              this.postToChannel(
-                `**[${step.name}]** Agent \`${agent.name}\` idle — releasing (verification pending)`
-              );
-              await agent.release().catch(() => undefined);
-              return 'released';
-            }
-          }
-          this.log(`[${step.name}] Agent "${agent.name}" went idle — treating as complete`);
-          this.postToChannel(`**[${step.name}]** Agent \`${agent.name}\` idle — treating as complete`);
-          await agent.release().catch(() => undefined);
-          return 'released';
-        }
-        // Exit won the race, or idle returned 'exited'/'timeout' — pass through.
-        return result.result as 'exited' | 'timeout' | 'released';
-      }
-    }
-
-    const nudgeAfterMs = nudgeConfig.nudgeAfterMs ?? 120_000;
-    const escalateAfterMs = nudgeConfig.escalateAfterMs ?? 120_000;
-    const maxNudges = nudgeConfig.maxNudges ?? 1;
-
-    let nudgeCount = 0;
-    let preservedSupervisorNoticeSent = false;
-    const startTime = Date.now();
-
-    while (true) {
-      // Calculate remaining time from overall timeout
-      const elapsed = Date.now() - startTime;
-      const remaining = timeoutMs ? timeoutMs - elapsed : undefined;
-      if (remaining !== undefined && remaining <= 0) {
-        return 'timeout';
-      }
-
-      // nudgeAfterMs = how long to wait before nudging (first interval).
-      // escalateAfterMs = how long to wait between subsequent nudges.
-      //
-      // We wait for exit, not for idle. The broker's idle_threshold_secs is
-      // only 30s by default, so racing waitForExit vs waitForIdle would nudge
-      // after 30s of PTY silence regardless of nudgeAfterMs. Instead, we give
-      // the agent the full nudgeAfterMs window to finish before nudging.
-      const windowMs = nudgeCount === 0 ? nudgeAfterMs : escalateAfterMs;
-      const waitMs = remaining !== undefined ? Math.min(windowMs, remaining) : windowMs;
-
-      const exitResult = await agent.waitForExit(waitMs);
-
-      if (exitResult !== 'timeout') {
-        // Agent actually exited or was released — done
-        return exitResult;
-      }
-
-      // Agent is still running after the window expired.
-      if (timeoutMs !== undefined && Date.now() - startTime >= timeoutMs) {
-        return 'timeout';
-      }
-
-      // Nudge if we haven't exhausted the limit
-      if (nudgeCount < maxNudges) {
-        await this.nudgeIdleAgent(agent, agentDef, step);
-        nudgeCount++;
-        this.postToChannel(`**[${step.name}]** Agent \`${agent.name}\` idle — nudge #${nudgeCount} sent`);
-        this.emit({ type: 'step:nudged', runId: this.currentRunId ?? '', stepName: step.name, nudgeCount });
-        continue;
-      }
-
-      if (preserveIdleSupervisor) {
-        if (!preservedSupervisorNoticeSent) {
-          this.log(
-            `[${step.name}] Supervising agent "${agent.name}" stayed idle after ${nudgeCount} nudge(s) — preserving until exit or timeout`
-          );
-          this.postToChannel(
-            `**[${step.name}]** Supervising agent \`${agent.name}\` is waiting on handoff — keeping it alive until it exits or the step times out`
-          );
-          preservedSupervisorNoticeSent = true;
-        }
-        continue;
-      }
-
-      // Exhausted nudges — force-release
-      this.postToChannel(
-        `**[${step.name}]** Agent \`${agent.name}\` still idle after ${nudgeCount} nudge(s) — force-releasing`
-      );
-      this.emit({ type: 'step:force-released', runId: this.currentRunId ?? '', stepName: step.name });
-      await agent.release().catch(() => undefined);
-      return 'force-released';
-    }
-  }
-
-  /**
-   * Send a nudge to an idle agent. Uses hub-mediated nudge for hub patterns,
-   * or direct system injection otherwise.
-   */
-  private async nudgeIdleAgent(agent: Agent, agentDef: AgentDefinition, step: WorkflowStep): Promise<void> {
-    const hubAgent = this.resolveHubForNudge(agentDef);
-
-    if (hubAgent) {
-      // Hub-mediated: tell the hub to check on the idle agent
-      try {
-        await hubAgent.sendMessage({
-          to: agent.name,
-          text: `Agent ${agent.name} appears idle on step "${step.name}". Check on them and remind them to /exit when done.`,
-        });
-        return; // Hub nudge succeeded
-      } catch {
-        // Fall through to direct nudge
-      }
-    }
-
-    // Direct system injection via human handle
-    if (this.relay) {
-      const human = this.relay.human({ name: 'workflow-runner' });
-      await human
-        .sendMessage({
-          to: agent.name,
-          text: "You appear idle. If you've completed your task, output /exit. If still working, continue.",
-        })
-        .catch(() => {
-          // Non-critical — don't break workflow
-        });
-    }
-  }
-
-  /**
-   * Find the hub agent for hub-mediated nudging.
-   * Returns the hub's live Agent handle if this is a hub pattern and the idle agent is not the hub.
-   */
-  private resolveHubForNudge(idleAgentDef: AgentDefinition): Agent | undefined {
-    const pattern = this.currentConfig?.swarm.pattern;
-    if (!pattern || !WorkflowRunner.HUB_PATTERNS.has(pattern)) {
-      return undefined;
-    }
-
-    // Find an interactive agent with a hub-like role
-    const agents = this.currentConfig?.agents ?? [];
-
-    for (const agentDef of agents) {
-      // Skip non-interactive and the idle agent itself
-      if (agentDef.interactive === false) continue;
-      if (agentDef.name === idleAgentDef.name) continue;
-
-      const role = agentDef.role?.toLowerCase() ?? '';
-      const nameLC = agentDef.name.toLowerCase();
-
-      if (
-        WorkflowRunner.HUB_ROLES.has(nameLC) ||
-        [...WorkflowRunner.HUB_ROLES].some((r) => new RegExp(`\\b${r}\\b`).test(role))
-      ) {
-        // Found a hub candidate — check if we have a live handle
-        const handle = this.activeAgentHandles.get(agentDef.name);
-        if (handle) return handle;
-      }
-    }
-
-    return undefined;
-  }
-
-  // ── Verification ────────────────────────────────────────────────────────
-
-  private runVerification(
-    check: VerificationCheck,
-    output: string,
-    stepName: string,
-    injectedTaskText?: string,
-    options?: VerificationOptions
-  ): VerificationResult {
-    try {
-      const result = runVerification(
-        check,
-        output,
-        stepName,
-        injectedTaskText,
-        { ...options, cwd: this.cwd },
-        {
-          recordStepToolSideEffect: (name, effect) => this.recordStepToolSideEffect(name, effect),
-          getOrCreateStepEvidenceRecord: (name) => this.getOrCreateStepEvidenceRecord(name),
-          log: (message) => this.log(message),
-        }
-      );
-
-      this.updateCustomVerificationFailure(stepName, check, result.error);
-      return result;
-    } catch (error) {
-      this.updateCustomVerificationFailure(
-        stepName,
-        check,
-        error instanceof Error ? error.message : String(error)
-      );
-      throw error;
-    }
-  }
-
-  private updateCustomVerificationFailure(
-    stepName: string,
-    check: VerificationCheck,
-    errorMessage?: string
-  ): void {
-    if (check.type !== 'custom' || !check.value || !errorMessage) {
-      this.lastCustomVerificationFailure.delete(stepName);
-      return;
-    }
-
-    const marker = `custom check "${check.value}" failed\n`;
-    const markerIndex = errorMessage.indexOf(marker);
-    const output =
-      markerIndex === -1 ? errorMessage.trim() : errorMessage.slice(markerIndex + marker.length).trim();
-
-    this.lastCustomVerificationFailure.set(stepName, {
-      command: check.value,
-      output,
-    });
-  }
-
-  // ── State helpers ─────────────────────────────────────────────────────
-
-  private async updateRunStatus(runId: string, status: WorkflowRunStatus, error?: string): Promise<void> {
-    const patch: Partial<WorkflowRunRow> = {
-      status,
-      updatedAt: new Date().toISOString(),
-    };
-    if (status === 'completed' || status === 'failed' || status === 'cancelled') {
-      patch.completedAt = new Date().toISOString();
-    }
-    if (error) {
-      patch.error = error;
-    }
-    await this.db.updateRun(runId, patch);
-  }
-
-  private async markStepFailed(
-    state: StepState,
-    error: string,
-    runId: string,
-    exitInfo?: { exitCode?: number; exitSignal?: string },
-    completionReason?: WorkflowStepCompletionReason
-  ): Promise<void> {
-    this.captureStepTerminalEvidence(state.row.stepName, {}, exitInfo);
-    state.row.status = 'failed';
-    state.row.error = error;
-    state.row.completionReason = completionReason;
-    state.row.completedAt = new Date().toISOString();
-    await this.db.updateStep(state.row.id, {
-      status: 'failed',
-      error,
-      completionReason,
-      completedAt: state.row.completedAt,
-      updatedAt: new Date().toISOString(),
-    });
-    this.emit({
-      type: 'step:failed',
-      runId,
-      stepName: state.row.stepName,
-      error,
-      exitCode: exitInfo?.exitCode,
-      exitSignal: exitInfo?.exitSignal,
-    });
-    this.finalizeStepEvidence(state.row.stepName, 'failed', state.row.completedAt, completionReason);
-  }
-
-  private async captureAgentReport(
-    runId: string,
-    stepName: string,
-    agentDef: AgentDefinition | undefined,
-    cwd: string | undefined,
-    startedAt: number | undefined,
-    completedAt: number
-  ): Promise<void> {
-    if (!agentDef || !cwd || !startedAt) return;
-
-    try {
-      const report = await collectCliSession({
-        cli: agentDef.cli,
-        cwd,
-        startedAt,
-        completedAt,
-      });
-      if (!report) return;
-
-      const totalTokens = this.getTotalReportTokens(report);
-      if (this.budgetTracker && report.tokens) {
-        this.budgetTracker.recordUsage(stepName, report.tokens);
-        this.budgetTracker.isOverBudget(stepName);
-        const budgetStatus = this.budgetTracker.getBudgetStatus(stepName);
-        if (budgetStatus.agentLimitExceeded) {
-          const stepBudget = this.budgetTracker.getStepBudgetStatus(stepName);
-          const used =
-            stepBudget?.used?.toLocaleString('en-US') ?? totalTokens?.toLocaleString('en-US') ?? '0';
-          const limit = stepBudget?.limit?.toLocaleString('en-US') ?? '--';
-          this.log(`[budget] Step ${stepName} exceeded its agent budget (${used} of ${limit})`);
-        }
-      }
-
-      this.agentReports.set(stepName, report);
-      this.emit({ type: 'step:agent-report', runId, stepName, report });
-      await this.persistAgentReport(runId, stepName, report);
-    } catch (error) {
-      this.log(
-        `[${stepName}] CLI session collection failed: ${error instanceof Error ? error.message : String(error)}`
-      );
-    }
-  }
-
-  private async markDownstreamSkipped(
-    failedStepName: string,
-    allSteps: WorkflowStep[],
-    stepStates: Map<string, StepState>,
-    runId: string
-  ): Promise<void> {
-    const queue = [failedStepName];
-    const visited = new Set<string>();
-
-    while (queue.length > 0) {
-      const current = queue.shift()!;
-      if (visited.has(current)) continue;
-      visited.add(current);
-
-      for (const step of allSteps) {
-        if (step.dependsOn?.includes(current)) {
-          const state = stepStates.get(step.name);
-          if (state && state.row.status === 'pending') {
-            state.row.status = 'skipped';
-            await this.db.updateStep(state.row.id, {
-              status: 'skipped',
-              updatedAt: new Date().toISOString(),
-            });
-            this.emit({ type: 'step:skipped', runId, stepName: step.name });
-            this.postToChannel(`**[${step.name}]** Skipped — upstream dependency "${current}" failed`);
-            await this.trajectory?.stepSkipped(step, `Upstream dependency "${current}" failed`);
-            await this.trajectory?.decide(
-              `Whether to skip ${step.name}`,
-              'skip',
-              `Upstream dependency "${current}" failed`
-            );
-            queue.push(step.name);
-          }
-        }
-      }
-    }
-  }
-
-  // ── startFrom dependency resolution ─────────────────────────────────
-
-  /**
-   * Walk the dependsOn graph backwards from a target step to collect ALL
-   * transitive dependencies (i.e. every step that must complete before
-   * the target step can run). The target step itself is NOT included.
-   */
-  private collectTransitiveDeps(targetStep: string, steps: WorkflowStep[]): Set<string> {
-    const stepMap = new Map<string, WorkflowStep>();
-    for (const s of steps) stepMap.set(s.name, s);
-
-    const deps = new Set<string>();
-    const queue = [...(stepMap.get(targetStep)?.dependsOn ?? [])];
-
-    while (queue.length > 0) {
-      const current = queue.shift()!;
-      if (deps.has(current)) continue;
-      deps.add(current);
-      const step = stepMap.get(current);
-      if (step?.dependsOn) {
-        for (const dep of step.dependsOn) {
-          if (!deps.has(dep)) queue.push(dep);
-        }
-      }
-    }
-
-    return deps;
-  }
-
-  // ── Control flow helpers ──────────────────────────────────────────────
-
-  private checkAborted(): void {
-    if (this.abortController?.signal.aborted) {
-      throw new Error('Workflow aborted');
-    }
-  }
-
-  private async waitIfPaused(): Promise<void> {
-    if (!this.paused) return;
-    await new Promise<void>((resolve) => {
-      this.pauseResolver = resolve;
-    });
-  }
-
-  private delay(ms: number): Promise<void> {
-    return new Promise((resolve) => setTimeout(resolve, ms));
-  }
-
-  // ── Channel messaging ──────────────────────────────────────────────────
-
-  /**
-   * Build a metadata note about non-interactive workers for inclusion in interactive agent tasks.
-   * Returns undefined if there are no non-interactive agents.
-   */
-  private buildNonInteractiveAwareness(
-    agentMap: Map<string, AgentDefinition>,
-    stepStates: Map<string, StepState>
-  ): string | undefined {
-    return this.channelMessenger.buildNonInteractiveAwareness(agentMap, stepStates);
-  }
-
-  /**
-   * Build guidance that encourages agents to autonomously delegate subtasks
-   * to helper agents when work is too complex for a single pass.
-   */
-  /**
-   * Returns a relay registration preamble for CLIs that don't auto-call
-   * `register` via the MCP system prompt (everyone except claude).
-   *
-   * Claude reads the Relaycast system prompt and registers on its own.
-   * Codex, gemini, etc. have the MCP server configured with the workspace
-   * key, but they won't call `register` unless explicitly told to.
-   */
-  private buildRelayRegistrationNote(cli: string, agentName: string): string {
-    return this.channelMessenger.buildRelayRegistrationNote(cli, agentName);
-  }
-
-  private buildDelegationGuidance(cli: string, timeoutMs?: number): string {
-    return this.channelMessenger.buildDelegationGuidance(cli, timeoutMs);
-  }
-
-  /** Post a message to the workflow channel. Fire-and-forget — never throws or blocks. */
-  private postToChannel(text: string, options: ChannelEvidenceOptions = {}): void {
-    if (!this.relayApiKey || !this.channel) return;
-    this.recordChannelEvidence(text, options);
-
-    const stepName = options.stepName ?? this.inferStepNameFromChannelText(text);
-    if (stepName) {
-      this.recordStepToolSideEffect(stepName, {
-        type: 'post_channel_message',
-        detail: text.slice(0, 240),
-        raw: {
-          actor: options.actor,
-          role: options.role,
-          target: options.target ?? this.channel,
-          origin: options.origin ?? 'runner_post',
-        },
-      });
-    }
-
-    this.ensureRelaycastRunnerAgent()
-      .then((agent) => agent.send(this.channel!, text))
-      .catch(() => {
-        // Non-critical — don't break workflow execution
-      });
-  }
-
-  /** Post a rich completion report to the channel. */
-  private postCompletionReport(
-    workflowName: string,
-    outcomes: StepOutcome[],
-    summary: string,
-    confidence: number
-  ): void {
-    this.channelMessenger.postCompletionReport(workflowName, outcomes, summary, confidence);
-  }
-
-  /** Post a failure report to the channel. */
-  private postFailureReport(workflowName: string, outcomes: StepOutcome[], errorMsg: string): void {
-    this.channelMessenger.postFailureReport(workflowName, outcomes, errorMsg);
-  }
-
-  /**
-   * Log a human-readable run summary to the console after completion or failure.
-   * Extracts the last meaningful lines from each step's raw PTY output.
-   */
-  private logRunSummary(workflowName: string, outcomes: StepOutcome[], runId: string): void {
-    const completed = outcomes.filter((o) => o.status === 'completed');
-    const failed = outcomes.filter((o) => o.status === 'failed');
-    const skipped = outcomes.filter((o) => o.status === 'skipped');
-
-    console.log('');
-    console.log(chalk.dim('━'.repeat(70)));
-    console.log(
-      `  Workflow "${workflowName}" — ${failed.length === 0 ? chalk.green('COMPLETED') : chalk.red('FAILED')}`
-    );
-    console.log(
-      `  ${chalk.green(`${completed.length} passed`)}, ${chalk.red(`${failed.length} failed`)}, ${chalk.dim(`${skipped.length} skipped`)}`
-    );
-    console.log(chalk.dim('━'.repeat(70)));
-
-    // Always show the summary table — with agent reports when available,
-    // with just step/status/duration when not (non-interactive agents).
-    console.log(
-      formatRunSummaryTable(outcomes, this.agentReports, this.budgetTracker?.getRunSummaryBudgetData())
-    );
-
-    // Show errors and output excerpts for failed steps below the table
-    for (const outcome of outcomes) {
-      if (outcome.status !== 'failed') continue;
-
-      if (outcome.error) {
-        console.log(chalk.red(`  ${outcome.name}: ${outcome.error}`));
-      }
-
-      if (outcome.output) {
-        const excerpt = this.extractOutputExcerpt(outcome.output);
-        if (excerpt) {
-          for (const line of excerpt.split('\n')) {
-            console.log(`    ${line}`);
-          }
-        }
-      }
-    }
-
-    // Point to detailed output files
-    const outputDir = this.getStepOutputDir(runId);
-    const logsDir = path.join(this.cwd, '.agent-relay', 'team', 'worker-logs');
-    console.log('');
-    console.log(`  Run ID:      ${runId}`);
-    console.log(`  Step output: ${outputDir}`);
-    console.log(`  Agent logs:  ${logsDir}`);
-    console.log(chalk.dim('━'.repeat(70)));
-    console.log('');
-  }
-
-  /**
-   * Extract a useful excerpt from raw PTY output.
-   * Looks for the agent's final text output (ignoring ANSI, system prompts, tool calls).
-   */
-  private extractOutputExcerpt(rawOutput: string): string {
-    const stripped = WorkflowRunner.stripAnsi(rawOutput);
-
-    // Split into lines, filter out noise
-    const lines = stripped.split('\n').filter((line) => {
-      const trimmed = line.trim();
-      if (!trimmed) return false;
-      // Skip system/UI chrome
-      if (trimmed.startsWith('╭') || trimmed.startsWith('╰') || trimmed.startsWith('│')) return false;
-      if (trimmed.startsWith('─')) return false;
-      if (trimmed.startsWith('❯') || trimmed.startsWith('⏵')) return false;
-      if (trimmed.startsWith('<system-reminder>') || trimmed.startsWith('</system-reminder>')) return false;
-      if (/^\[?workflow\s/.test(trimmed)) return false;
-      // Skip tool invocations
-      if (/^(Read|Edit|Bash|Glob|Grep|Task|Explore|Write)\(/.test(trimmed)) return false;
-      // Skip thinking indicators
-      if (/^[·✳✻✽⏺]?\s*Sublimating/.test(trimmed)) return false;
-      // Skip very short lines (likely UI fragments)
-      if (trimmed.length < 10) return false;
-      return true;
-    });
-
-    if (lines.length === 0) return '';
-
-    // Take the last few meaningful lines (agent's final words)
-    const tail = lines.slice(-5);
-    const excerpt = tail.map((l) => l.trim().slice(0, 120)).join('\n');
-    return excerpt.length > 0 ? `...\n${excerpt}` : '';
-  }
-
-  // ── Trajectory helpers ────────────────────────────────────────────────
-
-  /** Analyze DAG structure for trajectory context. */
-  private analyzeDAG(steps: WorkflowStep[]): string {
-    const roots = steps.filter((s) => !s.dependsOn?.length);
-    const withDeps = steps.filter((s) => s.dependsOn?.length);
-
-    const parts = [`Parsed ${steps.length} steps`];
-    if (roots.length > 1) {
-      parts.push(`${roots.length} parallel tracks`);
-    }
-    if (withDeps.length > 0) {
-      parts.push(`${withDeps.length} dependent steps`);
-    }
-    parts.push('DAG validated, no cycles');
-    return parts.join(', ');
-  }
-
-  /** Collect step outcomes for trajectory synthesis. */
-  private collectOutcomes(stepStates: Map<string, StepState>, steps?: WorkflowStep[]): StepOutcome[] {
-    const stepsWithVerification = new Set(steps?.filter((s) => s.verification).map((s) => s.name) ?? []);
-    const outcomes: StepOutcome[] = [];
-    for (const [name, state] of stepStates) {
-      const startedAtMs = state.row.startedAt ? Date.parse(state.row.startedAt) : Number.NaN;
-      const completedAtMs = state.row.completedAt ? Date.parse(state.row.completedAt) : Number.NaN;
-      const durationMs =
-        Number.isFinite(startedAtMs) && Number.isFinite(completedAtMs)
-          ? Math.max(0, completedAtMs - startedAtMs)
-          : undefined;
-      outcomes.push({
-        name,
-        agent: state.row.agentName ?? 'deterministic',
-        status:
-          state.row.status === 'completed'
-            ? 'completed'
-            : state.row.status === 'skipped'
-              ? 'skipped'
-              : 'failed',
-        attempts: state.row.retryCount + 1,
-        output: state.row.output,
-        error: state.row.error,
-        verificationPassed: state.row.status === 'completed' && stepsWithVerification.has(name),
-        durationMs,
-        completionMode: state.row.completionReason
-          ? this.buildStepCompletionDecision(name, state.row.completionReason)?.mode
-          : undefined,
-      });
-    }
-    return outcomes;
-  }
-
-  // ── ID generation ─────────────────────────────────────────────────────
-
-  private persistRunIdHint(runId: string): void {
-    const target = process.env.AGENT_RELAY_RUN_ID_FILE?.trim();
-    if (!target) return;
-    try {
-      mkdirSync(path.dirname(target), { recursive: true });
-      writeFileSync(target, runId + '\n', 'utf8');
-    } catch {
-      // Ignore hint persistence failures.
-    }
-  }
-
-  private generateId(): string {
-    return randomBytes(12).toString('hex');
-  }
-
-  private generateShortId(): string {
-    return randomBytes(4).toString('hex');
-  }
-
-  /** Strip ANSI escape codes from terminal output — delegates to pty.ts canonical regex. */
-  private static stripAnsi(text: string): string {
-    return stripAnsiFn(text);
-  }
-
-  /**
-   * Strip TUI chrome from PTY-captured output before posting to a channel.
-   * Removes: ANSI codes, unicode spinner/thinking characters, cursor-movement
-   * artifacts, and collapses runs of blank lines to a single blank line.
-   * The raw (ANSI-stripped) output is still written to disk for step chaining.
-   */
-  private static scrubForChannel(text: string): string {
-    return scrubWorkflowOutputForChannel(text);
-  }
-
-  /** Sanitize a workflow name into a valid channel name. */
-  private sanitizeChannelName(name: string): string {
-    return name
-      .toLowerCase()
-      .replace(/[^a-z0-9-]/g, '-')
-      .replace(/-+/g, '-')
-      .slice(0, 32);
-  }
-
-  /** Validate that a runId is safe for use in file paths (no traversal). */
-  private validateRunId(runId: string): void {
-    if (/[/\\]|^\.\.?$/.test(runId) || runId.includes('..')) {
-      throw new Error(`Invalid runId: "${runId}" contains path traversal characters`);
-    }
-  }
-
-  /** Directory for persisted step outputs: .agent-relay/step-outputs/{runId}/ */
-  private getStepOutputDir(runId: string): string {
-    this.validateRunId(runId);
-    return path.join(this.cwd, '.agent-relay', 'step-outputs', runId);
-  }
-
-  /** Persist step output to disk and post full output as a channel message. */
-  private async persistStepOutput(runId: string, stepName: string, output: string): Promise<void> {
-    // 1. Write to disk
-    const outputPath = path.join(this.getStepOutputDir(runId), `${stepName}.md`);
-    try {
-      const dir = this.getStepOutputDir(runId);
-      mkdirSync(dir, { recursive: true });
-      const cleaned = WorkflowRunner.stripAnsi(output);
-      await writeFile(outputPath, cleaned);
-    } catch {
-      // Non-critical
-    }
-    this.recordStepToolSideEffect(stepName, {
-      type: 'persist_step_output',
-      detail: `Persisted step output to ${this.normalizeEvidencePath(outputPath)}`,
-      raw: { path: outputPath },
-    });
-
-    // 2. Post scrubbed output as a single channel message (most recent tail only)
-    const scrubbed = WorkflowRunner.scrubForChannel(output);
-    if (scrubbed.length === 0) {
-      this.postToChannel(`**[${stepName}]** Step completed — output written to disk`, { stepName });
-      return;
-    }
-
-    const maxMsg = 2000;
-    const preview = scrubbed.length > maxMsg ? scrubbed.slice(-maxMsg) : scrubbed;
-    // Surface the final output preview in the local workflow log immediately.
-    // Some deterministic wrappers grep stdout/stderr for completion sentinels,
-    // and fire-and-forget channel delivery can arrive too late for single-step runs.
-    this.log(`[${stepName}] Output:\n\`\`\`\n${preview}\n\`\`\``);
-    this.postToChannel(`**[${stepName}] Output:**\n\`\`\`\n${preview}\n\`\`\``, { stepName });
-  }
-
-  private async persistAgentReport(runId: string, stepName: string, report: CliSessionReport): Promise<void> {
-    const reportPath = path.join(this.getStepOutputDir(runId), `${stepName}.report.json`);
-    try {
-      mkdirSync(this.getStepOutputDir(runId), { recursive: true });
-      await writeFile(reportPath, JSON.stringify(report, null, 2), 'utf8');
-    } catch {
-      // Non-critical
-    }
-  }
-
-  /** Scan .agent-relay/step-outputs/ for the most recent run directory containing the needed steps. */
-  private findMostRecentRunWithSteps(stepNames: Set<string>): string | undefined {
-    try {
-      const baseDir = path.join(this.cwd, '.agent-relay', 'step-outputs');
-      if (!existsSync(baseDir)) return undefined;
-
-      const entries = readdirSync(baseDir);
-      let best: { name: string; mtime: number } | undefined;
-
-      for (const entry of entries) {
-        const dirPath = path.join(baseDir, entry);
-        try {
-          const stat = statSync(dirPath);
-          if (!stat.isDirectory()) continue;
-
-          // Check if this directory has at least one of the needed step files
-          const hasAny = [...stepNames].some((name) => existsSync(path.join(dirPath, `${name}.md`)));
-          if (!hasAny) continue;
-
-          if (!best || stat.mtimeMs > best.mtime) {
-            best = { name: entry, mtime: stat.mtimeMs };
-          }
-        } catch {
-          continue;
-        }
-      }
-
-      return best?.name;
-    } catch {
-      return undefined;
-    }
-  }
-
-  /** Load persisted step output from disk. */
-  private loadStepOutput(runId: string, stepName: string): string | undefined {
-    try {
-      const filePath = path.join(this.getStepOutputDir(runId), `${stepName}.md`);
-      if (!existsSync(filePath)) return undefined;
-      return readFileSync(filePath, 'utf-8');
-    } catch {
-      return undefined;
-    }
-  }
-
-  /** Match the best workflow from config given a set of cached step names. */
-  private matchWorkflowFromCache(
-    workflows: WorkflowDefinition[],
-    cachedStepNames: Set<string>
-  ): WorkflowDefinition | null {
-    if (workflows.length === 1) return workflows[0];
-
-    if (cachedStepNames.size === 0) {
-      // No cached steps to disambiguate — ambiguous when multiple workflows exist
-      this.log('[resume] Multiple workflows in config with empty cache — cannot disambiguate');
-      return null;
-    }
-
-    // Score each workflow by how many cached steps match, excluding those with unknown steps
-    const scored = workflows
-      .map((candidate) => ({
-        workflow: candidate,
-        matchedSteps: candidate.steps.filter((step) => cachedStepNames.has(step.name)).length,
-        unknownSteps: [...cachedStepNames].filter(
-          (name) => !candidate.steps.some((step) => step.name === name)
-        ).length,
-      }))
-      .filter((candidate) => candidate.unknownSteps === 0)
-      .sort((a, b) => b.matchedSteps - a.matchedSteps);
-
-    return scored[0]?.workflow ?? null;
-  }
-
-  private reconstructRunFromCache(
-    runId: string,
-    config?: RelayYamlConfig
-  ): { run: WorkflowRunRow; stepStates: Map<string, StepState> } | null {
-    const stepOutputDir = this.getStepOutputDir(runId);
-    if (!existsSync(stepOutputDir)) return null;
-
-    let resumeConfig = config ?? this.currentConfig;
-    if (!resumeConfig) {
-      // Attempt to load config from relay.yaml on disk (resume() may call before runWorkflowCore sets currentConfig)
-      const yamlPath = path.join(this.cwd, 'relay.yaml');
-      if (existsSync(yamlPath)) {
-        try {
-          const raw = readFileSync(yamlPath, 'utf-8');
-          resumeConfig = this.parseYamlString(raw, yamlPath);
-        } catch {
-          return null;
-        }
-      } else {
-        return null;
-      }
-    }
-
-    let entries: Dirent[];
-    try {
-      entries = readdirSync(stepOutputDir, { withFileTypes: true });
-    } catch {
-      return null;
-    }
-
-    const cachedStepNames = new Set(
-      entries
-        .filter((entry) => entry.isFile() && entry.name.endsWith('.md'))
-        .map((entry) => entry.name.slice(0, -3))
-        .filter(Boolean)
-    );
-    const workflows = resumeConfig.workflows ?? [];
-    if (workflows.length === 0) return null;
-
-    // Empty cache directory is valid — all steps will be re-run
-    const workflow = this.matchWorkflowFromCache(workflows, cachedStepNames);
-    if (!workflow) return null;
-
-    // Use actual file modification times from cached outputs instead of synthetic timestamps
-    const stepMtimes = new Map<string, string>();
-    let earliestMtime = Date.now();
-    for (const stepName of cachedStepNames) {
-      try {
-        const mdPath = path.join(stepOutputDir, `${stepName}.md`);
-        const reportPath = path.join(stepOutputDir, `${stepName}.report.json`);
-        const mdStat = existsSync(mdPath) ? statSync(mdPath) : null;
-        const reportStat = existsSync(reportPath) ? statSync(reportPath) : null;
-        // Use the latest mtime between .md and .report.json
-        const mtime = Math.max(mdStat?.mtimeMs ?? 0, reportStat?.mtimeMs ?? 0);
-        if (mtime > 0) {
-          stepMtimes.set(stepName, new Date(mtime).toISOString());
-          if (mtime < earliestMtime) earliestMtime = mtime;
-        }
-      } catch {
-        // Fall back to current time if stat fails
-      }
-    }
-    const fallbackTime = new Date().toISOString();
-
-    const completedSteps = new Set(
-      workflow.steps.filter((step) => cachedStepNames.has(step.name)).map((step) => step.name)
-    );
-    // Heuristic: mark the first eligible non-completed step as failed (the likely failure point)
-    const failedStepName = workflow.steps.find(
-      (step) =>
-        !completedSteps.has(step.name) && (step.dependsOn ?? []).every((dep) => completedSteps.has(dep))
-    )?.name;
-
-    const runStartedAt = new Date(earliestMtime).toISOString();
-    const run: WorkflowRunRow = {
-      id: runId,
-      workspaceId: this.workspaceId,
-      workflowName: workflow.name,
-      pattern: resumeConfig.swarm.pattern,
-      status: 'failed',
-      config: resumeConfig,
-      startedAt: runStartedAt,
-      createdAt: runStartedAt,
-      updatedAt: fallbackTime,
-    };
-
-    const stepStates = new Map<string, StepState>();
-    for (const step of workflow.steps) {
-      const isNonAgent =
-        step.type === 'deterministic' || step.type === 'worktree' || step.type === 'integration';
-      const cachedOutput = completedSteps.has(step.name) ? this.loadStepOutput(runId, step.name) : undefined;
-      const status: WorkflowStepStatus = completedSteps.has(step.name)
-        ? 'completed'
-        : step.name === failedStepName
-          ? 'failed'
-          : 'pending';
-
-      const stepRow: WorkflowStepRow = {
-        id: this.generateId(),
-        runId,
-        stepName: step.name,
-        agentName: isNonAgent ? null : (step.agent ?? null),
-        stepType: isNonAgent ? (step.type as 'deterministic' | 'worktree' | 'integration') : 'agent',
-        status,
-        task:
-          step.type === 'deterministic'
-            ? (step.command ?? '')
-            : step.type === 'worktree'
-              ? (step.branch ?? '')
-              : step.type === 'integration'
-                ? `${step.integration}.${step.action}`
-                : (step.task ?? ''),
-        dependsOn: step.dependsOn ?? [],
-        output: cachedOutput,
-        error: status === 'failed' ? 'Recovered from cached step outputs' : undefined,
-        completedAt: status === 'completed' ? (stepMtimes.get(step.name) ?? fallbackTime) : undefined,
-        retryCount: 0,
-        createdAt: stepMtimes.get(step.name) ?? fallbackTime,
-        updatedAt: stepMtimes.get(step.name) ?? fallbackTime,
-      };
-      stepStates.set(step.name, { row: stepRow });
-    }
-
-    return { run, stepStates };
-  }
-
-  /** Get or create the worker logs directory (.agent-relay/team/worker-logs) */
-  private getWorkerLogsDir(): string {
-    const logsDir = path.join(this.cwd, '.agent-relay', 'team', 'worker-logs');
-    mkdirSync(logsDir, { recursive: true });
-    return logsDir;
-  }
-
-  /** Register a spawned agent in workers.json so `agents:kill` can find it. */
-  private registerWorker(
-    agentName: string,
-    cli: string,
-    task: string,
-    pid?: number,
-    interactive = true
-  ): void {
-    // Track in memory first (no race condition)
-    const workerEntry = {
-      cli,
-      task: task.slice(0, 500),
-      spawnedAt: Date.now(),
-      pid,
-      interactive,
-      logFile: path.join(this.getWorkerLogsDir(), `${agentName}.log`),
-    };
-    this.activeWorkers.set(agentName, workerEntry);
-
-    // Serialize file writes with mutex to prevent race conditions
-    this.workersFileLock = this.workersFileLock.then(() => {
-      try {
-        mkdirSync(path.dirname(this.workersPath), { recursive: true });
-        // Filter out any existing entry with the same name before adding
-        const existing = this.readWorkers().filter((w) => w.name !== agentName);
-        existing.push({ name: agentName, ...workerEntry });
-        this.writeWorkers(existing);
-      } catch {
-        // Non-critical — don't fail the workflow if workers.json can't be written
-      }
-    });
-  }
-
-  /** Remove a spawned agent from workers.json after it exits. */
-  private unregisterWorker(agentName: string): void {
-    // Remove from in-memory tracking first
-    this.activeWorkers.delete(agentName);
-
-    // Serialize file writes with mutex to prevent race conditions
-    this.workersFileLock = this.workersFileLock.then(() => {
-      try {
-        const existing = this.readWorkers();
-        const filtered = existing.filter((w) => w.name !== agentName);
-        this.writeWorkers(filtered);
-      } catch {
-        // Non-critical
-      }
-    });
-  }
-
-  private readWorkers(): Array<Record<string, unknown>> {
-    try {
-      if (!existsSync(this.workersPath)) return [];
-      const raw = JSON.parse(readFileSync(this.workersPath, 'utf-8'));
-      return Array.isArray(raw?.workers) ? raw.workers : [];
-    } catch {
-      return [];
-    }
-  }
-
-  private writeWorkers(workers: Array<Record<string, unknown>>): void {
-    writeFileSync(this.workersPath, JSON.stringify({ workers }, null, 2));
-  }
-}
diff --git a/packages/sdk/src/workflows/schema.json b/packages/sdk/src/workflows/schema.json
deleted file mode 100644
index c04325384..000000000
--- a/packages/sdk/src/workflows/schema.json
+++ /dev/null
@@ -1,940 +0,0 @@
-{
-  "$schema": "http://json-schema.org/draft-07/schema#",
-  "$id": "RelayYamlConfig",
-  "title": "Relay YAML Configuration",
-  "description": "Schema for relay.yaml workflow configuration files",
-  "type": "object",
-  "required": ["version", "name", "swarm"],
-  "additionalProperties": false,
-  "properties": {
-    "version": {
-      "type": "string",
-      "description": "Configuration schema version"
-    },
-    "name": {
-      "type": "string",
-      "description": "Human-readable name for this relay configuration"
-    },
-    "description": {
-      "type": "string",
-      "description": "Optional description of the configuration"
-    },
-    "permission_profiles": {
-      "type": "object",
-      "description": "Reusable permission profiles that agents can reference via permissions.profile.",
-      "additionalProperties": {
-        "$ref": "#/definitions/PermissionProfile"
-      }
-    },
-    "paths": {
-      "type": "array",
-      "description": "Named paths to external directories. The primary working directory defaults to cwd. Use this to declare additional directories so the runner can validate them in preflight and agents can reference them via workdir.",
-      "items": {
-        "$ref": "#/definitions/PathDefinition"
-      }
-    },
-    "swarm": {
-      "$ref": "#/definitions/SwarmConfig"
-    },
-    "agents": {
-      "type": "array",
-      "items": {
-        "$ref": "#/definitions/AgentDefinition"
-      }
-    },
-    "workflows": {
-      "type": "array",
-      "items": {
-        "$ref": "#/definitions/WorkflowDefinition"
-      }
-    },
-    "coordination": {
-      "$ref": "#/definitions/CoordinationConfig"
-    },
-    "state": {
-      "$ref": "#/definitions/StateConfig"
-    },
-    "errorHandling": {
-      "$ref": "#/definitions/ErrorHandlingConfig"
-    },
-    "trajectories": {
-      "description": "Trajectory recording config, or false to disable trajectory output",
-      "anyOf": [
-        {
-          "$ref": "#/definitions/TrajectoryConfig"
-        },
-        {
-          "type": "boolean",
-          "enum": [false]
-        }
-      ]
-    }
-  },
-  "definitions": {
-    "PathDefinition": {
-      "type": "object",
-      "required": ["name", "path"],
-      "additionalProperties": false,
-      "properties": {
-        "name": {
-          "type": "string",
-          "description": "Unique name used to reference this project (e.g. 'relaycast', 'relay')"
-        },
-        "path": {
-          "type": "string",
-          "description": "Path to the project root, resolved relative to the YAML file. Supports env vars: $HOME/.openclaw"
-        },
-        "description": {
-          "type": "string",
-          "description": "Human-readable description of this project's role in the workflow"
-        },
-        "required": {
-          "type": "boolean",
-          "default": true,
-          "description": "Whether this project is required. If true (default), preflight fails if path doesn't exist."
-        }
-      }
-    },
-    "SwarmConfig": {
-      "type": "object",
-      "required": ["pattern"],
-      "additionalProperties": false,
-      "properties": {
-        "pattern": {
-          "$ref": "#/definitions/SwarmPattern"
-        },
-        "maxConcurrency": {
-          "type": "integer",
-          "minimum": 1,
-          "description": "Maximum number of agents running concurrently"
-        },
-        "timeoutMs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Global swarm timeout in milliseconds"
-        },
-        "tokenBudget": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Maximum total tokens allowed across all workflow steps"
-        },
-        "channel": {
-          "type": "string",
-          "description": "Default relay channel for agent communication"
-        },
-        "idleNudge": {
-          "$ref": "#/definitions/IdleNudgeConfig"
-        },
-        "completionGracePeriodMs": {
-          "type": "integer",
-          "minimum": 0,
-          "default": 5000,
-          "description": "Grace period (ms) after an agent exits with code 0 but without posting the expected coordination signal. During this window the runner checks verification gates and evidence before failing. Set to 0 to disable."
-        }
-      }
-    },
-    "IdleNudgeConfig": {
-      "type": "object",
-      "additionalProperties": false,
-      "description": "Configuration for idle agent detection and nudging",
-      "properties": {
-        "nudgeAfterMs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Milliseconds after idle detection before first nudge (default: 120000)"
-        },
-        "escalateAfterMs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Milliseconds after nudge before force-release (default: 120000)"
-        },
-        "maxNudges": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Maximum nudges before escalation (default: 1)"
-        }
-      }
-    },
-    "SwarmPattern": {
-      "type": "string",
-      "enum": [
-        "fan-out",
-        "pipeline",
-        "hub-spoke",
-        "consensus",
-        "mesh",
-        "handoff",
-        "cascade",
-        "dag",
-        "debate",
-        "hierarchical",
-        "map-reduce",
-        "scatter-gather",
-        "supervisor",
-        "reflection",
-        "red-team",
-        "verifier",
-        "auction",
-        "escalation",
-        "saga",
-        "circuit-breaker",
-        "blackboard",
-        "swarm",
-        "competitive"
-      ]
-    },
-    "AgentDefinition": {
-      "type": "object",
-      "required": ["name", "cli"],
-      "additionalProperties": false,
-      "properties": {
-        "name": {
-          "type": "string",
-          "description": "Unique agent name within the workflow"
-        },
-        "cli": {
-          "$ref": "#/definitions/AgentCli"
-        },
-        "role": {
-          "type": "string",
-          "description": "Agent role description"
-        },
-        "task": {
-          "type": "string",
-          "description": "Default task assigned to the agent"
-        },
-        "channels": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Relay channels the agent should join"
-        },
-        "constraints": {
-          "$ref": "#/definitions/AgentConstraints"
-        },
-        "interactive": {
-          "type": "boolean",
-          "default": true,
-          "description": "When false, the agent runs as a non-interactive subprocess (no PTY, no relay messaging). It receives its task as a CLI prompt argument and returns stdout as output. Default: true."
-        },
-        "cwd": {
-          "type": "string",
-          "description": "Working directory for this agent, resolved relative to the YAML file."
-        },
-        "workdir": {
-          "type": "string",
-          "description": "Sets this agent's working directory to a named entry from the top-level paths array. Mutually exclusive with cwd."
-        },
-        "additionalPaths": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Additional paths the agent needs read/write access to."
-        },
-        "permissions": {
-          "$ref": "#/definitions/AgentPermissions"
-        },
-        "preset": {
-          "type": "string",
-          "enum": ["lead", "worker", "reviewer", "analyst"],
-          "description": "Role preset that automatically configures interactive mode and injects appropriate task guardrails. lead: interactive PTY, relay-aware. worker/reviewer/analyst: interactive: false, no sub-agents."
-        }
-      }
-    },
-    "AgentCli": {
-      "type": "string",
-      "enum": [
-        "claude",
-        "codex",
-        "gemini",
-        "aider",
-        "goose",
-        "opencode",
-        "droid",
-        "cursor",
-        "cursor-agent",
-        "agent"
-      ]
-    },
-    "PermissionProfile": {
-      "type": "object",
-      "additionalProperties": false,
-      "description": "Reusable named permission profile shared by one or more agents.",
-      "properties": {
-        "description": {
-          "type": "string",
-          "description": "Human-readable summary of the profile's intended use."
-        },
-        "why": {
-          "type": "string",
-          "description": "Explain why this profile exists or what constraint it is protecting."
-        },
-        "access": {
-          "type": "string",
-          "enum": ["readonly", "readwrite", "restricted", "full"],
-          "description": "Access preset that expands to a predefined permission profile."
-        },
-        "inherit": {
-          "type": "boolean",
-          "default": true,
-          "description": "Whether to inherit restrictions from existing workspace dotfiles and defaults."
-        },
-        "files": {
-          "type": "object",
-          "additionalProperties": false,
-          "description": "Optional file path rules for agent filesystem access.",
-          "properties": {
-            "read": {
-              "type": "array",
-              "items": {
-                "type": "string"
-              },
-              "description": "Glob patterns the agent may read."
-            },
-            "write": {
-              "type": "array",
-              "items": {
-                "type": "string"
-              },
-              "description": "Glob patterns the agent may write."
-            },
-            "deny": {
-              "type": "array",
-              "items": {
-                "type": "string"
-              },
-              "description": "Glob patterns explicitly denied to the agent."
-            }
-          }
-        },
-        "scopes": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Raw relayauth scopes to grant to the agent."
-        },
-        "network": {
-          "oneOf": [
-            { "type": "boolean" },
-            {
-              "type": "object",
-              "properties": {
-                "allow": { "type": "array", "items": { "type": "string" } },
-                "deny": { "type": "array", "items": { "type": "string" } }
-              },
-              "additionalProperties": false
-            }
-          ],
-          "description": "Network access control: boolean to allow/deny all, or object with allow/deny host:port arrays."
-        },
-        "exec": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Command patterns the agent is allowed to execute."
-        }
-      }
-    },
-    "AgentPermissions": {
-      "type": "object",
-      "additionalProperties": false,
-      "description": "Optional permission controls for this agent, including file access rules, access presets, inherited restrictions, raw relayauth scopes, network access, and allowed commands.",
-      "properties": {
-        "description": {
-          "type": "string",
-          "description": "Human-readable summary of what this permission block is for."
-        },
-        "profile": {
-          "type": "string",
-          "description": "Reference a reusable entry from the top-level permission_profiles map."
-        },
-        "why": {
-          "type": "string",
-          "description": "Explain why these permissions are needed or intentionally constrained."
-        },
-        "access": {
-          "type": "string",
-          "enum": ["readonly", "readwrite", "restricted", "full"],
-          "description": "Access preset that expands to a predefined permission profile."
-        },
-        "inherit": {
-          "type": "boolean",
-          "default": true,
-          "description": "Whether to inherit restrictions from existing workspace dotfiles and defaults."
-        },
-        "files": {
-          "type": "object",
-          "additionalProperties": false,
-          "description": "Optional file path rules for agent filesystem access.",
-          "properties": {
-            "read": {
-              "type": "array",
-              "items": {
-                "type": "string"
-              },
-              "description": "Glob patterns the agent may read."
-            },
-            "write": {
-              "type": "array",
-              "items": {
-                "type": "string"
-              },
-              "description": "Glob patterns the agent may write."
-            },
-            "deny": {
-              "type": "array",
-              "items": {
-                "type": "string"
-              },
-              "description": "Glob patterns explicitly denied to the agent."
-            }
-          }
-        },
-        "scopes": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Raw relayauth scopes to grant to the agent."
-        },
-        "network": {
-          "oneOf": [
-            { "type": "boolean" },
-            {
-              "type": "object",
-              "properties": {
-                "allow": { "type": "array", "items": { "type": "string" } },
-                "deny": { "type": "array", "items": { "type": "string" } }
-              },
-              "additionalProperties": false
-            }
-          ],
-          "description": "Network access control: boolean to allow/deny all, or object with allow/deny host:port arrays."
-        },
-        "exec": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Command patterns the agent is allowed to execute."
-        }
-      }
-    },
-    "AgentConstraints": {
-      "type": "object",
-      "additionalProperties": false,
-      "properties": {
-        "maxTokens": {
-          "type": "integer",
-          "minimum": 1,
-          "description": "Maximum token budget for the agent"
-        },
-        "timeoutMs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Per-agent timeout in milliseconds"
-        },
-        "retries": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Number of retry attempts on failure"
-        },
-        "model": {
-          "type": "string",
-          "description": "Model override for the agent"
-        },
-        "idleThresholdSecs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Seconds of inactivity before agent is considered idle (0 = disabled)"
-        }
-      }
-    },
-    "TrajectoryConfig": {
-      "type": "object",
-      "additionalProperties": false,
-      "properties": {
-        "enabled": {
-          "type": "boolean",
-          "description": "Enable trajectory recording"
-        },
-        "reflectOnBarriers": {
-          "type": "boolean",
-          "description": "Auto-reflect when barriers resolve"
-        },
-        "reflectOnConverge": {
-          "type": "boolean",
-          "description": "Auto-reflect when parallel tracks converge"
-        },
-        "autoDecisions": {
-          "type": "boolean",
-          "description": "Auto-record retry/skip/fail decisions"
-        }
-      }
-    },
-    "WorkflowDefinition": {
-      "type": "object",
-      "required": ["name", "steps"],
-      "additionalProperties": false,
-      "properties": {
-        "name": {
-          "type": "string",
-          "description": "Unique workflow name"
-        },
-        "description": {
-          "type": "string"
-        },
-        "preflight": {
-          "type": "array",
-          "items": {
-            "$ref": "#/definitions/PreflightCheck"
-          },
-          "description": "Preflight checks that run before any steps. All must pass."
-        },
-        "steps": {
-          "type": "array",
-          "items": {
-            "$ref": "#/definitions/WorkflowStep"
-          },
-          "minItems": 1
-        },
-        "onError": {
-          "type": "string",
-          "enum": ["fail", "skip", "retry"],
-          "description": "Error handling strategy for this workflow"
-        }
-      }
-    },
-    "PreflightCheck": {
-      "type": "object",
-      "required": ["command"],
-      "additionalProperties": false,
-      "properties": {
-        "command": {
-          "type": "string",
-          "description": "Shell command to execute"
-        },
-        "failIf": {
-          "type": "string",
-          "description": "Fail if output matches: 'non-empty', 'empty', or a regex pattern"
-        },
-        "successIf": {
-          "type": "string",
-          "description": "Succeed only if output matches this condition"
-        },
-        "description": {
-          "type": "string",
-          "description": "Human-readable description of what this check validates"
-        }
-      }
-    },
-    "WorkflowStep": {
-      "oneOf": [
-        {
-          "$ref": "#/definitions/AgentWorkflowStep"
-        },
-        {
-          "$ref": "#/definitions/DeterministicWorkflowStep"
-        },
-        {
-          "$ref": "#/definitions/WorktreeWorkflowStep"
-        },
-        {
-          "$ref": "#/definitions/CustomWorkflowStep"
-        }
-      ]
-    },
-    "AgentWorkflowStep": {
-      "type": "object",
-      "required": ["name", "agent", "task"],
-      "additionalProperties": false,
-      "properties": {
-        "type": {
-          "type": "string",
-          "enum": ["agent"],
-          "description": "Step type (optional for agent steps, defaults to 'agent')"
-        },
-        "name": {
-          "type": "string",
-          "description": "Unique step name within the workflow"
-        },
-        "agent": {
-          "type": "string",
-          "description": "Name of the agent to execute this step"
-        },
-        "task": {
-          "type": "string",
-          "description": "Task description for the agent"
-        },
-        "dependsOn": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Step names that must complete before this step runs"
-        },
-        "verification": {
-          "$ref": "#/definitions/VerificationCheck"
-        },
-        "timeoutMs": {
-          "type": "integer",
-          "minimum": 0
-        },
-        "retries": {
-          "type": "integer",
-          "minimum": 0
-        },
-        "maxIterations": {
-          "type": "integer",
-          "minimum": 1,
-          "description": "Maximum iterations for steps that may need to retry"
-        },
-        "workdir": {
-          "type": "string",
-          "description": "Sets this step's working directory to a named entry from the top-level paths array."
-        }
-      }
-    },
-    "DeterministicWorkflowStep": {
-      "type": "object",
-      "required": ["name", "type", "command"],
-      "additionalProperties": false,
-      "properties": {
-        "type": {
-          "type": "string",
-          "enum": ["deterministic"],
-          "description": "Step type - must be 'deterministic' for shell command steps"
-        },
-        "name": {
-          "type": "string",
-          "description": "Unique step name within the workflow"
-        },
-        "command": {
-          "type": "string",
-          "description": "Shell command to execute. Supports {{variable}} interpolation."
-        },
-        "dependsOn": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Step names that must complete before this step runs"
-        },
-        "timeoutMs": {
-          "type": "integer",
-          "minimum": 0
-        },
-        "failOnError": {
-          "type": "boolean",
-          "default": true,
-          "description": "Fail if command exit code is non-zero"
-        },
-        "captureOutput": {
-          "type": "boolean",
-          "default": true,
-          "description": "Capture stdout as step output for downstream steps"
-        },
-        "workdir": {
-          "type": "string",
-          "description": "Sets this step's working directory to a named entry from the top-level paths array."
-        }
-      }
-    },
-    "WorktreeWorkflowStep": {
-      "type": "object",
-      "required": ["name", "type", "branch"],
-      "additionalProperties": false,
-      "properties": {
-        "type": {
-          "type": "string",
-          "enum": ["worktree"],
-          "description": "Step type - must be 'worktree' for git worktree setup steps"
-        },
-        "name": {
-          "type": "string",
-          "description": "Unique step name within the workflow"
-        },
-        "branch": {
-          "type": "string",
-          "description": "Branch name for the worktree. Supports {{variable}} interpolation."
-        },
-        "baseBranch": {
-          "type": "string",
-          "description": "Base branch to create the worktree from. Default: HEAD."
-        },
-        "path": {
-          "type": "string",
-          "description": "Explicit path for the worktree. Default: .worktrees/<step-name>."
-        },
-        "createBranch": {
-          "type": "boolean",
-          "default": true,
-          "description": "Create the branch if it doesn't exist"
-        },
-        "dependsOn": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Step names that must complete before this step runs"
-        },
-        "timeoutMs": {
-          "type": "integer",
-          "minimum": 0
-        },
-        "workdir": {
-          "type": "string",
-          "description": "Sets this step's working directory to a named entry from the top-level paths array."
-        }
-      }
-    },
-    "CustomWorkflowStep": {
-      "type": "object",
-      "required": ["name", "use"],
-      "additionalProperties": true,
-      "properties": {
-        "name": {
-          "type": "string",
-          "description": "Unique step name within the workflow"
-        },
-        "use": {
-          "type": "string",
-          "description": "Reference to a custom step definition from .relay/steps.yaml"
-        },
-        "dependsOn": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "description": "Step names that must complete before this step runs"
-        },
-        "timeoutMs": {
-          "type": "integer",
-          "minimum": 0
-        }
-      }
-    },
-    "CustomStepParam": {
-      "type": "object",
-      "required": ["name"],
-      "additionalProperties": false,
-      "properties": {
-        "name": {
-          "type": "string",
-          "description": "Parameter name"
-        },
-        "required": {
-          "type": "boolean",
-          "default": false,
-          "description": "Whether this parameter is required"
-        },
-        "default": {
-          "type": "string",
-          "description": "Default value if not provided"
-        },
-        "description": {
-          "type": "string",
-          "description": "Human-readable description of the parameter"
-        }
-      }
-    },
-    "CustomStepDefinition": {
-      "type": "object",
-      "additionalProperties": false,
-      "properties": {
-        "params": {
-          "type": "array",
-          "items": {
-            "$ref": "#/definitions/CustomStepParam"
-          },
-          "description": "Parameters that can be passed when using this step"
-        },
-        "type": {
-          "type": "string",
-          "enum": ["deterministic", "worktree"],
-          "description": "Step type"
-        },
-        "command": {
-          "type": "string",
-          "description": "Shell command to execute (for deterministic steps)"
-        },
-        "branch": {
-          "type": "string",
-          "description": "Branch name (for worktree steps)"
-        },
-        "baseBranch": {
-          "type": "string",
-          "description": "Base branch (for worktree steps)"
-        },
-        "path": {
-          "type": "string",
-          "description": "Worktree path (for worktree steps)"
-        },
-        "createBranch": {
-          "type": "boolean",
-          "description": "Create branch if missing (for worktree steps)"
-        },
-        "failOnError": {
-          "type": "boolean",
-          "default": true,
-          "description": "Fail if command exit code is non-zero"
-        },
-        "captureOutput": {
-          "type": "boolean",
-          "default": true,
-          "description": "Capture stdout as step output"
-        },
-        "timeoutMs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Timeout in milliseconds"
-        },
-        "description": {
-          "type": "string",
-          "description": "Human-readable description of this step"
-        }
-      }
-    },
-    "CustomStepsConfig": {
-      "type": "object",
-      "required": ["steps"],
-      "additionalProperties": false,
-      "properties": {
-        "steps": {
-          "type": "object",
-          "additionalProperties": {
-            "$ref": "#/definitions/CustomStepDefinition"
-          },
-          "description": "Map of step name to step definition"
-        }
-      }
-    },
-    "VerificationCheck": {
-      "type": "object",
-      "required": ["type", "value"],
-      "additionalProperties": false,
-      "properties": {
-        "type": {
-          "type": "string",
-          "enum": ["output_contains", "exit_code", "file_exists", "custom"],
-          "description": "Type of verification to perform"
-        },
-        "value": {
-          "type": "string",
-          "description": "Expected value or expression for verification. For custom type: a shell command (exit 0 = pass, step output in $STEP_OUTPUT) or 'regex:<pattern>' for regex matching against output."
-        },
-        "description": {
-          "type": "string",
-          "description": "Human-readable description of what is being verified"
-        }
-      }
-    },
-    "CoordinationConfig": {
-      "type": "object",
-      "additionalProperties": false,
-      "properties": {
-        "barriers": {
-          "type": "array",
-          "items": {
-            "$ref": "#/definitions/Barrier"
-          }
-        },
-        "votingThreshold": {
-          "type": "number",
-          "minimum": 0,
-          "maximum": 1,
-          "description": "Fraction of agents required for voting (0-1)"
-        },
-        "consensusStrategy": {
-          "type": "string",
-          "enum": ["majority", "unanimous", "quorum"],
-          "description": "Strategy for reaching consensus among agents"
-        }
-      }
-    },
-    "Barrier": {
-      "type": "object",
-      "required": ["name", "waitFor"],
-      "additionalProperties": false,
-      "properties": {
-        "name": {
-          "type": "string",
-          "description": "Unique barrier name"
-        },
-        "waitFor": {
-          "type": "array",
-          "items": {
-            "type": "string"
-          },
-          "minItems": 1,
-          "description": "Agent or step names to wait for before proceeding"
-        },
-        "timeoutMs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Timeout for the barrier in milliseconds"
-        }
-      }
-    },
-    "StateConfig": {
-      "type": "object",
-      "required": ["backend"],
-      "additionalProperties": false,
-      "properties": {
-        "backend": {
-          "type": "string",
-          "enum": ["memory", "redis", "database"],
-          "description": "State storage backend"
-        },
-        "ttlMs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Time-to-live for state entries in milliseconds"
-        },
-        "namespace": {
-          "type": "string",
-          "description": "Namespace prefix for state keys"
-        }
-      }
-    },
-    "ErrorHandlingConfig": {
-      "type": "object",
-      "required": ["strategy"],
-      "additionalProperties": false,
-      "properties": {
-        "strategy": {
-          "type": "string",
-          "enum": ["fail-fast", "continue", "retry"],
-          "description": "Global error handling strategy"
-        },
-        "maxRetries": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Maximum number of retries"
-        },
-        "retryDelayMs": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Delay between retries in milliseconds"
-        },
-        "notifyChannel": {
-          "type": "string",
-          "description": "Relay channel to notify on errors"
-        },
-        "repairAgent": {
-          "type": "string",
-          "description": "Agent to use when a deterministic gate fails and needs code/workflow repair"
-        },
-        "repairRetries": {
-          "type": "integer",
-          "minimum": 0,
-          "description": "Retry budget for repair agents before terminal failure. Defaults to the retry budget when repair-capable agents are available; set 0 to disable repair agents."
-        }
-      }
-    }
-  }
-}
diff --git a/packages/sdk/src/workflows/sibling-links.ts b/packages/sdk/src/workflows/sibling-links.ts
deleted file mode 100644
index b8ba7a887..000000000
--- a/packages/sdk/src/workflows/sibling-links.ts
+++ /dev/null
@@ -1,265 +0,0 @@
-/**
- * Sibling-package link setup for workflows that consume a package living in
- * a sibling repo / worktree on disk.
- *
- * Problem it solves: agents running inside a workflow sometimes find that
- * `npm install` (or `pip install`) resolved an older version of a package
- * than the one the workflow actually needs — for example when the consumer
- * workflow runs before the producer has published a new release. Rather
- * than letting agents see a stale interface (and react by augmenting the
- * module or writing fallback implementations), linking redirects the
- * package resolution at dev-time to the sibling's on-disk build output.
- *
- * Usage (ESM):
- *
- *   import { workflow, applySiblingLinks } from '@agent-relay/sdk/workflows';
- *
- *   const base = workflow('my-feature').pattern('dag').agent('impl', ...);
- *   const wf = applySiblingLinks(base, {
- *     dependsOn: ['install-deps'],
- *     links: [
- *       {
- *         name: '@agent-assistant/proactive',
- *         path: '../agent-assistant/packages/proactive',
- *         expect: ['recordSignal', 'drainSignals'],
- *       },
- *       {
- *         name: '@agent-assistant/surfaces',
- *         path: '../agent-assistant/packages/surfaces',
- *         expect: ['classifySlackPresenceSignal'],
- *       },
- *     ],
- *   });
- *
- *   await wf.step('plan', { agent: 'impl', dependsOn: ['setup-sibling-links'], task: ... })
- *     .run({ cwd: process.cwd() });
- *
- * MVP language support: npm (package.json), Python (pyproject.toml /
- * setup.py / setup.cfg). Auto-detects from the sibling's manifest. Fails
- * fast on missing path, unknown manifest, or missing expected exports.
- */
-
-/** A single sibling package to link into the workflow's working directory. */
-export interface SiblingLink {
-  /**
-   * Package name as it appears in imports (e.g. "@agent-assistant/proactive",
-   * "my_python_pkg"). For Python, use the import name (underscored), not the
-   * distribution name.
-   */
-  name: string;
-
-  /**
-   * Path to the sibling package root, relative to the workflow's cwd.
-   * For npm, this is the directory containing package.json.
-   * For Python, the directory containing pyproject.toml / setup.py.
-   */
-  path: string;
-
-  /**
-   * Optional list of top-level named exports / attributes the workflow
-   * expects to find on the linked package post-setup. When provided, a
-   * language-appropriate import smoke test runs and fails the step if any
-   * are missing.
-   */
-  expect?: string[];
-}
-
-export interface SiblingLinkOptions {
-  /** Link declarations. All must succeed (fail-fast on any error). */
-  links: SiblingLink[];
-
-  /**
-   * Step name for the setup step emitted by this helper.
-   * Defaults to `"setup-sibling-links"`.
-   */
-  stepName?: string;
-
-  /**
-   * dependsOn for the setup step. Typically `['install-deps']` so that
-   * `npm install` / `pip install` has run first.
-   * Defaults to `['install-deps']`.
-   */
-  dependsOn?: string[];
-}
-
-/** Minimal builder shape — accepts anything with a chainable `.step()` method. */
-interface StepChain {
-  step: (name: string, cfg: unknown) => StepChain;
-}
-
-/**
- * Adds a single deterministic step to the workflow that links each sibling
- * package into the workflow's working directory using the appropriate
- * language-specific mechanism, then smoke-tests each linked package for
- * expected exports.
- *
- * The step fails fast on:
- *   - Sibling path missing
- *   - Unknown manifest (no package.json / pyproject.toml / setup.py)
- *   - Link command failure
- *   - Missing expected export
- */
-export function applySiblingLinks<T>(wf: T, opts: SiblingLinkOptions): T {
-  if (opts.links.length === 0) {
-    return wf;
-  }
-
-  const stepName = opts.stepName ?? 'setup-sibling-links';
-  const dependsOn = opts.dependsOn ?? ['install-deps'];
-
-  const script = buildSiblingLinkScript(opts.links);
-  const chain = wf as unknown as StepChain;
-  chain.step(stepName, {
-    type: 'deterministic',
-    dependsOn,
-    command: `bash -c ${shSingleQuote(script)}`,
-    captureOutput: true,
-    failOnError: true,
-  });
-  return wf;
-}
-
-// ─── Internal: shell-script generation ─────────────────────────────────────
-
-/**
- * Shell-quote a string for safe single-quoted inclusion in a bash command.
- * Single-quoted strings in bash are literal for every character except the
- * single quote itself, so `$` and backticks are NOT interpreted — which is
- * exactly what we want for link.name / link.path / JSON payloads that must
- * pass through bash unchanged.
- *
- * Embedded single quotes are escaped via the standard `'\''` POSIX idiom
- * (close, escape, reopen).
- */
-function shSingleQuote(value: string): string {
-  return `'${value.replace(/'/g, `'\\''`)}'`;
-}
-
-/**
- * Builds a bash script that:
- *   1. For each link, detects its manifest and applies the right link command.
- *   2. After all links succeed, runs one import smoke test per link that
- *      declared expected exports.
- *
- * Exported for test visibility; not part of the public API.
- */
-export function buildSiblingLinkScript(links: SiblingLink[]): string {
-  const lines: string[] = ['set -euo pipefail', 'echo "=== applySiblingLinks: setting up ==="'];
-
-  for (const link of links) {
-    // Use SINGLE-quoted shell literals for the assignments. Double-quoted
-    // literals (via JSON.stringify) would let `$`, backticks, and `\` still
-    // trigger substitution or escaping — single-quoted is literal end-to-end.
-    const escapedName = shSingleQuote(link.name);
-    const escapedPath = shSingleQuote(link.path);
-    lines.push(linkOneBlock(link, escapedName, escapedPath));
-  }
-
-  lines.push('echo "=== applySiblingLinks: verifying exports ==="');
-  for (const link of links) {
-    if (!link.expect || link.expect.length === 0) {
-      continue;
-    }
-    lines.push(verifyExportsBlock(link));
-  }
-
-  lines.push('echo "APPLY_SIBLING_LINKS_OK"');
-  return lines.join('\n');
-}
-
-function linkOneBlock(link: SiblingLink, escapedName: string, escapedPath: string): string {
-  void link;
-  return [
-    `SIBLING_PATH=${escapedPath}`,
-    `SIBLING_NAME=${escapedName}`,
-    'echo "--- link: $SIBLING_NAME <- $SIBLING_PATH ---"',
-    'if [ ! -d "$SIBLING_PATH" ]; then',
-    '  echo "SIBLING_PATH_MISSING: $SIBLING_PATH" >&2',
-    '  exit 1',
-    'fi',
-    'if [ -f "$SIBLING_PATH/package.json" ]; then',
-    '  echo "detected: npm"',
-    '  ( cd "$SIBLING_PATH" && npm link --silent )',
-    '  npm link --silent "$SIBLING_NAME"',
-    'elif [ -f "$SIBLING_PATH/pyproject.toml" ] || [ -f "$SIBLING_PATH/setup.py" ] || [ -f "$SIBLING_PATH/setup.cfg" ]; then',
-    '  echo "detected: python"',
-    // Try uv first (fastest when available), but uv refuses to install
-    // outside a venv without --system. Pass --system explicitly so uv
-    // works in non-venv sandboxes (common CI/agent runner shape).
-    // If uv still fails (e.g. broken install), fall through to pip/pip3
-    // via the explicit OR chain rather than relying on `set -e` to
-    // short-circuit between elif branches.
-    '  if command -v uv >/dev/null 2>&1 && uv pip install --system -e "$SIBLING_PATH" --quiet 2>/dev/null; then',
-    '    :',
-    '  elif command -v pip >/dev/null 2>&1; then',
-    '    pip install -e "$SIBLING_PATH" --quiet',
-    '  elif command -v pip3 >/dev/null 2>&1; then',
-    '    pip3 install -e "$SIBLING_PATH" --quiet',
-    '  else',
-    '    echo "NO_PYTHON_INSTALLER: uv / pip / pip3 not found or all failed" >&2',
-    '    exit 1',
-    '  fi',
-    'else',
-    '  echo "UNKNOWN_MANIFEST: expected package.json / pyproject.toml / setup.py / setup.cfg at $SIBLING_PATH" >&2',
-    '  exit 1',
-    'fi',
-  ].join('\n');
-}
-
-function verifyExportsBlock(link: SiblingLink): string {
-  const escapedName = shSingleQuote(link.name);
-  const escapedPath = shSingleQuote(link.path);
-  const expectJson = JSON.stringify(link.expect ?? []);
-  // Pick the smoke-test runtime based on what manifest type the sibling had.
-  // Single-quoted assignments are literal — the JSON payload inside EXPECT
-  // survives bash untouched and downstream Node/Python JSON.parse it back.
-  return [
-    `SIBLING_PATH=${escapedPath}`,
-    `SIBLING_NAME=${escapedName}`,
-    `EXPECT=${shSingleQuote(expectJson)}`,
-    'if [ -f "$SIBLING_PATH/package.json" ]; then',
-    nodeVerifyCommand(),
-    'else',
-    pythonVerifyCommand(),
-    'fi',
-  ].join('\n');
-}
-
-function nodeVerifyCommand(): string {
-  const script = [
-    'const want = JSON.parse(process.env.APPLY_SIBLING_LINKS_EXPECT);',
-    'const name = process.env.APPLY_SIBLING_LINKS_NAME;',
-    'const mod = await import(name);',
-    'const missing = want.filter((k) => !(k in mod));',
-    'if (missing.length) {',
-    '  console.error(`MISSING_EXPORTS in ${name}: ${missing.join(",")}`);',
-    '  process.exit(1);',
-    '}',
-    'console.log(`${name} OK: ${want.join(",")}`);',
-  ].join(' ');
-  return `  APPLY_SIBLING_LINKS_NAME="$SIBLING_NAME" APPLY_SIBLING_LINKS_EXPECT="$EXPECT" node --input-type=module -e ${shSingleQuote(script)}`;
-}
-
-function pythonVerifyCommand(): string {
-  // Python < 3.12 forbids backslashes inside f-string expressions, so we
-  // can't inline `{",".join(missing)}` (which needs `\",\".` when written
-  // as a JS string literal). Bind the separator to a name outside the
-  // f-string first.
-  const script = [
-    'import json, os, importlib',
-    'name = os.environ["APPLY_SIBLING_LINKS_NAME"]',
-    'want = json.loads(os.environ["APPLY_SIBLING_LINKS_EXPECT"])',
-    'mod = importlib.import_module(name)',
-    'missing = [k for k in want if not hasattr(mod, k)]',
-    'sep = ","',
-    'if missing:',
-    '    print(f"MISSING_EXPORTS in {name}: {sep.join(missing)}", flush=True)',
-    '    raise SystemExit(1)',
-    'print(f"{name} OK: {sep.join(want)}", flush=True)',
-  ].join('\n');
-  return [
-    '  APPLY_SIBLING_LINKS_NAME="$SIBLING_NAME" APPLY_SIBLING_LINKS_EXPECT="$EXPECT" \\',
-    `  python3 -c ${shSingleQuote(script)} 2>/dev/null || \\`,
-    `  APPLY_SIBLING_LINKS_NAME="$SIBLING_NAME" APPLY_SIBLING_LINKS_EXPECT="$EXPECT" python -c ${shSingleQuote(script)}`,
-  ].join('\n');
-}
diff --git a/packages/sdk/src/workflows/state.ts b/packages/sdk/src/workflows/state.ts
deleted file mode 100644
index 688ecc776..000000000
--- a/packages/sdk/src/workflows/state.ts
+++ /dev/null
@@ -1,248 +0,0 @@
-/**
- * State Store — CRUD on swarm_state with optional consensus-gated writes.
- *
- * Provides a key-value store scoped to a workflow run and namespace.
- * When consensus gating is enabled, writes require approval from a
- * ConsensusEngine before being committed.
- */
-
-import { randomBytes } from 'node:crypto';
-import { EventEmitter } from 'node:events';
-import type { DbClient } from './coordinator.js';
-
-// ── Types ───────────────────────────────────────────────────────────────────
-
-export interface StateEntry {
-  id: string;
-  runId: string;
-  namespace: string;
-  key: string;
-  value: unknown;
-  expiresAt: string | null;
-  createdAt: string;
-  updatedAt: string;
-}
-
-export interface StateStoreOptions {
-  /** Default namespace for keys. */
-  namespace?: string;
-  /** Default TTL in milliseconds for new entries. */
-  defaultTtlMs?: number;
-}
-
-export interface WriteOptions {
-  namespace?: string;
-  ttlMs?: number;
-}
-
-export interface ReadOptions {
-  namespace?: string;
-}
-
-/** Callback invoked to gate a write. Return true to allow, false to reject. */
-export type ConsensusGate = (runId: string, key: string, value: unknown, agent: string) => Promise<boolean>;
-
-export interface StateStoreEvents {
-  'state:set': (entry: StateEntry) => void;
-  'state:deleted': (runId: string, key: string, namespace: string) => void;
-  'state:gated': (runId: string, key: string, agent: string) => void;
-}
-
-// ── Store ───────────────────────────────────────────────────────────────────
-
-export class StateStore extends EventEmitter {
-  private db: DbClient;
-  private defaultNamespace: string;
-  private defaultTtlMs: number | null;
-  private consensusGate: ConsensusGate | null = null;
-
-  constructor(db: DbClient, options: StateStoreOptions = {}) {
-    super();
-    this.db = db;
-    this.defaultNamespace = options.namespace ?? 'default';
-    this.defaultTtlMs = options.defaultTtlMs ?? null;
-  }
-
-  // ── Consensus gating ──────────────────────────────────────────────────
-
-  /**
-   * Enable consensus-gated writes. When set, every `set()` call will
-   * invoke the gate function before persisting. If the gate returns false,
-   * the write is rejected.
-   */
-  setConsensusGate(gate: ConsensusGate): void {
-    this.consensusGate = gate;
-  }
-
-  clearConsensusGate(): void {
-    this.consensusGate = null;
-  }
-
-  // ── Write ─────────────────────────────────────────────────────────────
-
-  /**
-   * Set a key-value pair. If consensus gating is enabled, the write is
-   * subject to approval.
-   *
-   * @param agent - The agent requesting the write (used for consensus gating).
-   */
-  async set(
-    runId: string,
-    key: string,
-    value: unknown,
-    agent: string,
-    options: WriteOptions = {}
-  ): Promise<StateEntry> {
-    // Consensus gate check.
-    if (this.consensusGate) {
-      const allowed = await this.consensusGate(runId, key, value, agent);
-      if (!allowed) {
-        this.emit('state:gated', runId, key, agent);
-        throw new Error(`Write to "${key}" rejected by consensus gate for agent "${agent}"`);
-      }
-    }
-
-    const namespace = options.namespace ?? this.defaultNamespace;
-    const ttlMs = options.ttlMs ?? this.defaultTtlMs;
-    const expiresAt = ttlMs ? new Date(Date.now() + ttlMs).toISOString() : null;
-    const id = `st_${Date.now()}_${randomBytes(4).toString('hex')}`;
-    const now = new Date().toISOString();
-
-    // Upsert: use the unique (run_id, namespace, key) constraint.
-    const { rows } = await this.db.query<StateEntry>(
-      `INSERT INTO swarm_state (id, run_id, namespace, key, value, expires_at, created_at, updated_at)
-       VALUES ($1, $2, $3, $4, $5, $6, $7, $7)
-       ON CONFLICT (run_id, namespace, key)
-       DO UPDATE SET value = EXCLUDED.value, expires_at = EXCLUDED.expires_at, updated_at = EXCLUDED.updated_at
-       RETURNING *`,
-      [id, runId, namespace, key, JSON.stringify(value), expiresAt, now]
-    );
-
-    const entry = rows[0];
-    this.emit('state:set', entry);
-    return entry;
-  }
-
-  // ── Read ──────────────────────────────────────────────────────────────
-
-  async get(runId: string, key: string, options: ReadOptions = {}): Promise<unknown | null> {
-    const namespace = options.namespace ?? this.defaultNamespace;
-
-    const { rows } = await this.db.query<StateEntry>(
-      `SELECT * FROM swarm_state
-       WHERE run_id = $1 AND namespace = $2 AND key = $3
-         AND (expires_at IS NULL OR expires_at > now())`,
-      [runId, namespace, key]
-    );
-
-    if (rows.length === 0) return null;
-    return rows[0].value;
-  }
-
-  async getEntry(runId: string, key: string, options: ReadOptions = {}): Promise<StateEntry | null> {
-    const namespace = options.namespace ?? this.defaultNamespace;
-
-    const { rows } = await this.db.query<StateEntry>(
-      `SELECT * FROM swarm_state
-       WHERE run_id = $1 AND namespace = $2 AND key = $3
-         AND (expires_at IS NULL OR expires_at > now())`,
-      [runId, namespace, key]
-    );
-
-    return rows[0] ?? null;
-  }
-
-  async getAll(runId: string, options: ReadOptions = {}): Promise<StateEntry[]> {
-    const namespace = options.namespace ?? this.defaultNamespace;
-
-    const { rows } = await this.db.query<StateEntry>(
-      `SELECT * FROM swarm_state
-       WHERE run_id = $1 AND namespace = $2
-         AND (expires_at IS NULL OR expires_at > now())
-       ORDER BY key ASC`,
-      [runId, namespace]
-    );
-
-    return rows;
-  }
-
-  async keys(runId: string, options: ReadOptions = {}): Promise<string[]> {
-    const namespace = options.namespace ?? this.defaultNamespace;
-
-    const { rows } = await this.db.query<{ key: string }>(
-      `SELECT key FROM swarm_state
-       WHERE run_id = $1 AND namespace = $2
-         AND (expires_at IS NULL OR expires_at > now())
-       ORDER BY key ASC`,
-      [runId, namespace]
-    );
-
-    return rows.map((r) => r.key);
-  }
-
-  // ── Delete ────────────────────────────────────────────────────────────
-
-  async delete(runId: string, key: string, options: ReadOptions = {}): Promise<boolean> {
-    const namespace = options.namespace ?? this.defaultNamespace;
-
-    const { rows } = await this.db.query(
-      `DELETE FROM swarm_state WHERE run_id = $1 AND namespace = $2 AND key = $3 RETURNING id`,
-      [runId, namespace, key]
-    );
-
-    if (rows.length > 0) {
-      this.emit('state:deleted', runId, key, namespace);
-      return true;
-    }
-
-    return false;
-  }
-
-  async deleteAll(runId: string, options: ReadOptions = {}): Promise<number> {
-    const namespace = options.namespace ?? this.defaultNamespace;
-
-    const { rows } = await this.db.query(
-      `DELETE FROM swarm_state WHERE run_id = $1 AND namespace = $2 RETURNING id`,
-      [runId, namespace]
-    );
-
-    return rows.length;
-  }
-
-  // ── Expiry cleanup ────────────────────────────────────────────────────
-
-  /**
-   * Remove all expired entries for a run (or globally if runId is omitted).
-   * Returns the number of entries purged.
-   */
-  async purgeExpired(runId?: string): Promise<number> {
-    if (runId) {
-      const { rows } = await this.db.query(
-        `DELETE FROM swarm_state WHERE run_id = $1 AND expires_at IS NOT NULL AND expires_at <= now() RETURNING id`,
-        [runId]
-      );
-      return rows.length;
-    }
-
-    const { rows } = await this.db.query(
-      `DELETE FROM swarm_state WHERE expires_at IS NOT NULL AND expires_at <= now() RETURNING id`,
-      []
-    );
-    return rows.length;
-  }
-
-  // ── Snapshot ───────────────────────────────────────────────────────────
-
-  /**
-   * Take a snapshot of all state for a run as a plain object.
-   * Useful for persisting into workflow_runs.state_snapshot.
-   */
-  async snapshot(runId: string, options: ReadOptions = {}): Promise<Record<string, unknown>> {
-    const entries = await this.getAll(runId, options);
-    const result: Record<string, unknown> = {};
-    for (const entry of entries) {
-      result[entry.key] = entry.value;
-    }
-    return result;
-  }
-}
diff --git a/packages/sdk/src/workflows/step-executor.ts b/packages/sdk/src/workflows/step-executor.ts
deleted file mode 100644
index a9f8f950c..000000000
--- a/packages/sdk/src/workflows/step-executor.ts
+++ /dev/null
@@ -1,579 +0,0 @@
-import { ChannelMessenger } from './channel-messenger.js';
-import type { ProcessSpawner } from './process-spawner.js';
-import { TemplateResolver } from './template-resolver.js';
-import type { StepOutcome } from './trajectory.js';
-import type {
-  AgentDefinition,
-  ErrorHandlingConfig,
-  StepCompletionMode,
-  VerificationCheck,
-  WorkflowStep,
-  WorkflowStepCompletionReason,
-  WorkflowStepRow,
-  WorkflowStepStatus,
-} from './types.js';
-import {
-  runVerification,
-  type VerificationOptions,
-  type VerificationResult,
-  type VerificationSideEffects,
-} from './verification.js';
-
-type StateLike = {
-  row: WorkflowStepRow;
-};
-
-export interface StepResult {
-  status: WorkflowStepStatus;
-  output: string;
-  exitCode?: number;
-  exitSignal?: string;
-  duration: number;
-  retries: number;
-  completionReason?: WorkflowStepCompletionReason;
-  error?: string;
-}
-
-export interface StepSchedule {
-  step: WorkflowStep;
-  readyAt: number;
-  staggerDelay: number;
-}
-
-export interface StepExecutorDeps<TState extends StateLike = StateLike> {
-  cwd: string;
-  runId?: string;
-  postToChannel?: (text: string) => void;
-  persistStepRow?: (stepId: string, patch: Partial<WorkflowStepRow>) => Promise<void>;
-  persistStepOutput?: (runId: string, stepName: string, output: string) => Promise<void>;
-  resolveTemplate?: (template: string, context: Record<string, unknown>) => string;
-  getStepOutput?: (stepName: string) => string | undefined;
-  loadStepOutput?: (runId: string, stepName: string) => string | undefined;
-  checkAborted?: () => void;
-  waitIfPaused?: () => Promise<void>;
-  log?: (message: string) => void;
-  processSpawner?: ProcessSpawner;
-  templateResolver?: TemplateResolver;
-  channelMessenger?: ChannelMessenger;
-  verificationRunner?: (
-    check: VerificationCheck,
-    output: string,
-    stepName: string,
-    injectedTaskText?: string,
-    options?: VerificationOptions,
-    sideEffects?: VerificationSideEffects
-  ) => VerificationResult;
-  executeStep?: (
-    step: WorkflowStep,
-    state: TState,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling?: ErrorHandlingConfig
-  ) => Promise<Partial<StepResult> | void>;
-  onStepStarted?: (step: WorkflowStep, state: TState) => Promise<void> | void;
-  onStepRetried?: (
-    step: WorkflowStep,
-    state: TState,
-    attempt: number,
-    maxRetries: number
-  ) => Promise<void> | void;
-  onStepCompleted?: (step: WorkflowStep, state: TState, result: StepResult) => Promise<void> | void;
-  onStepFailed?: (step: WorkflowStep, state: TState, result: StepResult) => Promise<void> | void;
-  onBeginTrack?: (steps: WorkflowStep[]) => Promise<void> | void;
-  onConverge?: (steps: WorkflowStep[], outcomes: StepOutcome[]) => Promise<void> | void;
-  markDownstreamSkipped?: (failedStepName: string) => Promise<void>;
-  buildCompletionMode?: (
-    stepName: string,
-    completionReason?: WorkflowStepCompletionReason
-  ) => StepCompletionMode | undefined;
-}
-
-export interface MonitorStepOptions<TState extends StateLike, TResult> {
-  maxRetries?: number;
-  retryDelayMs?: number;
-  startMessage?: string;
-  onStart?: (attempt: number, state: TState) => Promise<void> | void;
-  onRetry?: (attempt: number, maxRetries: number, state: TState) => Promise<void> | void;
-  execute: (attempt: number, state: TState) => Promise<TResult>;
-  toCompletionResult: (result: TResult, attempt: number, state: TState) => Partial<StepResult>;
-  onAttemptFailed?: (error: unknown, attempt: number, state: TState) => Promise<void> | void;
-  getFailureResult?: (error: unknown, attempt: number, state: TState) => Partial<StepResult>;
-}
-
-export class StepExecutor<TState extends StateLike = StateLike> {
-  private readonly templateResolver: TemplateResolver;
-  private readonly channelMessenger: ChannelMessenger;
-  private readonly verificationRunner: NonNullable<StepExecutorDeps<TState>['verificationRunner']>;
-
-  constructor(private readonly deps: StepExecutorDeps<TState>) {
-    this.templateResolver = deps.templateResolver ?? new TemplateResolver();
-    this.channelMessenger = deps.channelMessenger ?? new ChannelMessenger({ postFn: deps.postToChannel });
-    this.verificationRunner = deps.verificationRunner ?? runVerification;
-  }
-
-  findReady(
-    steps: WorkflowStep[],
-    statuses: Map<string, WorkflowStepStatus> | Map<string, TState>
-  ): WorkflowStep[] {
-    return steps.filter((step) => {
-      const state = statuses.get(step.name);
-      const status = this.getStatus(state);
-      if (status !== 'pending') return false;
-
-      return (step.dependsOn ?? []).every((dependency) => {
-        const depState = statuses.get(dependency);
-        const depStatus = this.getStatus(depState);
-        return depStatus === 'completed' || depStatus === 'skipped';
-      });
-    });
-  }
-
-  /** @deprecated Use {@link findReady} instead. This is an alias kept for backward compatibility. */
-  findReadySteps(
-    steps: WorkflowStep[],
-    statuses: Map<string, WorkflowStepStatus> | Map<string, TState>
-  ): WorkflowStep[] {
-    return this.findReady(steps, statuses);
-  }
-
-  scheduleStep(step: WorkflowStep, options: { readyAt?: number; staggerDelay?: number } = {}): StepSchedule {
-    return {
-      step,
-      readyAt: options.readyAt ?? Date.now(),
-      staggerDelay: options.staggerDelay ?? 0,
-    };
-  }
-
-  async startStep(step: WorkflowStep, state: TState, startMessage?: string): Promise<void> {
-    const startedAt = new Date().toISOString();
-    state.row.status = 'running';
-    state.row.error = undefined;
-    state.row.completionReason = undefined;
-    state.row.startedAt = startedAt;
-
-    await this.deps.persistStepRow?.(state.row.id, {
-      status: 'running',
-      error: undefined,
-      completionReason: undefined,
-      startedAt,
-      updatedAt: new Date().toISOString(),
-    });
-
-    if (startMessage) {
-      this.deps.postToChannel?.(startMessage);
-    }
-    await this.deps.onStepStarted?.(step, state);
-  }
-
-  async retryStep(step: WorkflowStep, state: TState, attempt: number, maxRetries: number): Promise<void> {
-    state.row.retryCount = attempt;
-    await this.deps.persistStepRow?.(state.row.id, {
-      retryCount: attempt,
-      updatedAt: new Date().toISOString(),
-    });
-    await this.deps.onStepRetried?.(step, state, attempt, maxRetries);
-  }
-
-  async completeStep(step: WorkflowStep, state: TState, result: Partial<StepResult>): Promise<StepResult> {
-    const completedAt = new Date().toISOString();
-    const finalResult: StepResult = {
-      status: result.status ?? 'completed',
-      output: result.output ?? '',
-      exitCode: result.exitCode,
-      exitSignal: result.exitSignal,
-      duration: result.duration ?? 0,
-      retries: result.retries ?? state.row.retryCount,
-      completionReason: result.completionReason,
-      error: result.error,
-    };
-
-    state.row.status = finalResult.status;
-    state.row.output = finalResult.output;
-    state.row.error = finalResult.error;
-    state.row.completionReason = finalResult.completionReason;
-    state.row.completedAt = completedAt;
-
-    await this.deps.persistStepRow?.(state.row.id, {
-      status: finalResult.status,
-      output: finalResult.output,
-      error: finalResult.error,
-      completionReason: finalResult.completionReason,
-      completedAt,
-      updatedAt: new Date().toISOString(),
-    });
-    if (finalResult.status === 'completed' && this.deps.runId && finalResult.output) {
-      await this.deps.persistStepOutput?.(this.deps.runId, step.name, finalResult.output);
-    }
-
-    if (finalResult.status === 'failed') {
-      await this.deps.onStepFailed?.(step, state, finalResult);
-    } else {
-      await this.deps.onStepCompleted?.(step, state, finalResult);
-    }
-    return finalResult;
-  }
-
-  async monitorStep<TResult>(
-    step: WorkflowStep,
-    state: TState,
-    options: MonitorStepOptions<TState, TResult>
-  ): Promise<StepResult> {
-    const maxRetries = options.maxRetries ?? 0;
-    const retryDelayMs = options.retryDelayMs ?? 1000;
-    let lastError: unknown;
-
-    for (let attempt = 0; attempt <= maxRetries; attempt += 1) {
-      this.deps.checkAborted?.();
-      await this.deps.waitIfPaused?.();
-
-      if (attempt > 0) {
-        await this.retryStep(step, state, attempt, maxRetries);
-        await options.onRetry?.(attempt, maxRetries, state);
-        if (retryDelayMs > 0) {
-          await delay(retryDelayMs);
-        }
-      }
-
-      const attemptStartedAt = Date.now();
-      await this.startStep(step, state, options.startMessage);
-      await options.onStart?.(attempt, state);
-
-      try {
-        const rawResult = await options.execute(attempt, state);
-        const completion = options.toCompletionResult(rawResult, attempt, state);
-        return await this.completeStep(step, state, {
-          ...completion,
-          duration: completion.duration ?? Date.now() - attemptStartedAt,
-          retries: completion.retries ?? attempt,
-        });
-      } catch (error) {
-        lastError = error;
-        await options.onAttemptFailed?.(error, attempt, state);
-      }
-    }
-
-    const failure = options.getFailureResult?.(lastError, maxRetries, state) ?? {
-      status: 'failed' as const,
-      output: '',
-      error: lastError instanceof Error ? lastError.message : String(lastError ?? 'Unknown error'),
-      retries: maxRetries,
-    };
-    return this.completeStep(step, state, {
-      ...failure,
-      status: 'failed',
-    });
-  }
-
-  async executeAll(
-    steps: WorkflowStep[],
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling?: ErrorHandlingConfig,
-    providedStates?: Map<string, TState>
-  ): Promise<Map<string, StepResult>> {
-    const states = providedStates ?? this.createEphemeralStates(steps);
-    const strategy = normalizeStrategy(errorHandling?.strategy ?? 'fail-fast');
-    const results = new Map<string, StepResult>();
-
-    while (true) {
-      this.deps.checkAborted?.();
-      await this.deps.waitIfPaused?.();
-
-      const readySteps = this.findReady(steps, states);
-      if (readySteps.length === 0) break;
-
-      const schedules = readySteps.map((step, index) =>
-        this.scheduleStep(step, {
-          readyAt: Date.now(),
-          staggerDelay: readySteps.length > 3 ? index * 2_000 : 0,
-        })
-      );
-
-      if (schedules.length > 1) {
-        await this.deps.onBeginTrack?.(readySteps);
-      }
-
-      const settled = await Promise.allSettled(
-        schedules.map(async (schedule) => {
-          if (schedule.staggerDelay > 0) {
-            await delay(schedule.staggerDelay);
-          }
-          return this.executeScheduledStep(schedule.step, states, agentMap, errorHandling);
-        })
-      );
-
-      const batchOutcomes: StepOutcome[] = [];
-
-      for (let index = 0; index < settled.length; index += 1) {
-        const settledResult = settled[index];
-        const step = readySteps[index];
-        const state = states.get(step.name);
-
-        if (settledResult.status === 'fulfilled') {
-          const result = settledResult.value;
-          const outcomeStatus =
-            result.status === 'completed' || result.status === 'skipped' ? result.status : 'failed';
-          results.set(step.name, result);
-          batchOutcomes.push({
-            name: step.name,
-            agent: step.agent ?? 'deterministic',
-            status: outcomeStatus,
-            attempts: result.retries + 1,
-            output: result.output,
-            error: result.error,
-            verificationPassed: outcomeStatus === 'completed' && step.verification !== undefined,
-            completionMode:
-              result.completionReason !== undefined
-                ? this.deps.buildCompletionMode?.(step.name, result.completionReason)
-                : undefined,
-          });
-
-          if (result.status === 'failed') {
-            await this.deps.markDownstreamSkipped?.(step.name);
-            if (strategy === 'fail-fast') {
-              throw new Error(`Step "${step.name}" failed: ${result.error ?? 'unknown error'}`);
-            }
-          }
-          continue;
-        }
-
-        const error =
-          settledResult.reason instanceof Error ? settledResult.reason.message : String(settledResult.reason);
-        if (state) {
-          const failed =
-            state.row.status === 'failed'
-              ? {
-                  status: 'failed' as const,
-                  output: state.row.output ?? '',
-                  duration: 0,
-                  retries: state.row.retryCount,
-                  completionReason: state.row.completionReason,
-                  error: state.row.error ?? error,
-                }
-              : await this.completeStep(step, state, {
-                  status: 'failed',
-                  output: '',
-                  error,
-                  retries: state.row.retryCount,
-                });
-          results.set(step.name, failed);
-        }
-        batchOutcomes.push({
-          name: step.name,
-          agent: step.agent ?? 'deterministic',
-          status: 'failed',
-          attempts: (state?.row.retryCount ?? 0) + 1,
-          error,
-        });
-        await this.deps.markDownstreamSkipped?.(step.name);
-        if (strategy === 'fail-fast') {
-          throw new Error(`Step "${step.name}" failed: ${error}`);
-        }
-      }
-
-      if (readySteps.length > 1 && batchOutcomes.length > 0) {
-        await this.deps.onConverge?.(readySteps, batchOutcomes);
-      }
-    }
-
-    return results;
-  }
-
-  async executeOne(
-    step: WorkflowStep,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling?: ErrorHandlingConfig,
-    providedState?: TState
-  ): Promise<StepResult> {
-    const state = providedState ?? this.createEphemeralState(step);
-    if (this.deps.executeStep) {
-      const result = await this.deps.executeStep(step, state, agentMap, errorHandling);
-      if (state.row.status !== 'pending' && state.row.status !== 'running') {
-        return {
-          status: state.row.status,
-          output: state.row.output ?? '',
-          duration: result?.duration ?? 0,
-          retries: result?.retries ?? state.row.retryCount,
-          exitCode: result?.exitCode,
-          exitSignal: result?.exitSignal,
-          completionReason: state.row.completionReason ?? result?.completionReason,
-          error: state.row.error ?? result?.error,
-        };
-      }
-      return this.completeStep(step, state, {
-        status: result?.status ?? 'completed',
-        output: result?.output ?? '',
-        exitCode: result?.exitCode,
-        exitSignal: result?.exitSignal,
-        completionReason: result?.completionReason,
-        retries: result?.retries ?? state.row.retryCount,
-        duration: result?.duration ?? 0,
-        error: result?.error,
-      });
-    }
-
-    return this.executeWithProcessSpawner(step, state, agentMap, errorHandling);
-  }
-
-  async markFailed(stepName: string, error: string): Promise<void> {
-    this.deps.postToChannel?.(`**[${stepName}]** Failed: ${error}`);
-  }
-
-  buildStepOutputContext(stepStates: Map<string, TState>): Record<string, { output: string }> {
-    const steps: Record<string, { output: string }> = {};
-    for (const [name, state] of stepStates) {
-      if (state.row.status === 'completed' && state.row.output !== undefined) {
-        steps[name] = { output: state.row.output };
-        continue;
-      }
-      if (state.row.status === 'completed' && this.deps.runId) {
-        const persisted = this.deps.loadStepOutput?.(this.deps.runId, name);
-        if (persisted !== undefined) {
-          state.row.output = persisted;
-          steps[name] = { output: persisted };
-        }
-      }
-    }
-    return steps;
-  }
-
-  resolveStepTemplate(template: string, context: Record<string, unknown>): string {
-    if (this.deps.resolveTemplate) {
-      return this.deps.resolveTemplate(template, context);
-    }
-    return this.templateResolver.interpolateStepTask(template, context);
-  }
-
-  getChannelMessenger(): ChannelMessenger {
-    return this.channelMessenger;
-  }
-
-  runVerification(
-    check: VerificationCheck,
-    output: string,
-    stepName: string,
-    injectedTaskText?: string,
-    options?: VerificationOptions
-  ): VerificationResult {
-    return this.verificationRunner(check, output, stepName, injectedTaskText, {
-      ...options,
-      cwd: options?.cwd ?? this.deps.cwd,
-    });
-  }
-
-  private async executeScheduledStep(
-    step: WorkflowStep,
-    states: Map<string, TState>,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling?: ErrorHandlingConfig
-  ): Promise<StepResult> {
-    const state = states.get(step.name) ?? this.createEphemeralState(step);
-    if (!states.has(step.name)) {
-      states.set(step.name, state);
-    }
-    return this.executeOne(step, agentMap, errorHandling, state);
-  }
-
-  private async executeWithProcessSpawner(
-    step: WorkflowStep,
-    state: TState,
-    agentMap: Map<string, AgentDefinition>,
-    errorHandling?: ErrorHandlingConfig
-  ): Promise<StepResult> {
-    const spawner = this.deps.processSpawner;
-    if (!spawner) {
-      throw new Error(`No step execution callback or process spawner configured for step "${step.name}"`);
-    }
-
-    const maxRetries = step.retries ?? errorHandling?.maxRetries ?? 0;
-    return this.monitorStep(step, state, {
-      maxRetries,
-      retryDelayMs: errorHandling?.retryDelayMs ?? 1000,
-      startMessage: `**[${step.name}]** Started`,
-      onRetry: (attempt, total) => {
-        this.deps.postToChannel?.(`**[${step.name}]** Retrying (attempt ${attempt + 1}/${total + 1})`);
-      },
-      execute: async () => {
-        if (step.type === 'deterministic') {
-          const command = step.command ?? '';
-          return spawner.spawnShell(command, { cwd: this.deps.cwd, timeoutMs: step.timeoutMs });
-        }
-
-        const agent = step.agent ? agentMap.get(step.agent) : undefined;
-        if (!agent) {
-          throw new Error(`Agent "${step.agent ?? '(missing)'}" not found in config`);
-        }
-
-        const task = step.task ?? '';
-        if (agent.interactive === false) {
-          return spawner.spawnAgent(agent, task, { cwd: this.deps.cwd, timeoutMs: step.timeoutMs });
-        }
-        return spawner.spawnInteractive(agent, task, { cwd: this.deps.cwd, timeoutMs: step.timeoutMs });
-      },
-      toCompletionResult: (spawnResult, attempt) => {
-        const failOnError = step.failOnError !== false;
-        const failed =
-          failOnError &&
-          ((spawnResult.exitCode ?? 0) !== 0 ||
-            (spawnResult.exitCode === undefined && spawnResult.exitSignal !== undefined));
-        const output =
-          step.captureOutput === false
-            ? `Command completed (exit code ${spawnResult.exitCode ?? 0})`
-            : spawnResult.output;
-
-        if (failed) {
-          return {
-            status: 'failed' as const,
-            output,
-            exitCode: spawnResult.exitCode,
-            exitSignal: spawnResult.exitSignal,
-            retries: attempt,
-            error: spawnResult.output || `Command failed with exit code ${spawnResult.exitCode ?? 'unknown'}`,
-          };
-        }
-
-        return {
-          status: 'completed' as const,
-          output,
-          exitCode: spawnResult.exitCode,
-          exitSignal: spawnResult.exitSignal,
-          retries: attempt,
-        };
-      },
-    });
-  }
-
-  private createEphemeralStates(steps: WorkflowStep[]): Map<string, TState> {
-    return new Map(steps.map((step) => [step.name, this.createEphemeralState(step)]));
-  }
-
-  private createEphemeralState(step: WorkflowStep): TState {
-    return {
-      row: {
-        id: `step-${step.name}`,
-        runId: this.deps.runId ?? 'run',
-        stepName: step.name,
-        agentName: step.agent ?? null,
-        stepType: step.type ?? 'agent',
-        status: 'pending',
-        task: step.task ?? step.command ?? step.branch ?? '',
-        dependsOn: step.dependsOn ?? [],
-        retryCount: 0,
-        createdAt: new Date().toISOString(),
-        updatedAt: new Date().toISOString(),
-      },
-    } as TState;
-  }
-
-  private getStatus(state: WorkflowStepStatus | TState | undefined): WorkflowStepStatus | undefined {
-    if (typeof state === 'string') return state;
-    return state?.row.status;
-  }
-}
-
-function normalizeStrategy(strategy: ErrorHandlingConfig['strategy']): 'fail-fast' | 'continue' {
-  if (strategy === 'continue') return 'continue';
-  return 'fail-fast';
-}
-
-function delay(ms: number): Promise<void> {
-  return new Promise((resolve) => setTimeout(resolve, ms));
-}
diff --git a/packages/sdk/src/workflows/template-resolver.ts b/packages/sdk/src/workflows/template-resolver.ts
deleted file mode 100644
index eff39dede..000000000
--- a/packages/sdk/src/workflows/template-resolver.ts
+++ /dev/null
@@ -1,180 +0,0 @@
-import type { RelayYamlConfig } from './types.js';
-
-/**
- * Escape a string for safe inclusion in a shell command passed to `sh -c`.
- * Wraps the value in single quotes and escapes any embedded single quotes.
- */
-export function shellEscape(value: string): string {
-  return "'" + value.replace(/'/g, "'\\''") + "'";
-}
-
-const TEMPLATE_VARIABLE_PATTERN = /\{\{([\w][\w.\-]*)\}\}/g;
-const STEP_OUTPUT_TEMPLATE_PATTERN = /\{\{(steps\.[\w\-]+\.output)\}\}/g;
-const STEP_OUTPUT_REF_PATTERN = /^steps\.([\w\-]+)\.output$/;
-
-/**
- * Variable context for template resolution.
- * Values are typed as `unknown` to accommodate dynamic step-output contexts;
- * only scalar values (string | number | boolean) are interpolated — complex
- * objects are coerced via String(). Shell-bound templates are escaped by
- * {@link resolveTemplateForShell}.
- */
-export interface VariableContext {
-  [key: string]: unknown;
-}
-
-export function resolveVariables(config: RelayYamlConfig, vars: VariableContext): RelayYamlConfig {
-  const resolved = structuredClone(config);
-
-  for (const agent of resolved.agents) {
-    if (agent.task) {
-      agent.task = resolveTemplate(agent.task, vars);
-    }
-  }
-
-  if (resolved.workflows) {
-    for (const workflow of resolved.workflows) {
-      for (const step of workflow.steps) {
-        if (step.task) {
-          step.task = resolveTemplate(step.task, vars);
-        }
-        if (step.command) {
-          step.command = resolveTemplateForShell(step.command, vars);
-        }
-        if (step.params && typeof step.params === 'object') {
-          for (const key of Object.keys(step.params)) {
-            const value = (step.params as Record<string, unknown>)[key];
-            if (typeof value === 'string') {
-              (step.params as Record<string, string>)[key] = resolveTemplate(value, vars);
-            }
-          }
-        }
-      }
-    }
-  }
-
-  return resolved;
-}
-
-export function resolveTemplate(template: string, context: VariableContext): string {
-  return template.replace(TEMPLATE_VARIABLE_PATTERN, (match, key: string) => {
-    if (key.startsWith('steps.')) {
-      return match;
-    }
-
-    const value = resolveDotPath(key, context);
-    if (value === undefined) {
-      throw new Error(`Unresolved variable: {{${key}}}`);
-    }
-    return String(value);
-  });
-}
-
-/**
- * Like resolveTemplate but shell-escapes interpolated values.
- * Use this when the result will be passed to `sh -c` to prevent injection.
- */
-export function resolveTemplateForShell(template: string, context: VariableContext): string {
-  return template.replace(TEMPLATE_VARIABLE_PATTERN, (match, key: string) => {
-    if (key.startsWith('steps.')) {
-      return match;
-    }
-
-    const value = resolveDotPath(key, context);
-    if (value === undefined) {
-      throw new Error(`Unresolved variable: {{${key}}}`);
-    }
-    return shellEscape(String(value));
-  });
-}
-
-export function resolveDotPath(key: string, context: VariableContext): string | number | boolean | undefined {
-  if (!key.includes('.')) {
-    return toTemplateScalar(context[key]);
-  }
-
-  const parts = key.split('.');
-  let current: unknown = context;
-  for (const part of parts) {
-    if (current === null || current === undefined || typeof current !== 'object') {
-      return undefined;
-    }
-    current = (current as Record<string, unknown>)[part];
-  }
-
-  return toTemplateScalar(current);
-}
-
-export function resolveStepOutputRef(ref: string, stepOutputs: Map<string, string>): string {
-  const normalizedRef = ref.startsWith('{{') && ref.endsWith('}}') ? ref.slice(2, -2).trim() : ref;
-  const match = STEP_OUTPUT_REF_PATTERN.exec(normalizedRef);
-  if (!match) {
-    throw new Error(`Invalid step output reference: ${ref}`);
-  }
-
-  const stepOutput = stepOutputs.get(match[1]);
-  if (stepOutput === undefined) {
-    throw new Error(`Unresolved step output reference: ${ref}`);
-  }
-
-  return stepOutput;
-}
-
-export function interpolateStepTask(template: string, context: VariableContext): string {
-  const stepOutputs = buildStepOutputMap(context);
-  return template.replace(STEP_OUTPUT_TEMPLATE_PATTERN, (match, ref: string) => {
-    try {
-      return resolveStepOutputRef(ref, stepOutputs);
-    } catch {
-      return match;
-    }
-  });
-}
-
-function buildStepOutputMap(context: VariableContext): Map<string, string> {
-  const stepOutputs = new Map<string, string>();
-  const steps = context.steps;
-
-  if (!steps || typeof steps !== 'object') {
-    return stepOutputs;
-  }
-
-  for (const [stepName, stepState] of Object.entries(steps as Record<string, unknown>)) {
-    if (!stepState || typeof stepState !== 'object') {
-      continue;
-    }
-
-    const output = toTemplateScalar((stepState as Record<string, unknown>).output);
-    if (output !== undefined) {
-      stepOutputs.set(stepName, String(output));
-    }
-  }
-
-  return stepOutputs;
-}
-
-function toTemplateScalar(value: unknown): string | number | boolean | undefined {
-  if (value === undefined || value === null) return undefined;
-  if (typeof value === 'string' || typeof value === 'number' || typeof value === 'boolean') {
-    return value;
-  }
-  return String(value);
-}
-
-export class TemplateResolver {
-  resolveVariables(config: RelayYamlConfig, vars: VariableContext): RelayYamlConfig {
-    return resolveVariables(config, vars);
-  }
-
-  interpolate(template: string, vars: VariableContext): string {
-    return resolveTemplate(template, vars);
-  }
-
-  resolveDotPath(key: string, vars: VariableContext): string | number | boolean | undefined {
-    return resolveDotPath(key, vars);
-  }
-
-  interpolateStepTask(template: string, context: VariableContext): string {
-    return interpolateStepTask(template, context);
-  }
-}
diff --git a/packages/sdk/src/workflows/templates.ts b/packages/sdk/src/workflows/templates.ts
deleted file mode 100644
index 9d9c61c99..000000000
--- a/packages/sdk/src/workflows/templates.ts
+++ /dev/null
@@ -1,534 +0,0 @@
-import { existsSync, promises as fs } from 'node:fs';
-import path from 'node:path';
-import { fileURLToPath } from 'node:url';
-import { parse as parseYaml, stringify as stringifyYaml } from 'yaml';
-import type { RelayYamlConfig } from './types.js';
-
-const YAML_EXTENSIONS = ['.yaml', '.yml'] as const;
-
-export const BUILT_IN_TEMPLATE_NAMES = [
-  'feature-dev',
-  'bug-fix',
-  'code-review',
-  'security-audit',
-  'refactor',
-  'documentation',
-  'review-loop',
-] as const;
-
-export type BuiltInTemplateName = (typeof BUILT_IN_TEMPLATE_NAMES)[number];
-
-export interface TemplateRegistryOptions {
-  builtInTemplatesDir?: string;
-  customTemplatesDir?: string;
-  workspaceDir?: string;
-  fetcher?: typeof fetch;
-}
-
-export interface LoadTemplateOptions {
-  overrides?: Record<string, unknown>;
-}
-
-export interface TemplateShorthandConfig {
-  swarm: string;
-  overrides?: Record<string, unknown>;
-}
-
-export type TemplateReferenceInput =
-  | string
-  | RelayYamlConfig
-  | (Partial<Omit<RelayYamlConfig, 'swarm'>> & TemplateShorthandConfig);
-
-function isRecord(value: unknown): value is Record<string, unknown> {
-  return typeof value === 'object' && value !== null;
-}
-
-function hasYamlExtension(fileName: string): boolean {
-  return YAML_EXTENSIONS.some((ext) => fileName.endsWith(ext));
-}
-
-export class TemplateRegistry {
-  private readonly builtInTemplatesDir: string;
-  private readonly customTemplatesDir: string;
-  private readonly fetcher: typeof fetch;
-
-  constructor(options: TemplateRegistryOptions = {}) {
-    this.builtInTemplatesDir = this.resolveBuiltInTemplatesDir(options.builtInTemplatesDir);
-    this.customTemplatesDir = options.customTemplatesDir
-      ? path.resolve(options.customTemplatesDir)
-      : path.resolve(options.workspaceDir ?? process.cwd(), '.relay/workflows');
-
-    this.fetcher = options.fetcher ?? fetch;
-  }
-
-  listBuiltInTemplates(): string[] {
-    return [...BUILT_IN_TEMPLATE_NAMES];
-  }
-
-  async listCustomTemplates(): Promise<string[]> {
-    const files = await this.safeReadDir(this.customTemplatesDir);
-    return files
-      .filter((fileName) => hasYamlExtension(fileName))
-      .map((fileName) => this.normalizeTemplateName(fileName))
-      .sort();
-  }
-
-  async listTemplates(): Promise<string[]> {
-    const custom = await this.listCustomTemplates();
-    const merged = new Set<string>([...BUILT_IN_TEMPLATE_NAMES, ...custom]);
-    return Array.from(merged).sort();
-  }
-
-  async hasTemplate(name: string): Promise<boolean> {
-    try {
-      await this.resolveTemplatePath(name);
-      return true;
-    } catch {
-      return false;
-    }
-  }
-
-  async loadTemplate(name: string, options: LoadTemplateOptions = {}): Promise<RelayYamlConfig> {
-    const templatePath = await this.resolveTemplatePath(name);
-    const template = await this.readTemplateFile(templatePath);
-
-    if (options.overrides && Object.keys(options.overrides).length > 0) {
-      return this.applyOverrides(template, options.overrides);
-    }
-
-    return template;
-  }
-
-  async resolveTemplateReference(
-    input: TemplateReferenceInput,
-    options: LoadTemplateOptions = {}
-  ): Promise<RelayYamlConfig> {
-    if (typeof input === 'string') {
-      return this.loadTemplate(input, options);
-    }
-
-    if (this.isTemplateShorthand(input)) {
-      const { swarm, overrides = {}, ...rest } = input;
-      const mergedOverrides = {
-        ...overrides,
-        ...(options.overrides ?? {}),
-      };
-      const baseTemplate = await this.loadTemplate(swarm, {
-        overrides: mergedOverrides,
-      });
-      return this.mergeRelayConfig(baseTemplate, rest);
-    }
-
-    const config = this.cloneValue(input as RelayYamlConfig);
-
-    if (options.overrides && Object.keys(options.overrides).length > 0) {
-      return this.applyOverrides(config, options.overrides);
-    }
-
-    return config;
-  }
-
-  applyOverrides(config: RelayYamlConfig, overrides: Record<string, unknown>): RelayYamlConfig {
-    const nextConfig = this.cloneValue(config);
-
-    for (const [overridePath, value] of Object.entries(overrides)) {
-      this.setOverride(nextConfig, overridePath, value);
-    }
-
-    return nextConfig;
-  }
-
-  async installExternalTemplate(url: string, name?: string): Promise<string> {
-    const response = await this.fetcher(url);
-    if (!response.ok) {
-      throw new Error(`Failed to fetch template from ${url}: ${response.status} ${response.statusText}`);
-    }
-
-    const raw = await response.text();
-    const parsed = parseYaml(raw);
-
-    if (!isRecord(parsed)) {
-      throw new Error(`Template from ${url} is not a YAML object`);
-    }
-
-    const inferredName = typeof parsed.name === 'string' ? parsed.name : '';
-    const templateName = this.normalizeTemplateName(name ?? inferredName);
-
-    if (!templateName) {
-      throw new Error('Template name is required. Provide name explicitly or include a string "name" field.');
-    }
-
-    if (
-      templateName.includes('/') ||
-      templateName.includes('\\') ||
-      templateName.includes('..') ||
-      path.isAbsolute(templateName)
-    ) {
-      throw new Error(
-        `Invalid template name: "${templateName}" contains path separators or traversal sequences`
-      );
-    }
-
-    this.validateRelayConfig(parsed, url);
-
-    await fs.mkdir(this.customTemplatesDir, { recursive: true });
-    const targetPath = path.join(this.customTemplatesDir, `${templateName}.yaml`);
-    await fs.writeFile(targetPath, stringifyYaml(parsed), 'utf-8');
-    return targetPath;
-  }
-
-  private isTemplateShorthand(
-    input: TemplateReferenceInput
-  ): input is Partial<Omit<RelayYamlConfig, 'swarm'>> & TemplateShorthandConfig {
-    return isRecord(input) && typeof input.swarm === 'string';
-  }
-
-  private mergeRelayConfig(
-    base: RelayYamlConfig,
-    patch: Partial<Omit<RelayYamlConfig, 'swarm'>>
-  ): RelayYamlConfig {
-    const merged = this.cloneValue(base);
-
-    for (const [key, value] of Object.entries(patch)) {
-      if (value === undefined) {
-        continue;
-      }
-      (merged as unknown as Record<string, unknown>)[key] = this.cloneValue(value);
-    }
-
-    return merged;
-  }
-
-  private normalizeTemplateName(name: string): string {
-    return name.replace(/\.ya?ml$/i, '').trim();
-  }
-
-  private resolveBuiltInTemplatesDir(explicitDir?: string): string {
-    if (explicitDir) {
-      return path.resolve(explicitDir);
-    }
-
-    const currentDir = path.dirname(fileURLToPath(import.meta.url));
-    const candidates = [
-      path.resolve(currentDir, 'builtin-templates'),
-      path.resolve(currentDir, '../workflows/builtin-templates'),
-    ];
-
-    for (const candidate of candidates) {
-      if (existsSync(candidate)) {
-        return candidate;
-      }
-    }
-
-    return candidates[0];
-  }
-
-  private async resolveTemplatePath(name: string): Promise<string> {
-    const normalizedName = this.normalizeTemplateName(name);
-
-    const customPath = await this.findTemplatePath(this.customTemplatesDir, normalizedName);
-    if (customPath) {
-      return customPath;
-    }
-
-    const builtInPath = await this.findTemplatePath(this.builtInTemplatesDir, normalizedName);
-    if (builtInPath) {
-      return builtInPath;
-    }
-
-    throw new Error(`Template not found: ${name}`);
-  }
-
-  private async findTemplatePath(directory: string, templateName: string): Promise<string | undefined> {
-    for (const ext of YAML_EXTENSIONS) {
-      const candidate = path.join(directory, `${templateName}${ext}`);
-      try {
-        const stat = await fs.stat(candidate);
-        if (stat.isFile()) {
-          return candidate;
-        }
-      } catch {
-        // Continue checking other extensions.
-      }
-    }
-
-    return undefined;
-  }
-
-  private async readTemplateFile(templatePath: string): Promise<RelayYamlConfig> {
-    const raw = await fs.readFile(templatePath, 'utf-8');
-    const parsed = parseYaml(raw);
-
-    if (!isRecord(parsed)) {
-      throw new Error(`Template at ${templatePath} is not a YAML object`);
-    }
-
-    const normalized = this.normalizeLegacyTemplate(parsed);
-    this.validateRelayConfig(normalized, templatePath);
-    return normalized;
-  }
-
-  private normalizeLegacyTemplate(rawTemplate: Record<string, unknown>): Record<string, unknown> {
-    const normalized = this.cloneValue(rawTemplate);
-
-    if (!isRecord(normalized.swarm) && typeof normalized.pattern === 'string') {
-      normalized.swarm = { pattern: normalized.pattern };
-      delete normalized.pattern;
-    }
-
-    if (Array.isArray(normalized.agents)) {
-      normalized.agents = normalized.agents.map((agent) => {
-        if (!isRecord(agent)) {
-          return agent;
-        }
-
-        if (typeof agent.name !== 'string' && typeof agent.id === 'string') {
-          return { ...agent, name: agent.id };
-        }
-
-        return agent;
-      });
-    }
-
-    if (!Array.isArray(normalized.workflows) && isRecord(normalized.workflow)) {
-      const workflowName =
-        typeof normalized.name === 'string' ? `${normalized.name}-workflow` : 'default-workflow';
-
-      const workflow = normalized.workflow;
-      const steps = Array.isArray(workflow.steps)
-        ? workflow.steps.map((step) => this.normalizeLegacyStep(step)).filter((step) => step !== null)
-        : [];
-
-      normalized.workflows = [
-        {
-          name: workflowName,
-          description: typeof workflow.description === 'string' ? workflow.description : undefined,
-          onError: typeof workflow.onError === 'string' ? workflow.onError : undefined,
-          steps,
-        },
-      ];
-
-      delete normalized.workflow;
-    }
-
-    return normalized;
-  }
-
-  private normalizeLegacyStep(step: unknown): Record<string, unknown> | null {
-    if (!isRecord(step)) {
-      return null;
-    }
-
-    const name =
-      typeof step.name === 'string' ? step.name : typeof step.id === 'string' ? step.id : undefined;
-
-    const task =
-      typeof step.task === 'string' ? step.task : typeof step.prompt === 'string' ? step.prompt : undefined;
-
-    if (!name || typeof step.agent !== 'string' || !task) {
-      return null;
-    }
-
-    const normalized: Record<string, unknown> = {
-      name,
-      agent: step.agent,
-      task,
-    };
-
-    if (Array.isArray(step.dependsOn)) {
-      normalized.dependsOn = step.dependsOn;
-    }
-
-    if (typeof step.timeoutMs === 'number') {
-      normalized.timeoutMs = step.timeoutMs;
-    }
-
-    if (typeof step.retries === 'number') {
-      normalized.retries = step.retries;
-    } else if (typeof step.maxRetries === 'number') {
-      normalized.retries = step.maxRetries;
-    }
-
-    if (isRecord(step.verification)) {
-      normalized.verification = step.verification;
-    } else if (typeof step.expects === 'string') {
-      normalized.verification = {
-        type: 'output_contains',
-        value: step.expects,
-      };
-    }
-
-    return normalized;
-  }
-
-  private validateRelayConfig(rawConfig: unknown, source: string): asserts rawConfig is RelayYamlConfig {
-    if (!isRecord(rawConfig)) {
-      throw new Error(`Template at ${source} is not an object`);
-    }
-
-    if (typeof rawConfig.version !== 'string') {
-      throw new Error(`Template at ${source} is missing required string field: version`);
-    }
-
-    if (typeof rawConfig.name !== 'string') {
-      throw new Error(`Template at ${source} is missing required string field: name`);
-    }
-
-    if (!isRecord(rawConfig.swarm) || typeof rawConfig.swarm.pattern !== 'string') {
-      throw new Error(`Template at ${source} is missing required field: swarm.pattern`);
-    }
-
-    if (!Array.isArray(rawConfig.agents) || rawConfig.agents.length === 0) {
-      throw new Error(`Template at ${source} must include a non-empty agents array`);
-    }
-
-    for (const agent of rawConfig.agents) {
-      if (!isRecord(agent) || typeof agent.name !== 'string' || typeof agent.cli !== 'string') {
-        throw new Error(`Template at ${source} contains an invalid agent definition`);
-      }
-    }
-
-    if (rawConfig.workflows !== undefined) {
-      if (!Array.isArray(rawConfig.workflows)) {
-        throw new Error(`Template at ${source} has invalid workflows; expected an array`);
-      }
-
-      for (const workflow of rawConfig.workflows) {
-        if (!isRecord(workflow) || typeof workflow.name !== 'string' || !Array.isArray(workflow.steps)) {
-          throw new Error(`Template at ${source} contains an invalid workflow definition`);
-        }
-
-        for (const step of workflow.steps) {
-          if (!isRecord(step) || typeof step.name !== 'string') {
-            throw new Error(`Template at ${source} contains an invalid workflow step`);
-          }
-
-          // Deterministic steps require type and command
-          if (step.type === 'deterministic') {
-            if (typeof step.command !== 'string') {
-              throw new Error(
-                `Template at ${source} has deterministic step "${step.name}" without a command`
-              );
-            }
-          } else {
-            // Agent steps (type is undefined or 'agent') require agent and task
-            if (typeof step.agent !== 'string' || typeof step.task !== 'string') {
-              throw new Error(`Template at ${source} has agent step "${step.name}" without agent or task`);
-            }
-          }
-        }
-      }
-    }
-  }
-
-  private setOverride(config: RelayYamlConfig, overridePath: string, value: unknown): void {
-    const pathParts = overridePath
-      .replace(/\[(\d+)\]/g, '.$1')
-      .split('.')
-      .map((part) => part.trim())
-      .filter(Boolean);
-
-    if (pathParts.length === 0) {
-      return;
-    }
-
-    if (pathParts[0] === 'steps') {
-      const workflow = config.workflows?.[0];
-      if (!workflow) {
-        throw new Error(`Cannot apply override "${overridePath}": workflows[0] is missing`);
-      }
-      this.setOnValue(workflow.steps as unknown, pathParts.slice(1), value, overridePath);
-      return;
-    }
-
-    if (pathParts[0] === 'workflow' && pathParts[1] === 'steps') {
-      const workflow = config.workflows?.[0];
-      if (!workflow) {
-        throw new Error(`Cannot apply override "${overridePath}": workflows[0] is missing`);
-      }
-      this.setOnValue(workflow.steps as unknown, pathParts.slice(2), value, overridePath);
-      return;
-    }
-
-    this.setOnValue(config as unknown, pathParts, value, overridePath);
-  }
-
-  private setOnValue(target: unknown, pathParts: string[], value: unknown, fullPath: string): void {
-    if (pathParts.length === 0) {
-      throw new Error(`Invalid override path: ${fullPath}`);
-    }
-
-    let current: unknown = target;
-
-    for (let i = 0; i < pathParts.length - 1; i += 1) {
-      const part = pathParts[i];
-      const nextPart = pathParts[i + 1];
-
-      if (Array.isArray(current)) {
-        const index = this.resolveArrayItemIndex(current, part);
-        if (index < 0) {
-          throw new Error(`Cannot apply override "${fullPath}": array item "${part}" was not found`);
-        }
-        current = current[index];
-        continue;
-      }
-
-      if (!isRecord(current)) {
-        throw new Error(`Cannot apply override "${fullPath}": segment "${part}" is not an object`);
-      }
-
-      if (!(part in current) || current[part] === undefined || current[part] === null) {
-        current[part] = /^\d+$/.test(nextPart) ? [] : {};
-      }
-
-      current = current[part];
-    }
-
-    const finalPart = pathParts[pathParts.length - 1];
-
-    if (Array.isArray(current)) {
-      const index = this.resolveArrayItemIndex(current, finalPart);
-      if (index < 0) {
-        throw new Error(`Cannot apply override "${fullPath}": array item "${finalPart}" was not found`);
-      }
-      current[index] = value;
-      return;
-    }
-
-    if (!isRecord(current)) {
-      throw new Error(`Cannot apply override "${fullPath}": parent object is invalid`);
-    }
-
-    current[finalPart] = value;
-  }
-
-  private resolveArrayItemIndex(items: unknown[], segment: string): number {
-    if (/^\d+$/.test(segment)) {
-      const index = Number.parseInt(segment, 10);
-      return index >= 0 && index < items.length ? index : -1;
-    }
-
-    return items.findIndex(
-      (item) =>
-        isRecord(item) &&
-        ((typeof item.name === 'string' && item.name === segment) ||
-          (typeof item.id === 'string' && item.id === segment))
-    );
-  }
-
-  private async safeReadDir(directory: string): Promise<string[]> {
-    try {
-      return await fs.readdir(directory);
-    } catch {
-      return [];
-    }
-  }
-
-  private cloneValue<T>(value: T): T {
-    if (typeof structuredClone === 'function') {
-      return structuredClone(value);
-    }
-
-    return JSON.parse(JSON.stringify(value)) as T;
-  }
-}
diff --git a/packages/sdk/src/workflows/trajectory.ts b/packages/sdk/src/workflows/trajectory.ts
deleted file mode 100644
index 557edca76..000000000
--- a/packages/sdk/src/workflows/trajectory.ts
+++ /dev/null
@@ -1,563 +0,0 @@
-/** WorkflowTrajectory records canonical workflow trajectories via agent-trajectories. */
-import { dirname, join } from 'node:path';
-import {
-  FileStorage,
-  abandonTrajectory,
-  addChapter as appendChapter,
-  addEvent as appendEvent,
-  completeTrajectory,
-  createTrajectory,
-  type EventSignificance,
-  type Trajectory,
-  type TrajectoryEventType,
-} from 'agent-trajectories';
-import type { StepCompletionDecision, TrajectoryConfig, WorkflowStep } from './types.js';
-
-type WorkflowTrajectoryEventType =
-  | TrajectoryEventType
-  | 'review-completed'
-  | 'completion-marker'
-  | 'completion-evidence';
-
-type WorkflowTrajectoryAgent = {
-  name: string;
-  role: string;
-  joinedAt: string;
-  leftAt?: string;
-};
-
-// agent-trajectories runtime accepts workflow metadata and open-ended roles,
-// while some published declaration aliases are narrower.
-type WorkflowTrajectoryData = Omit<Trajectory, 'agents'> & {
-  agents: WorkflowTrajectoryAgent[];
-  workflowId?: string;
-};
-
-interface StepParticipants {
-  role?: string;
-  owner?: string;
-  specialist?: string;
-  reviewer?: string;
-}
-export interface StepOutcome {
-  name: string;
-  agent: string;
-  status: 'completed' | 'failed' | 'skipped';
-  attempts: number;
-  output?: string;
-  error?: string;
-  verificationPassed?: boolean;
-  verificationValue?: string;
-  nonInteractive?: boolean;
-  durationMs?: number;
-  completionMode?: StepCompletionDecision['mode'];
-}
-
-type FailureCause =
-  | 'timeout'
-  | 'verification_mismatch'
-  | 'spawn_failed'
-  | 'exit_nonzero'
-  | 'aborted'
-  | 'unknown';
-
-function classifyFailure(error: string): FailureCause {
-  const e = error.toLowerCase();
-  if (e.includes('timed out') || e.includes('timeout')) return 'timeout';
-  if (e.includes('output does not contain') || e.includes('verification failed'))
-    return 'verification_mismatch';
-  if (e.includes('failed to spawn') || e.includes('enoent')) return 'spawn_failed';
-  if (e.includes('exit code') || e.includes('exited with')) return 'exit_nonzero';
-  if (e.includes('aborted') || e.includes('cancelled')) return 'aborted';
-  return 'unknown';
-}
-
-function diagnosisFor(cause: FailureCause, outcome: StepOutcome): string {
-  switch (cause) {
-    case 'timeout':
-      return outcome.nonInteractive
-        ? 'Non-interactive agent timed out — the task is likely too large or complex for a single subprocess call. Consider pre-reading large files in a deterministic step and injecting only the relevant excerpt via {{steps.X.output}}.'
-        : 'Interactive agent timed out — it may have gone idle, failed to self-terminate, or the task scope was too broad. Check if the agent was waiting for relay signals that never arrived.';
-    case 'verification_mismatch':
-      return `Agent completed but did not output the expected sentinel "${outcome.verificationValue ?? '(unknown)'}". The task prompt may not clearly specify the required output format, or the agent produced correct work but did not emit the signal.`;
-    case 'spawn_failed':
-      return 'The agent process could not be started — the CLI binary may be missing from PATH or the working directory is incorrect.';
-    case 'exit_nonzero':
-      return 'The agent process exited with a non-zero exit code. Check stderr for the root cause.';
-    case 'aborted':
-      return 'The step was cancelled (user interrupt or upstream abort).';
-    default:
-      return 'Unexpected failure. Review the error and step definition.';
-  }
-}
-
-function buildSynthesis(label: string, outcomes: StepOutcome[], unblocks?: string[]): string {
-  const completed = outcomes.filter((o) => o.status === 'completed');
-  const failed = outcomes.filter((o) => o.status === 'failed');
-  const retried = outcomes.filter((o) => o.attempts > 1 && o.status !== 'failed');
-  const parts: string[] = [`${label} resolved.`, `${completed.length}/${outcomes.length} steps completed.`];
-  if (failed.length > 0)
-    parts.push(`${failed.length} step(s) failed: ${failed.map((s) => s.name).join(', ')}.`);
-  if (retried.length > 0)
-    parts.push(`${retried.length} step(s) required retries: ${retried.map((s) => s.name).join(', ')}.`);
-  else if (failed.length === 0) parts.push('All steps completed on first attempt.');
-  if (unblocks?.length) parts.push(`Unblocking: ${unblocks.join(', ')}.`);
-  return parts.join(' ');
-}
-
-function computeConfidence(outcomes: StepOutcome[]): number {
-  if (outcomes.length === 0) return 0.7;
-  const total = outcomes.length;
-  const completed = outcomes.filter((o) => o.status === 'completed').length;
-  const firstAttempt = outcomes.filter((o) => o.attempts === 1 && o.status === 'completed').length;
-  const verified = outcomes.filter((o) => o.verificationPassed).length;
-  return Math.min(1, 0.5 * (completed / total) + 0.25 * (firstAttempt / total) + 0.25 * (verified / total));
-}
-
-function formatElapsed(elapsed: number, long: boolean): string {
-  return elapsed > 60_000
-    ? `${Math.round(elapsed / 60_000)}${long ? ' minutes' : 'min'}`
-    : `${Math.round(elapsed / 1_000)}${long ? ' seconds' : 's'}`;
-}
-
-function buildRunSummary(outcomes: StepOutcome[], startTime: number): string {
-  const completed = outcomes.filter((o) => o.status === 'completed');
-  const failed = outcomes.filter((o) => o.status === 'failed');
-  const skipped = outcomes.filter((o) => o.status === 'skipped');
-  const elapsedStr = formatElapsed(Date.now() - startTime, false);
-  if (failed.length === 0) {
-    const retried = completed.filter((o) => o.attempts > 1);
-    const base = `All ${completed.length} steps completed in ${elapsedStr}.`;
-    return retried.length > 0
-      ? `${base} ${retried.length} step(s) needed retries: ${retried.map((o) => o.name).join(', ')}.`
-      : base;
-  }
-  const firstFailure = failed[0];
-  const cause = classifyFailure(firstFailure.error ?? '');
-  const cascaded =
-    skipped.length > 0
-      ? ` Caused ${skipped.length} downstream step(s) to be skipped: ${skipped.map((o) => o.name).join(', ')}.`
-      : '';
-  return `Failed at "${firstFailure.name}" [${cause}] after ${elapsedStr}.${cascaded} ${completed.length}/${outcomes.length} steps completed before failure.`;
-}
-
-function extractLearnings(outcomes: StepOutcome[]): string[] {
-  const learnings: string[] = [];
-  const timeouts = outcomes.filter(
-    (o) => o.status === 'failed' && classifyFailure(o.error ?? '') === 'timeout'
-  );
-  if (timeouts.some((o) => o.nonInteractive))
-    learnings.push(
-      `Non-interactive agent timeouts detected (${timeouts.map((o) => o.name).join(', ')}). Use deterministic steps to pre-read files and inject content — non-interactive agents should not discover information via tools.`
-    );
-  const verifyFails = outcomes.filter(
-    (o) => o.status === 'failed' && classifyFailure(o.error ?? '') === 'verification_mismatch'
-  );
-  if (verifyFails.length > 0)
-    learnings.push(
-      `Verification mismatch on: ${verifyFails.map((o) => `"${o.name}" (expected "${o.verificationValue ?? '?'}")`).join(', ')}. Make the required output format more explicit in the task prompt.`
-    );
-  const retried = outcomes.filter((o) => o.attempts > 1 && o.status === 'completed');
-  if (retried.length > 0)
-    learnings.push(
-      `${retried.map((o) => `"${o.name}" (${o.attempts} attempts)`).join(', ')} succeeded after retries — consider adding clearer output instructions to reduce retries.`
-    );
-  return learnings;
-}
-
-const extractChallenges = (outcomes: StepOutcome[]): string[] =>
-  outcomes
-    .filter((o) => o.status === 'failed')
-    .map((step) => diagnosisFor(classifyFailure(step.error ?? ''), step));
-
-export class WorkflowTrajectory {
-  private trajectory: WorkflowTrajectoryData | null = null;
-  private storage?: FileStorage;
-  private storageInit?: Promise<void>;
-  private readonly enabled: boolean;
-  private readonly reflectOnBarriers: boolean;
-  private readonly reflectOnConverge: boolean;
-  private readonly autoDecisions: boolean;
-  private readonly storageBaseDir: string;
-  private readonly runId: string;
-  private startTime = 0;
-  private swarmPattern = 'dag';
-
-  constructor(config: TrajectoryConfig | false | undefined, runId: string, cwd: string) {
-    const cfg = config === false ? { enabled: false } : (config ?? {});
-    this.enabled = cfg.enabled !== false;
-    this.reflectOnBarriers = cfg.reflectOnBarriers !== false;
-    this.reflectOnConverge = cfg.reflectOnConverge !== false;
-    this.autoDecisions = cfg.autoDecisions !== false;
-    this.runId = runId;
-    const dataDir = process.env.TRAJECTORIES_DATA_DIR ?? join(cwd, '.trajectories');
-    this.storageBaseDir = process.env.TRAJECTORIES_DATA_DIR ? dirname(dataDir) : cwd;
-  }
-
-  async start(
-    workflowName: string,
-    stepCount: number,
-    trackInfo?: string,
-    description?: string,
-    pattern?: string
-  ): Promise<void> {
-    if (!this.enabled) return;
-    this.startTime = Date.now();
-    this.swarmPattern = pattern ?? 'dag';
-    const trajectory = createTrajectory({
-      title: workflowName,
-      description,
-      source: { system: 'workflow-runner', id: this.runId },
-    }) as WorkflowTrajectoryData;
-    const workflowId = process.env.TRAJECTORIES_WORKFLOW_ID?.trim();
-    if (workflowId) trajectory.workflowId = workflowId;
-    this.trajectory = trajectory;
-    this.trajectory.agents.push({
-      name: 'orchestrator',
-      role: 'workflow-runner',
-      joinedAt: new Date().toISOString(),
-    });
-    this.openChapter('Planning', 'orchestrator');
-    if (description) this.addEvent('note', `Purpose: ${description.trim()}`);
-    this.addEvent(
-      'note',
-      `Approach: ${stepCount}-step ${this.swarmPattern} workflow${trackInfo ? ` — ${trackInfo}` : ''}`
-    );
-    await this.flush();
-  }
-
-  async beginTrack(trackName: string): Promise<void> {
-    if (this.enabled && this.trajectory) {
-      this.openChapter(`Execution: ${trackName}`, 'orchestrator');
-      await this.flush();
-    }
-  }
-  async beginConvergence(label: string): Promise<void> {
-    if (this.enabled && this.trajectory) {
-      this.openChapter(`Convergence: ${label}`, 'orchestrator');
-      await this.flush();
-    }
-  }
-
-  async stepStarted(step: WorkflowStep, agent: string, participants?: StepParticipants): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    await this.registerAgent(agent, participants?.role ?? step.agent ?? 'deterministic');
-    if (participants?.owner && participants.owner !== agent)
-      await this.registerAgent(participants.owner, 'owner');
-    if (participants?.specialist) await this.registerAgent(participants.specialist, 'specialist');
-    if (participants?.reviewer) await this.registerAgent(participants.reviewer, 'reviewer');
-    this.openChapter(`Execution: ${step.name}`, agent);
-    const intent = step.task
-      ? step.task
-          .trim()
-          .split(/\n|\.(?=\s)/)[0]
-          .trim()
-          .slice(0, 120)
-      : `${step.type ?? 'deterministic'} step`;
-    this.addEvent('note', `"${step.name}": ${intent}`, undefined, { agent });
-    await this.flush();
-  }
-
-  async registerAgent(name: string, role: string): Promise<void> {
-    if (!this.enabled || !this.trajectory || this.trajectory.agents.some((agent) => agent.name === name))
-      return;
-    this.trajectory.agents.push({ name, role, joinedAt: new Date().toISOString() });
-    await this.flush();
-  }
-
-  async stepSupervisionAssigned(
-    step: WorkflowStep,
-    supervised: { owner: { name: string }; specialist: { name: string }; reviewer?: { name: string } }
-  ): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    await this.registerAgent(supervised.owner.name, 'owner');
-    await this.registerAgent(supervised.specialist.name, 'specialist');
-    if (supervised.reviewer?.name) await this.registerAgent(supervised.reviewer.name, 'reviewer');
-    const reviewerNote = supervised.reviewer?.name ? `, reviewer=${supervised.reviewer.name}` : '';
-    this.addEvent(
-      'decision',
-      `"${step.name}" supervision assigned → owner=${supervised.owner.name}, specialist=${supervised.specialist.name}${reviewerNote}`,
-      'medium',
-      {
-        owner: supervised.owner.name,
-        specialist: supervised.specialist.name,
-        reviewer: supervised.reviewer?.name,
-      }
-    );
-    await this.flush();
-  }
-
-  async ownerMonitoringEvent(
-    stepName: string,
-    owner: string,
-    detail: string,
-    raw?: Record<string, unknown>
-  ): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    this.addEvent(
-      'note',
-      `"${stepName}" owner ${owner}: ${detail}`,
-      'medium',
-      raw ? { owner, ...raw } : { owner }
-    );
-    await this.flush();
-  }
-
-  async reviewCompleted(
-    stepName: string,
-    reviewerName: string,
-    decision: 'approved' | 'rejected',
-    reason?: string
-  ): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    this.addEvent('review-completed', `"${stepName}" review ${decision} by ${reviewerName}`, 'medium', {
-      stepName,
-      reviewer: reviewerName,
-      decision,
-      reason,
-    });
-    await this.flush();
-  }
-
-  async stepCompletionDecision(stepName: string, decision: StepCompletionDecision): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    const modeLabel = decision.mode === 'marker' ? 'marker-based' : `${decision.mode}-based`;
-    const reason = decision.reason ? ` — ${decision.reason}` : '';
-    const evidence = this.formatCompletionEvidenceSummary(decision.evidence);
-    this.addEvent(
-      decision.mode === 'marker' ? 'completion-marker' : 'completion-evidence',
-      `"${stepName}" ${modeLabel} completion${reason}${evidence ? ` (${evidence})` : ''}`,
-      'medium',
-      { stepName, completionMode: decision.mode, reason: decision.reason, evidence: decision.evidence }
-    );
-    await this.flush();
-  }
-
-  async stepCompleted(
-    step: WorkflowStep,
-    output: string,
-    attempt: number,
-    decision?: StepCompletionDecision
-  ): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    if (decision) await this.stepCompletionDecision(step.name, decision);
-    const lines = output
-      .split('\n')
-      .map((line) => line.trim())
-      .filter(Boolean);
-    const lastMeaningful = lines.at(-1) ?? '';
-    const completion =
-      lastMeaningful.length > 0 && lastMeaningful.length < 100
-        ? lastMeaningful
-        : output.trim().slice(0, 120) || '(no output)';
-    this.addEvent(
-      'finding',
-      `"${step.name}" completed${attempt > 1 ? ` (after ${attempt} attempts)` : ''}${decision ? ` [${decision.mode}]` : ''} → ${completion}`,
-      'medium'
-    );
-    await this.flush();
-  }
-
-  async stepFailed(
-    step: WorkflowStep,
-    error: string,
-    attempt: number,
-    maxRetries: number,
-    outcome?: Partial<StepOutcome>
-  ): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    const cause = classifyFailure(error);
-    const diagnosis = diagnosisFor(cause, {
-      name: step.name,
-      agent: outcome?.agent ?? step.agent ?? '',
-      status: 'failed',
-      attempts: attempt,
-      error,
-      verificationValue: outcome?.verificationValue,
-      nonInteractive: outcome?.nonInteractive,
-    });
-    this.addEvent('error', `"${step.name}" failed [${cause}]: ${diagnosis}`, 'high', {
-      cause,
-      rawError: error,
-      attempt,
-      maxRetries,
-    });
-    await this.flush();
-  }
-
-  async stepSkipped(step: WorkflowStep, reason: string): Promise<void> {
-    if (this.enabled && this.trajectory) {
-      this.addEvent('note', `"${step.name}" skipped — ${reason}`);
-      await this.flush();
-    }
-  }
-  async stepRetrying(step: WorkflowStep, attempt: number, maxRetries: number): Promise<void> {
-    if (this.enabled && this.trajectory) {
-      this.addEvent('note', `"${step.name}" retrying (attempt ${attempt}/${maxRetries + 1})`);
-      await this.flush();
-    }
-  }
-
-  async reflect(synthesis: string, confidence: number, focalPoints?: string[]): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    this.addEvent(
-      'reflection',
-      synthesis,
-      'high',
-      focalPoints?.length ? { confidence, focalPoints } : { confidence }
-    );
-    await this.flush();
-  }
-
-  async synthesizeAndReflect(label: string, outcomes: StepOutcome[], unblocks?: string[]): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    await this.beginConvergence(label);
-    await this.reflect(
-      buildSynthesis(label, outcomes, unblocks),
-      computeConfidence(outcomes),
-      outcomes.map((o) => `${o.name}: ${o.status}`)
-    );
-  }
-
-  async decide(question: string, chosen: string, reasoning: string): Promise<void> {
-    if (!this.enabled || !this.trajectory || !this.autoDecisions) return;
-    this.addEvent('decision', `${question} → ${chosen}: ${reasoning}`, 'medium', {
-      question,
-      chosen,
-      reasoning,
-    });
-    await this.flush();
-  }
-
-  async complete(
-    summary: string,
-    confidence: number,
-    meta?: { learnings?: string[]; challenges?: string[] }
-  ): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    this.openChapter('Retrospective', 'orchestrator');
-    this.addEvent(
-      'reflection',
-      `${summary} (completed in ${formatElapsed(Date.now() - this.startTime, true)})`,
-      'high'
-    );
-    this.trajectory = completeTrajectory(this.trajectory as Trajectory, {
-      summary,
-      approach: this.buildApproach(),
-      confidence,
-      learnings: meta?.learnings,
-      challenges: meta?.challenges,
-    }) as WorkflowTrajectoryData;
-    await this.flush();
-  }
-
-  async abandon(
-    reason: string,
-    meta?: { summary?: string; confidence?: number; learnings?: string[]; challenges?: string[] }
-  ): Promise<void> {
-    if (!this.enabled || !this.trajectory) return;
-    const summary = meta?.summary ?? `Workflow abandoned: ${reason}`;
-    this.openChapter('Retrospective', 'orchestrator');
-    this.addEvent(
-      'reflection',
-      `${summary} (abandoned after ${formatElapsed(Date.now() - this.startTime, true)})`,
-      'high'
-    );
-    this.addEvent('error', `Workflow abandoned: ${reason}`, 'high');
-    this.trajectory = {
-      ...abandonTrajectory(this.trajectory as Trajectory),
-      retrospective: {
-        summary,
-        approach: this.buildApproach(),
-        confidence: meta?.confidence ?? 0,
-        learnings: meta?.learnings,
-        challenges: meta?.challenges,
-      },
-    } as WorkflowTrajectoryData;
-    await this.flush();
-  }
-
-  isEnabled(): boolean {
-    return this.enabled;
-  }
-  shouldReflectOnConverge(): boolean {
-    return this.enabled && this.reflectOnConverge;
-  }
-  shouldReflectOnBarriers(): boolean {
-    return this.enabled && this.reflectOnBarriers;
-  }
-  getTrajectoryId(): string | null {
-    return this.trajectory?.id ?? null;
-  }
-  buildSynthesis(label: string, outcomes: StepOutcome[], unblocks?: string[]): string {
-    return buildSynthesis(label, outcomes, unblocks);
-  }
-  computeConfidence(outcomes: StepOutcome[]): number {
-    return computeConfidence(outcomes);
-  }
-  buildRunSummary(outcomes: StepOutcome[]): string {
-    return buildRunSummary(outcomes, this.startTime);
-  }
-  extractLearnings(outcomes: StepOutcome[]): string[] {
-    return extractLearnings(outcomes);
-  }
-  extractChallenges(outcomes: StepOutcome[]): string[] {
-    return extractChallenges(outcomes);
-  }
-
-  private openChapter(title: string, agentName: string): void {
-    if (!this.trajectory) return;
-    this.trajectory = appendChapter(this.trajectory as Trajectory, {
-      title,
-      agentName,
-    }) as WorkflowTrajectoryData;
-  }
-
-  private addEvent(
-    type: WorkflowTrajectoryEventType,
-    content: string,
-    significance?: EventSignificance,
-    raw?: Record<string, unknown>
-  ): void {
-    if (!this.trajectory) return;
-    this.trajectory = appendEvent(this.trajectory as Trajectory, {
-      type: type as TrajectoryEventType,
-      content,
-      significance,
-      raw,
-    }) as WorkflowTrajectoryData;
-  }
-
-  private buildApproach(): string {
-    return `${this.swarmPattern} workflow (${this.trajectory?.agents.filter((a) => a.role !== 'workflow-runner').length ?? 0} agents)`;
-  }
-
-  private formatCompletionEvidenceSummary(
-    evidence: StepCompletionDecision['evidence'] | undefined
-  ): string | undefined {
-    if (!evidence) return undefined;
-    const parts: string[] = [];
-    if (evidence.summary) parts.push(evidence.summary);
-    if (evidence.signals?.length) parts.push(`signals=${evidence.signals.join(', ')}`);
-    if (evidence.channelPosts?.length) parts.push(`channel=${evidence.channelPosts.join(' | ')}`);
-    if (evidence.files?.length) parts.push(`files=${evidence.files.join(', ')}`);
-    if (evidence.exitCode !== undefined) parts.push(`exit=${evidence.exitCode}`);
-    return parts.length > 0 ? parts.join('; ') : undefined;
-  }
-
-  private async ensureStorage(): Promise<void> {
-    this.storage ??= new FileStorage(this.storageBaseDir);
-    this.storageInit ??= this.storage.initialize();
-    await this.storageInit;
-  }
-
-  private async flush(): Promise<void> {
-    if (!this.trajectory) return;
-    try {
-      await this.ensureStorage();
-      await this.storage?.save(this.trajectory as Trajectory);
-    } catch {
-      // non-blocking: flush failures must never break the workflow
-    }
-  }
-}
diff --git a/packages/sdk/src/workflows/types.ts b/packages/sdk/src/workflows/types.ts
deleted file mode 100644
index 099e1fd27..000000000
--- a/packages/sdk/src/workflows/types.ts
+++ /dev/null
@@ -1,640 +0,0 @@
-/**
- * Workflow Types for Relay Cloud Swarm Patterns
- *
- * Shared TypeScript types for relay.yaml configuration, workflow execution,
- * and database row representations.
- */
-
-export * from '@agent-relay/workflow-types';
-export type {
-  AccessPreset,
-  AgentCli,
-  AgentDefinition,
-  AgentPermissions,
-  AgentPreset,
-  NetworkPermission,
-  PermissionProfileDefinition,
-  RunnerStepExecutor,
-  SwarmPattern,
-  VerificationCheck,
-  WorkflowStep,
-  WorkflowStepType,
-} from '@agent-relay/workflow-types';
-
-import type {
-  AccessPreset,
-  AgentDefinition,
-  AgentPermissions,
-  NetworkPermission,
-  PermissionProfileDefinition,
-  SwarmPattern,
-  WorkflowStep,
-  WorkflowStepType,
-} from '@agent-relay/workflow-types';
-
-// ── relay.yaml top-level config ─────────────────────────────────────────────
-
-/** Top-level relay.yaml configuration file structure. */
-export interface RelayYamlConfig {
-  version: string;
-  name: string;
-  description?: string;
-  /** Reusable permission profiles that agents can reference via permissions.profile. */
-  permission_profiles?: Record<string, PermissionProfileDefinition>;
-  /** Named paths to external directories used by this workflow.
-   *  The primary working directory defaults to cwd and does not need to be declared.
-   *  Use this to declare additional directories so the runner can validate them
-   *  in preflight and agents can reference them via `workdir`. */
-  paths?: PathDefinition[];
-  swarm: SwarmConfig;
-  agents: AgentDefinition[];
-  workflows?: WorkflowDefinition[];
-  coordination?: CoordinationConfig;
-  state?: StateConfig;
-  errorHandling?: ErrorHandlingConfig;
-  trajectories?: TrajectoryConfig | false;
-}
-
-// ── Path definitions ────────────────────────────────────────────────────────
-
-/** A named path to an external directory for cross-repo workflows.
- *  Only needed for directories outside the default working directory. */
-export interface PathDefinition {
-  /** Unique name used to reference this path (e.g. "relaycast"). */
-  name: string;
-  /** Directory path, resolved relative to the YAML file.
-   *  Supports environment variables: "$HOME/.openclaw", "$RELAY_ROOT/packages/sdk". */
-  path: string;
-  /** Human-readable description of this path's role in the workflow. */
-  description?: string;
-  /** Whether this path is required. If true (default), preflight fails if it doesn't exist. */
-  required?: boolean;
-}
-
-// ── Trajectory configuration ─────────────────────────────────────────────────
-
-/** Configuration for workflow trajectory recording. */
-export interface TrajectoryConfig {
-  /** Enable trajectory recording (default: true). */
-  enabled?: boolean;
-  /** Auto-reflect when barriers resolve (default: true). */
-  reflectOnBarriers?: boolean;
-  /** Auto-reflect when parallel tracks converge (default: true). */
-  reflectOnConverge?: boolean;
-  /** Record retry/skip/fail decisions automatically (default: true). */
-  autoDecisions?: boolean;
-}
-
-// ── Swarm configuration ─────────────────────────────────────────────────────
-
-/** Configuration for idle agent detection and nudging. */
-export interface IdleNudgeConfig {
-  /** ms after idle detection before first nudge (default: 120_000 = 2 min). */
-  nudgeAfterMs?: number;
-  /** ms after nudge before force-release (default: 120_000 = 2 min). */
-  escalateAfterMs?: number;
-  /** Max nudges before escalation (default: 1). */
-  maxNudges?: number;
-}
-
-/** Provider-specific credential settings for the credential proxy. */
-export interface CredentialProxyProviderConfig {
-  /** Reference to the credential in the credential store. */
-  credentialId: string;
-  /** Optional env var name to read the provider API key from as a fallback. */
-  apiKeyEnvVar?: string;
-}
-
-/** Swarm-level credential proxy configuration. */
-export interface CredentialProxyConfig {
-  /** Proxy endpoint URL. */
-  proxyUrl: string;
-  /** JWT signing secret. Defaults to env RELAY_PROXY_JWT_SECRET when omitted. */
-  jwtSecret?: string;
-  /** Default max-token budget per agent session. */
-  defaultBudget?: number;
-  /** Provider credential mappings keyed by provider name. */
-  providers: Record<string, CredentialProxyProviderConfig>;
-}
-
-/** Swarm-level settings controlling the overall pattern. */
-export interface SwarmConfig {
-  pattern: SwarmPattern;
-  maxConcurrency?: number;
-  timeoutMs?: number;
-  /** Max total tokens across all steps in the workflow. */
-  tokenBudget?: number;
-  channel?: string;
-  /** Optional credential proxy configuration for agent API access. */
-  credentialProxy?: CredentialProxyConfig;
-  /** Idle agent detection and nudging configuration for interactive agents. */
-  idleNudge?: IdleNudgeConfig;
-  /**
-   * Grace period (ms) after an agent exits with code 0 but without posting
-   * the expected coordination signal. During this window the runner checks
-   * verification gates and evidence before failing the step.
-   * Default: 5000 (5 seconds). Set to 0 to disable.
-   */
-  completionGracePeriodMs?: number;
-}
-
-// ── Compiled / resolved permissions ─────────────────────────────────────────
-
-/**
- * Fully resolved agent permissions after merging:
- *   dotfile patterns + access preset + explicit YAML file rules + custom scopes
- *
- * Produced by the permission resolver at spawn time and used to:
- *   1. Mint the agent's relayauth token (scopes)
- *   2. Configure the relayfile mount (readonlyPaths, readwritePaths, deniedPaths)
- *   3. Enforce runtime restrictions (network, exec allowlist)
- */
-export interface CompiledAgentPermissions {
-  /** Agent this permission set applies to. */
-  agentName: string;
-
-  /** Workspace the agent belongs to. */
-  workspace: string;
-
-  /** The effective access level after resolution. */
-  effectiveAccess: AccessPreset;
-
-  /** Whether dotfile patterns were inherited. */
-  inherited: boolean;
-
-  /** Source of each permission layer for audit/debug. */
-  sources: PermissionSource[];
-
-  // ── Resolved file paths ──────────────────────────────────────────────────
-
-  /** Glob patterns that resolved to read-only access. */
-  readonlyPatterns: string[];
-
-  /** Glob patterns that resolved to read-write access. */
-  readwritePatterns: string[];
-
-  /** Glob patterns explicitly denied (no access). */
-  deniedPatterns: string[];
-
-  /** Concrete file paths with read-only access (after walking the project). */
-  readonlyPaths: string[];
-
-  /** Concrete file paths with read-write access (after walking the project). */
-  readwritePaths: string[];
-
-  /** Concrete file paths denied to the agent. */
-  deniedPaths: string[];
-
-  // ── Token scopes ─────────────────────────────────────────────────────────
-
-  /** Merged relayauth scopes for the agent's token.
-   *  Combines auto-generated file scopes + explicit custom scopes. */
-  scopes: string[];
-
-  // ── Runtime restrictions ─────────────────────────────────────────────────
-
-  /** Network access control. Undefined means unrestricted. */
-  network?: NetworkPermission;
-
-  /** Allowed exec command prefixes. Undefined means unrestricted. */
-  exec?: string[];
-
-  // ── ACL (for relayfile mount) ────────────────────────────────────────────
-
-  /** Directory-level ACL rules for the relayfile mount.
-   *  Keys are normalized directory paths, values are rule arrays. */
-  acl: Record<string, string[]>;
-
-  /** Summary counts for quick inspection. */
-  summary: {
-    readonly: number;
-    readwrite: number;
-    denied: number;
-    customScopes: number;
-  };
-}
-
-/** Identifies where a permission rule originated. */
-export interface PermissionSource {
-  /** Source type. */
-  type: 'dotfile' | 'preset' | 'yaml' | 'scope';
-  /** Human-readable description (e.g. '.agentignore', 'access: readonly'). */
-  label: string;
-  /** Number of rules contributed by this source. */
-  ruleCount: number;
-}
-
-// ── Type guards ─────────────────────────────────────────────────────────────
-
-/**
- * Returns true if the agent has restricted permissions —
- * i.e., it has explicit permissions set AND those permissions limit access
- * beyond the default readwrite+inherit behavior.
- *
- * An agent is considered restricted if any of the following are true:
- *   - access is 'readonly' or 'restricted'
- *   - files.deny has entries
- *   - network is false or an allowlist/denylist object
- *   - exec allowlist is set (any commands at all = restricted execution)
- *   - inherit is explicitly false (opts out of dotfile protections)
- */
-export function isRestrictedAgent(agent: AgentDefinition): boolean {
-  const perms = agent.permissions;
-  if (!perms) return false;
-
-  if (perms.access === 'readonly' || perms.access === 'restricted') return true;
-  if (perms.files?.deny && perms.files.deny.length > 0) return true;
-  if (perms.network === false || (typeof perms.network === 'object' && perms.network !== null)) return true;
-  if (perms.exec && perms.exec.length > 0) return true;
-  if (perms.inherit === false) return true;
-
-  return false;
-}
-
-// ── Workflow definitions ────────────────────────────────────────────────────
-
-/** Preflight check that runs before any workflow steps. */
-export interface PreflightCheck {
-  /** Shell command to execute. */
-  command: string;
-  /** Fail if output matches this condition: "non-empty", "empty", or a regex pattern. */
-  failIf?: 'non-empty' | 'empty' | string;
-  /** Succeed only if output matches this condition. */
-  successIf?: string;
-  /** Human-readable description of what this check validates. */
-  description?: string;
-}
-
-/** A named workflow composed of sequential or parallel steps. */
-export interface WorkflowDefinition {
-  name: string;
-  description?: string;
-  /** Preflight checks that run before any steps. All must pass. */
-  preflight?: PreflightCheck[];
-  steps: WorkflowStep[];
-  onError?: 'fail' | 'skip' | 'retry';
-}
-
-// ── Custom step definitions ─────────────────────────────────────────────────
-
-/** Parameter definition for a custom step. */
-export interface CustomStepParam {
-  /** Parameter name. */
-  name: string;
-  /** Whether this parameter is required. Default: false. */
-  required?: boolean;
-  /** Default value if not provided. */
-  default?: string;
-  /** Human-readable description of the parameter. */
-  description?: string;
-}
-
-/** A reusable custom step definition stored in .relay/steps.yaml. */
-export interface CustomStepDefinition {
-  /** Parameters that can be passed when using this step. */
-  params?: CustomStepParam[];
-  /** Step type: "deterministic" or "worktree". */
-  type?: 'deterministic' | 'worktree';
-  /** Shell command to execute (for deterministic steps). Supports {{param}} interpolation. */
-  command?: string;
-  /** Branch name (for worktree steps). Supports {{param}} interpolation. */
-  branch?: string;
-  /** Base branch (for worktree steps). */
-  baseBranch?: string;
-  /** Worktree path (for worktree steps). */
-  path?: string;
-  /** Create branch if missing (for worktree steps). */
-  createBranch?: boolean;
-  /** Fail if command exit code is non-zero. Default: true. */
-  failOnError?: boolean;
-  /** Capture stdout as step output. Default: true. */
-  captureOutput?: boolean;
-  /** Timeout in milliseconds. */
-  timeoutMs?: number;
-  /** Human-readable description of this step. */
-  description?: string;
-}
-
-/** Configuration file for custom step definitions (.relay/steps.yaml). */
-export interface CustomStepsConfig {
-  /** Map of step name to step definition. */
-  steps: Record<string, CustomStepDefinition>;
-}
-
-/** Diagnostic output captured after a verification failure analysis run. */
-export interface DiagnosticResult {
-  agentName: string;
-  analysis: string;
-  durationMs: number;
-  tokens?: {
-    input: number;
-    output: number;
-  };
-}
-
-// ── Completion evidence ─────────────────────────────────────────────────────
-
-export type CompletionEvidenceSignalSource =
-  | 'channel'
-  | 'stdout'
-  | 'stderr'
-  | 'process'
-  | 'filesystem'
-  | 'tool'
-  | 'verification';
-
-export type CompletionEvidenceSignalKind =
-  | 'worker_done'
-  | 'lead_done'
-  | 'step_complete'
-  | 'owner_decision'
-  | 'review_decision'
-  | 'task_summary'
-  | 'verification_passed'
-  | 'verification_failed'
-  | 'process_exit'
-  | 'custom';
-
-export interface CompletionEvidenceSignal {
-  kind: CompletionEvidenceSignalKind;
-  source: CompletionEvidenceSignalSource;
-  text: string;
-  observedAt: string;
-  sender?: string;
-  actor?: string;
-  role?: string;
-  value?: string;
-}
-
-export type CompletionEvidenceChannelOrigin = 'runner_post' | 'forwarded_chunk' | 'relay_message';
-
-export interface CompletionEvidenceChannelPost {
-  stepName: string;
-  text: string;
-  postedAt: string;
-  origin: CompletionEvidenceChannelOrigin;
-  completionRelevant: boolean;
-  sender?: string;
-  actor?: string;
-  role?: string;
-  target?: string;
-  signals: CompletionEvidenceSignal[];
-}
-
-export type CompletionEvidenceFileChangeKind = 'created' | 'modified' | 'deleted';
-
-export interface CompletionEvidenceFileChange {
-  path: string;
-  kind: CompletionEvidenceFileChangeKind;
-  observedAt: string;
-  root?: string;
-}
-
-export type CompletionEvidenceToolSideEffectType =
-  | 'persist_step_output'
-  | 'post_channel_message'
-  | 'verification_observed'
-  | 'worktree_created'
-  | 'owner_monitoring'
-  | 'review_started'
-  | 'review_completed'
-  | 'worker_exit'
-  | 'worker_error'
-  | 'retry'
-  | 'custom';
-
-export interface CompletionEvidenceToolSideEffect {
-  type: CompletionEvidenceToolSideEffectType;
-  detail: string;
-  observedAt: string;
-  raw?: Record<string, unknown>;
-}
-
-export interface StepCompletionEvidence {
-  stepName: string;
-  status?: WorkflowStepStatus;
-  startedAt?: string;
-  completedAt?: string;
-  lastUpdatedAt: string;
-  roots: string[];
-  output: {
-    stdout: string;
-    stderr: string;
-    combined: string;
-  };
-  channelPosts: CompletionEvidenceChannelPost[];
-  files: CompletionEvidenceFileChange[];
-  process: {
-    exitCode?: number;
-    exitSignal?: string;
-  };
-  toolSideEffects: CompletionEvidenceToolSideEffect[];
-  coordinationSignals: CompletionEvidenceSignal[];
-}
-
-export type StepCompletionMode =
-  | 'marker'
-  | 'evidence'
-  | 'verification'
-  | 'owner_decision'
-  | 'review'
-  | 'heuristic';
-
-export interface StepCompletionDecisionEvidence {
-  summary?: string;
-  signals?: string[];
-  channelPosts?: string[];
-  files?: string[];
-  exitCode?: number;
-}
-
-export interface StepCompletionDecision {
-  mode: StepCompletionMode;
-  reason?: string;
-  evidence?: StepCompletionDecisionEvidence;
-}
-
-// ── Coordination ────────────────────────────────────────────────────────────
-
-/** Coordination settings for multi-agent synchronization. */
-export interface CoordinationConfig {
-  barriers?: Barrier[];
-  votingThreshold?: number;
-  consensusStrategy?: 'majority' | 'unanimous' | 'quorum';
-}
-
-/** A synchronization barrier that gates downstream work. */
-export interface Barrier {
-  name: string;
-  waitFor: string[];
-  timeoutMs?: number;
-}
-
-// ── State management ────────────────────────────────────────────────────────
-
-/** Shared state configuration for workflows. */
-export interface StateConfig {
-  backend: 'memory' | 'redis' | 'database';
-  ttlMs?: number;
-  namespace?: string;
-}
-
-// ── Error handling ──────────────────────────────────────────────────────────
-
-/** Global error handling configuration. */
-export interface ErrorHandlingConfig {
-  strategy: 'fail-fast' | 'continue' | 'retry';
-  maxRetries?: number;
-  retryDelayMs?: number;
-  notifyChannel?: string;
-  /** Agent to use when a deterministic gate fails and needs code/workflow repair. */
-  repairAgent?: string;
-  /** Retry budget for repair agents before terminal failure. Set 0 to disable repair agents. */
-  repairRetries?: number;
-}
-
-// ── Dry-run report types ────────────────────────────────────────────────
-
-/** A single execution wave in a dry-run simulation. */
-export interface DryRunWave {
-  wave: number;
-  /** Steps in this wave. Agent is undefined for deterministic steps. */
-  steps: Array<{ name: string; agent?: string; dependsOn: string[] }>;
-}
-
-/** Report produced by a dry-run validation of a workflow config. */
-export interface DryRunReport {
-  valid: boolean;
-  errors: string[];
-  warnings: string[];
-  name: string;
-  description?: string;
-  pattern: string;
-  agents: Array<{ name: string; cli: string; role?: string; cwd?: string; stepCount: number }>;
-  permissions?: Array<{
-    agent: string;
-    access: string;
-    readPaths: number;
-    writePaths: number;
-    denyPaths: number;
-    scopes: number;
-    source: 'yaml' | 'preset' | 'dotfiles' | 'none';
-  }>;
-  waves: DryRunWave[];
-  totalSteps: number;
-  maxConcurrency?: number;
-  estimatedWaves: number;
-  /** Estimated peak concurrent agents. */
-  estimatedPeakConcurrency?: number;
-  /** Estimated total agent-steps (counting retries as additional steps). */
-  estimatedTotalAgentSteps?: number;
-}
-
-// ── Workflow execution options ───────────────────────────────────────────────
-
-/** Options that control how a workflow run executes. */
-export interface WorkflowExecuteOptions {
-  /** Start execution from a specific step, skipping all predecessor steps.
-   *  Predecessor outputs are loaded from cached step-outputs on disk when available. */
-  startFrom?: string;
-  /** Run ID of a previous execution whose cached step outputs should be used
-   *  when skipping predecessor steps via `startFrom`. If omitted, the runner
-   *  scans `.agent-relay/step-outputs/` for the most recent directory that
-   *  contains the needed step files. */
-  previousRunId?: string;
-}
-
-// ── Database row types ──────────────────────────────────────────────────────
-
-export type WorkflowRunStatus = 'pending' | 'running' | 'completed' | 'failed' | 'cancelled';
-
-/** Database row representing a workflow run. */
-export interface WorkflowRunRow {
-  id: string;
-  workspaceId: string;
-  workflowName: string;
-  pattern: SwarmPattern;
-  status: WorkflowRunStatus;
-  config: RelayYamlConfig;
-  stateSnapshot?: Record<string, unknown>;
-  startedAt: string;
-  completedAt?: string;
-  error?: string;
-  createdAt: string;
-  updatedAt: string;
-}
-
-export type WorkflowStepStatus = 'pending' | 'running' | 'completed' | 'failed' | 'skipped';
-export type WorkflowOwnerDecision =
-  | 'COMPLETE'
-  | 'INCOMPLETE_RETRY'
-  | 'INCOMPLETE_FAIL'
-  | 'NEEDS_CLARIFICATION';
-/**
- * Completion reasons are recorded for both successful and failed steps.
- * `retry_requested_by_owner` is a retry-control signal, not a success state:
- * the runner retries while budget remains and fails the step once retries are exhausted.
- */
-export type WorkflowStepCompletionReason =
-  | 'completed_verified'
-  | 'completed_by_owner_decision'
-  | 'completed_by_evidence'
-  | 'completed_by_process_exit'
-  | 'retry_requested_by_owner'
-  | 'failed_verification'
-  | 'failed_verification_with_diagnostic'
-  | 'failed_owner_decision'
-  | 'failed_no_evidence';
-
-/** Database row representing a single workflow step execution. */
-export interface WorkflowStepRow {
-  id: string;
-  runId: string;
-  stepName: string;
-  /** Agent name for agent steps, null for deterministic/worktree steps. */
-  agentName: string | null;
-  /** Step type: agent, deterministic, or worktree. */
-  stepType: WorkflowStepType;
-  status: WorkflowStepStatus;
-  /** Task description for agent steps, command for deterministic steps, branch for worktree steps. */
-  task: string;
-  dependsOn: string[];
-  output?: string;
-  error?: string;
-  completionReason?: WorkflowStepCompletionReason;
-  startedAt?: string;
-  completedAt?: string;
-  retryCount: number;
-  createdAt: string;
-  updatedAt: string;
-}
-
-// ── ProcessBackend: cloud-injected execution environment ─────────────────────
-//
-// Relay owns command construction, auth env, cwd, timeout, and step lifecycle.
-// The backend owns execution environments (create VM, run command, destroy VM).
-// uploadFile is reserved for future file asset staging; current executors run
-// commands directly with env/cwd/timeout passed through exec options.
-
-/** Backend for creating isolated execution environments (e.g. Daytona sandboxes). */
-export interface ProcessBackend {
-  /** Create an isolated execution environment. */
-  createEnvironment(label: string): Promise<ProcessEnvironment>;
-}
-
-/** An isolated execution environment provisioned by a ProcessBackend. */
-export interface ProcessEnvironment {
-  /** Unique identifier for this environment. */
-  id: string;
-  /** Home directory inside the environment. */
-  homeDir: string;
-  /** Execute a shell command in the environment. */
-  exec(
-    command: string,
-    opts?: { cwd?: string; env?: Record<string, string>; timeoutSeconds?: number }
-  ): Promise<{ output: string; exitCode: number }>;
-  /** Upload a file into the environment. */
-  uploadFile(content: string | Buffer, remotePath: string): Promise<void>;
-  /** Tear down the environment and release resources. */
-  destroy(): Promise<void>;
-}
diff --git a/packages/sdk/src/workflows/validator.ts b/packages/sdk/src/workflows/validator.ts
deleted file mode 100644
index 3ebd9b46b..000000000
--- a/packages/sdk/src/workflows/validator.ts
+++ /dev/null
@@ -1,215 +0,0 @@
-import type { RelayYamlConfig, AgentDefinition, WorkflowStep } from './types.js';
-import { CodexModels } from '@agent-relay/config';
-
-export interface ValidationIssue {
-  severity: 'error' | 'warning' | 'info';
-  code: string;
-  message: string;
-  fix?: string;
-  location?: string; // e.g. "step:analyze" or "agent:analyst"
-}
-
-const CHANNEL_NAME_RE = /^[a-z0-9][a-z0-9-]*$/;
-
-export function validateWorkflow(config: RelayYamlConfig): ValidationIssue[] {
-  const issues: ValidationIssue[] = [];
-
-  // Validate channel name format (must be lowercase alphanumeric + hyphens)
-  const channel = (config as any).swarm?.channel ?? (config as any).channel;
-  if (channel && !CHANNEL_NAME_RE.test(channel)) {
-    issues.push({
-      severity: 'error',
-      code: 'INVALID_CHANNEL_NAME',
-      message: `Channel name "${channel}" is invalid. Must be lowercase alphanumeric and hyphens, starting with a letter or number.`,
-      fix: `Use .toLowerCase().replace(/[^a-z0-9-]/g, '-').replace(/-+/g, '-').replace(/^-|-$/g, '') on the channel name.`,
-      location: 'swarm:channel',
-    });
-  }
-
-  const agentMap = new Map(config.agents.map((a) => [a.name, a]));
-  const hasReviewerAgent = config.agents.some((a) => {
-    const role = a.role?.toLowerCase() ?? '';
-    const name = a.name.toLowerCase();
-    return (
-      a.preset === 'reviewer' ||
-      role.includes('review') ||
-      role.includes('critic') ||
-      role.includes('verifier') ||
-      role.includes('qa') ||
-      name.includes('review')
-    );
-  });
-
-  for (const workflow of config.workflows ?? []) {
-    const hasInteractiveAgentSteps = workflow.steps.some((step) => {
-      if (step.type === 'deterministic' || step.type === 'worktree') return false;
-      if (!step.agent) return false;
-      const raw = agentMap.get(step.agent);
-      if (!raw) return false;
-      return resolveForValidation(raw).interactive !== false;
-    });
-    if (hasInteractiveAgentSteps && !hasReviewerAgent) {
-      issues.push({
-        severity: 'warning',
-        code: 'NO_REVIEW_AGENT',
-        message: `Workflow "${workflow.name}" has interactive agent steps but no obvious reviewer agent. The runner can auto-fallback, but dedicated reviewers improve step hardening.`,
-        fix: `Add an agent with role/preset like \`reviewer\`, \`critic\`, or \`verifier\`.`,
-        location: `workflow:${workflow.name}`,
-      });
-    }
-
-    for (const step of workflow.steps ?? []) {
-      if (step.type === 'deterministic' || step.type === 'worktree') continue;
-      if (!step.agent) continue;
-
-      const rawDef = agentMap.get(step.agent);
-      if (!rawDef) {
-        issues.push({
-          severity: 'error',
-          code: 'UNKNOWN_AGENT',
-          message: `Step "${step.name}" references unknown agent "${step.agent}"`,
-          location: `step:${step.name}`,
-        });
-        continue;
-      }
-
-      // Resolve preset
-      const def = resolveForValidation(rawDef);
-      const task = step.task ?? '';
-
-      // Check 1: step chaining on interactive agent
-      if (def.interactive !== false && /\{\{steps\.[^}]+\}\}/.test(task)) {
-        issues.push({
-          severity: 'warning',
-          code: 'CHAIN_ON_INTERACTIVE',
-          message: `Step "${step.name}" uses {{steps.X.output}} but agent "${step.agent}" is interactive. PTY output includes TUI chrome — step chaining will receive raw terminal output.`,
-          fix: `Add \`interactive: false\` to agent "${step.agent}", or use \`preset: worker\` / \`preset: reviewer\`.`,
-          location: `step:${step.name}`,
-        });
-      }
-
-      // Check 2: interactive codex missing /exit in task
-      if (def.interactive !== false && def.cli === 'codex' && !task.includes('/exit')) {
-        issues.push({
-          severity: 'warning',
-          code: 'CODEX_NO_EXIT',
-          message: `Step "${step.name}" uses interactive codex but the task has no /exit instruction. Interactive codex may hang indefinitely.`,
-          fix: `End the task with an explicit /exit example:\n  When done, output:\n  TASK_COMPLETE\n  /exit`,
-          location: `step:${step.name}`,
-        });
-      }
-
-      // Check 3: interactive agent with no sub-agent guardrail on complex tasks
-      if (
-        def.interactive !== false &&
-        def.cli === 'claude' &&
-        task.length > 500 &&
-        !task.includes('do not') &&
-        !task.includes('Do NOT') &&
-        !task.includes('mcp__relaycast__add_agent') &&
-        !task.includes('add_agent')
-      ) {
-        issues.push({
-          severity: 'info',
-          code: 'CLAUDE_NO_SPAWN_GUARD',
-          message: `Step "${step.name}" uses interactive claude with a long task. Claude may spontaneously spawn sub-agents via relay MCP tools.`,
-          fix: `Add "Do NOT use mcp__relaycast__add_agent or add_agent to spawn sub-agents." to the task, or use \`interactive: false\`.`,
-          location: `step:${step.name}`,
-        });
-      }
-
-      // Check 4: codex-spark cannot be used in non-interactive mode
-      const CODEX_SPARK_MODELS: string[] = [CodexModels.GPT_5_3_CODEX_SPARK];
-      if (
-        def.interactive === false &&
-        def.cli === 'codex' &&
-        def.constraints?.model &&
-        (CODEX_SPARK_MODELS.includes(def.constraints.model) || /codex-spark/i.test(def.constraints.model))
-      ) {
-        issues.push({
-          severity: 'error',
-          code: 'CODEX_SPARK_NON_INTERACTIVE',
-          message: `Agent "${step.agent}" uses codex-spark model in non-interactive mode. Codex Spark does not support non-interactive (headless) execution.`,
-          fix: `Switch to a different model (e.g. gpt-5.3-codex) or set the agent to interactive mode.`,
-          location: `step:${step.name}`,
-        });
-      }
-
-      // Check 5: non-interactive agent that references relay messaging tools in task
-      if (
-        def.interactive === false &&
-        (task.includes('mcp__relaycast__send_dm') ||
-          task.includes('mcp__relaycast__post_message') ||
-          task.includes('mcp__relaycast__check_inbox'))
-      ) {
-        issues.push({
-          severity: 'warning',
-          code: 'NONINTERACTIVE_RELAY',
-          message: `Step "${step.name}" has \`interactive: false\` but the task mentions relay tools. Non-interactive agents cannot use relay MCP tools.`,
-          fix: `Remove relay tool calls from the task, or set the agent to interactive.`,
-          location: `step:${step.name}`,
-        });
-      }
-    }
-
-    // Check 6: maxConcurrency vs interactive agent count
-    const interactiveSteps = (workflow.steps ?? []).filter((s) => {
-      if (s.type === 'deterministic') return false;
-      const def = agentMap.get(s.agent ?? '');
-      return def && resolveForValidation(def).interactive !== false;
-    });
-    const maxConc = config.swarm.maxConcurrency ?? 10;
-    if (interactiveSteps.length > 4 && maxConc > 4) {
-      issues.push({
-        severity: 'warning',
-        code: 'HIGH_CONCURRENCY',
-        message: `Workflow "${workflow.name}" has ${interactiveSteps.length} interactive steps with maxConcurrency: ${maxConc}. Spawning many interactive PTY agents simultaneously can saturate the broker and cause spawn timeouts.`,
-        fix: `Set \`maxConcurrency: 3\` or lower, or convert implementation agents to \`interactive: false\`.`,
-        location: `workflow:${workflow.name}`,
-      });
-    }
-  }
-
-  return issues;
-}
-
-function resolveForValidation(def: AgentDefinition): AgentDefinition {
-  if (!def.preset) return def;
-  const nonInteractive = ['worker', 'reviewer', 'analyst'];
-  if (nonInteractive.includes(def.preset) && def.interactive === undefined) {
-    return { ...def, interactive: false };
-  }
-  return def;
-}
-
-export function formatValidationReport(issues: ValidationIssue[], yamlPath: string): string {
-  const errors = issues.filter((i) => i.severity === 'error');
-  const warnings = issues.filter((i) => i.severity === 'warning');
-  const infos = issues.filter((i) => i.severity === 'info');
-
-  const lines: string[] = [`Validating ${yamlPath}...`, ''];
-
-  if (issues.length === 0) {
-    lines.push('No issues found');
-    return lines.join('\n');
-  }
-
-  const icon: Record<string, string> = { error: 'ERROR', warning: 'WARN', info: 'INFO' };
-
-  for (const issue of issues) {
-    const loc = issue.location ? ` [${issue.location}]` : '';
-    lines.push(`${icon[issue.severity]} ${issue.message}${loc}`);
-    if (issue.fix) {
-      lines.push(`  -> ${issue.fix}`);
-    }
-    lines.push('');
-  }
-
-  const summary: string[] = [];
-  if (errors.length) summary.push(`${errors.length} error${errors.length > 1 ? 's' : ''}`);
-  if (warnings.length) summary.push(`${warnings.length} warning${warnings.length > 1 ? 's' : ''}`);
-  if (infos.length) summary.push(`${infos.length} info`);
-  lines.push(summary.join(', '));
-
-  return lines.join('\n');
-}
diff --git a/packages/sdk/src/workflows/verification.ts b/packages/sdk/src/workflows/verification.ts
deleted file mode 100644
index dc488a499..000000000
--- a/packages/sdk/src/workflows/verification.ts
+++ /dev/null
@@ -1,324 +0,0 @@
-import { execSync } from 'node:child_process';
-import { existsSync } from 'node:fs';
-import path from 'node:path';
-
-import type {
-  CompletionEvidenceSignal,
-  CompletionEvidenceToolSideEffect,
-  VerificationCheck,
-  WorkflowStepCompletionReason,
-} from './types.js';
-
-export type { VerificationCheck } from './types.js';
-
-export interface VerificationResult {
-  passed: boolean;
-  completionReason?: WorkflowStepCompletionReason;
-  error?: string;
-}
-
-export interface VerificationOptions {
-  allowFailure?: boolean;
-  completionMarkerFound?: boolean;
-  cwd?: string;
-}
-
-export class WorkflowCompletionError extends Error {
-  completionReason?: WorkflowStepCompletionReason;
-
-  constructor(message: string, completionReason?: WorkflowStepCompletionReason) {
-    super(message);
-    this.name = 'WorkflowCompletionError';
-    this.completionReason = completionReason;
-  }
-}
-
-export interface VerificationSideEffects {
-  recordStepToolSideEffect?: (
-    stepName: string,
-    effect: Omit<CompletionEvidenceToolSideEffect, 'observedAt'> & { observedAt?: string }
-  ) => void;
-  getOrCreateStepEvidenceRecord?: (stepName: string) => {
-    evidence: { coordinationSignals: CompletionEvidenceSignal[] };
-  };
-  log?: (message: string) => void;
-}
-
-export function runVerification(
-  check: VerificationCheck,
-  output: string,
-  stepName: string,
-  injectedTaskText?: string,
-  options: VerificationOptions = {},
-  sideEffects: VerificationSideEffects = {}
-): VerificationResult {
-  const cwd = options.cwd ?? process.cwd();
-
-  const fail = (message: string): VerificationResult => {
-    const observedAt = new Date().toISOString();
-    sideEffects.recordStepToolSideEffect?.(stepName, {
-      type: 'verification_observed',
-      detail: message,
-      observedAt,
-      raw: { passed: false, type: check.type, value: check.value },
-    });
-    sideEffects.getOrCreateStepEvidenceRecord?.(stepName).evidence.coordinationSignals.push({
-      kind: 'verification_failed',
-      source: 'verification',
-      text: message,
-      observedAt,
-      value: check.value,
-    });
-
-    if (options.allowFailure) {
-      return {
-        passed: false,
-        completionReason: 'failed_verification',
-        error: message,
-      };
-    }
-
-    throw new WorkflowCompletionError(message, 'failed_verification');
-  };
-
-  switch (check.type) {
-    case 'output_contains': {
-      const token = check.value;
-      if (!checkOutputContains(output, token, injectedTaskText)) {
-        return fail(`Verification failed for "${stepName}": output does not contain "${token}"`);
-      }
-      break;
-    }
-
-    case 'exit_code':
-      if (!checkExitCode(check.value)) {
-        return fail(`Verification failed for "${stepName}": exit code did not match "${check.value}"`);
-      }
-      break;
-
-    case 'file_exists':
-      if (!checkFileExists(check.value, cwd)) {
-        return fail(`Verification failed for "${stepName}": file "${check.value}" does not exist`);
-      }
-      break;
-
-    case 'custom': {
-      if (check.value) {
-        const result = execCustomVerification(check.value, cwd, check.timeoutMs);
-        if (!result.passed) {
-          return fail(
-            'Verification failed for "' +
-              stepName +
-              '": custom check "' +
-              check.value +
-              '" failed\n' +
-              result.output
-          );
-        }
-      } else {
-        // No command provided — preserved legacy no-op behavior
-        return { passed: false };
-      }
-      break;
-    }
-
-    case 'pr_url': {
-      const found = findPrUrl(output, check.value, injectedTaskText);
-      if (!found) {
-        const repoQualifier = check.value ? ` for repository "${check.value}"` : '';
-        return fail(
-          `Verification failed for "${stepName}": step output does not contain a GitHub PR URL${repoQualifier}. ` +
-            `Workers must open a pull request and include the URL in their output before reporting completion.`
-        );
-      }
-      break;
-    }
-
-    default:
-      break;
-  }
-
-  if (options.completionMarkerFound === false) {
-    sideEffects.log?.(
-      `[${stepName}] Verification passed without legacy STEP_COMPLETE marker; allowing completion`
-    );
-  }
-
-  const observedAt = new Date().toISOString();
-  const successMessage =
-    options.completionMarkerFound === false
-      ? 'Verification passed without legacy STEP_COMPLETE marker'
-      : 'Verification passed';
-  sideEffects.recordStepToolSideEffect?.(stepName, {
-    type: 'verification_observed',
-    detail: successMessage,
-    observedAt,
-    raw: { passed: true, type: check.type, value: check.value },
-  });
-  sideEffects.getOrCreateStepEvidenceRecord?.(stepName).evidence.coordinationSignals.push({
-    kind: 'verification_passed',
-    source: 'verification',
-    text: successMessage,
-    observedAt,
-    value: check.value,
-  });
-
-  return {
-    passed: true,
-    completionReason: 'completed_verified',
-  };
-}
-
-export function stripInjectedTaskEcho(output: string, injectedTaskText?: string): string {
-  if (!injectedTaskText) {
-    return output;
-  }
-
-  const candidates = [
-    injectedTaskText,
-    injectedTaskText.replace(/\r\n/g, '\n'),
-    injectedTaskText.replace(/\n/g, '\r\n'),
-  ].filter((candidate, index, all) => candidate.length > 0 && all.indexOf(candidate) === index);
-
-  for (const candidate of candidates) {
-    const start = output.indexOf(candidate);
-    if (start !== -1) {
-      return output.slice(0, start) + output.slice(start + candidate.length);
-    }
-  }
-
-  return output;
-}
-
-export function checkExitCode(_expectedExitCode: string): boolean {
-  // Existing runner semantics treat process success as established before this
-  // verification hook runs, so this check is currently an unconditional pass.
-  return true;
-}
-
-export function checkOutputContains(output: string, token: string, injectedTaskText?: string): boolean {
-  if (!token) {
-    return false;
-  }
-  return stripInjectedTaskEcho(output, injectedTaskText).includes(token);
-}
-
-const PR_URL_PATTERN = /https?:\/\/github\.com\/([\w.-]+)\/([\w.-]+)\/pull\/(\d+)\b/gi;
-
-/**
- * Returns the first GitHub PR URL found in {@link output}. When
- * {@link repoQualifier} is non-empty (format: `<owner>/<repo>`, case
- * insensitive), only URLs belonging to that repository are accepted.
- *
- * Use via `verification: { type: 'pr_url', value: 'owner/repo' }` to require
- * a step to publish a pull request before completing. The check exists so
- * workflow runners can refuse `OWNER_DECISION: COMPLETE` from workers that
- * shipped code locally but never opened a PR.
- */
-export function findPrUrl(output: string, repoQualifier?: string, injectedTaskText?: string): string | null {
-  const sanitized = stripInjectedTaskEcho(output, injectedTaskText);
-  const qualifier = repoQualifier?.trim().toLowerCase();
-  PR_URL_PATTERN.lastIndex = 0;
-  let match: RegExpExecArray | null;
-  while ((match = PR_URL_PATTERN.exec(sanitized))) {
-    if (!qualifier) {
-      return match[0];
-    }
-    const owner = match[1]?.toLowerCase();
-    const repo = match[2]?.toLowerCase();
-    if (`${owner}/${repo}` === qualifier) {
-      return match[0];
-    }
-  }
-  return null;
-}
-
-const DEFAULT_CUSTOM_VERIFY_TIMEOUT_MS = parseInt(process.env.CUSTOM_VERIFY_TIMEOUT_MS ?? '30000', 10);
-
-const REGEX_PREFIX = 'regex:';
-
-export function execCustomVerification(
-  command: string,
-  cwd: string,
-  timeoutMs = DEFAULT_CUSTOM_VERIFY_TIMEOUT_MS
-): { passed: boolean; output: string } {
-  try {
-    const stdout = execSync(command, {
-      cwd,
-      timeout: timeoutMs,
-      killSignal: 'SIGKILL',
-      stdio: ['ignore', 'pipe', 'pipe'],
-      encoding: 'utf-8',
-    });
-    return { passed: true, output: stdout.trim() };
-  } catch (error) {
-    const execError = error as Error & {
-      stdout?: string | Buffer;
-      stderr?: string | Buffer;
-    };
-    const stdout =
-      typeof execError.stdout === 'string' ? execError.stdout : (execError.stdout?.toString('utf-8') ?? '');
-    const stderr =
-      typeof execError.stderr === 'string' ? execError.stderr : (execError.stderr?.toString('utf-8') ?? '');
-    const combinedOutput = [stdout, stderr]
-      .filter((chunk) => chunk.length > 0)
-      .join('\n')
-      .trim();
-    const truncated = combinedOutput.length > 2000 ? combinedOutput.slice(-2000) : combinedOutput;
-    return {
-      passed: false,
-      output: truncated || execError.message,
-    };
-  }
-}
-
-export function checkCustom(
-  value: string,
-  output: string,
-  cwd = process.cwd()
-): { passed: boolean; stdout?: string; error?: string } {
-  // Regex shorthand: "regex:<pattern>"
-  if (value.startsWith(REGEX_PREFIX)) {
-    const pattern = value.slice(REGEX_PREFIX.length);
-    try {
-      const re = new RegExp(pattern);
-      const matched = re.test(output);
-      return matched
-        ? { passed: true }
-        : { passed: false, error: `output did not match pattern /${pattern}/` };
-    } catch (err) {
-      return { passed: false, error: `invalid regex: ${(err as Error).message}` };
-    }
-  }
-
-  // Shell command: execute value with STEP_OUTPUT env var
-  try {
-    const result = execSync(value, {
-      cwd,
-      env: { ...process.env, STEP_OUTPUT: output },
-      timeout: DEFAULT_CUSTOM_VERIFY_TIMEOUT_MS,
-      stdio: ['pipe', 'pipe', 'pipe'],
-      maxBuffer: 1024 * 1024,
-    });
-    return { passed: true, stdout: result.toString('utf-8').trim() };
-  } catch (err) {
-    const message = (err as { stderr?: Buffer })?.stderr?.toString('utf-8')?.trim() || (err as Error).message;
-    return { passed: false, error: message };
-  }
-}
-
-export function checkFileExists(filePath: string, cwd = process.cwd()): boolean {
-  const normalizedCwd = path.resolve(cwd);
-  const resolved = path.isAbsolute(filePath) ? path.resolve(filePath) : path.resolve(normalizedCwd, filePath);
-
-  // Relative artifact paths stay scoped to the workflow cwd; absolute paths
-  // are already explicit and are allowed for temp/output artifacts.
-  if (
-    !path.isAbsolute(filePath) &&
-    !resolved.startsWith(normalizedCwd + path.sep) &&
-    resolved !== normalizedCwd
-  ) {
-    return false;
-  }
-  return existsSync(resolved);
-}
diff --git a/packages/sdk/tsconfig.build.json b/packages/sdk/tsconfig.build.json
index 6cf7d0bce..10b9b2524 100644
--- a/packages/sdk/tsconfig.build.json
+++ b/packages/sdk/tsconfig.build.json
@@ -9,11 +9,8 @@
       "@agent-relay/config/*": ["../config/dist/*"],
       "@agent-relay/cloud": ["../cloud/dist/index.d.ts"],
       "@agent-relay/cloud/*": ["../cloud/dist/*"],
-      "@agent-relay/workflow-types": ["../workflow-types/dist/index.d.ts"],
       "@agent-relay/github-primitive": ["../github-primitive/dist/index.d.ts"],
-      "@agent-relay/github-primitive/workflow-step": ["../github-primitive/dist/workflow-step.d.ts"],
-      "@agent-relay/slack-primitive": ["../slack-primitive/dist/index.d.ts"],
-      "@agent-relay/slack-primitive/workflow-step": ["../slack-primitive/dist/workflow-step.d.ts"]
+      "@agent-relay/slack-primitive": ["../slack-primitive/dist/index.d.ts"]
     },
     "strict": true,
     "declaration": true,
diff --git a/packages/sdk/tsconfig.json b/packages/sdk/tsconfig.json
index aa1075d3e..71f4e4709 100644
--- a/packages/sdk/tsconfig.json
+++ b/packages/sdk/tsconfig.json
@@ -7,11 +7,9 @@
       "@agent-relay/config": ["../config/src/index.ts"],
       "@agent-relay/config/*": ["../config/src/*"],
       "@agent-relay/cloud": ["../cloud/src/index.ts"],
-      "@agent-relay/workflow-types": ["../workflow-types/src/index.ts"],
+      "@agent-relay/cloud/*": ["../cloud/src/*"],
       "@agent-relay/github-primitive": ["../github-primitive/src/index.ts"],
-      "@agent-relay/github-primitive/workflow-step": ["../github-primitive/src/workflow-step.ts"],
-      "@agent-relay/slack-primitive": ["../slack-primitive/src/index.ts"],
-      "@agent-relay/slack-primitive/workflow-step": ["../slack-primitive/src/workflow-step.ts"]
+      "@agent-relay/slack-primitive": ["../slack-primitive/src/index.ts"]
     },
     "noEmit": true
   },
diff --git a/packages/sdk/vitest.config.ts b/packages/sdk/vitest.config.ts
index 3b849ed07..dc1a3db64 100644
--- a/packages/sdk/vitest.config.ts
+++ b/packages/sdk/vitest.config.ts
@@ -4,11 +4,7 @@ export default defineConfig({
   test: {
     globals: true,
     environment: 'node',
-    include: [
-      'src/__tests__/**/*.test.ts',
-      'src/workflows/__tests__/**/*.test.ts',
-      'src/provisioner/__tests__/presets.test.ts',
-    ],
+    include: ['src/__tests__/**/*.test.ts'],
     exclude: ['src/__tests__/unit.test.ts'],
   },
 });
diff --git a/packages/slack-primitive/examples/notify-on-pr.ts b/packages/slack-primitive/examples/notify-on-pr.ts
deleted file mode 100644
index e0f757c20..000000000
--- a/packages/slack-primitive/examples/notify-on-pr.ts
+++ /dev/null
@@ -1,93 +0,0 @@
-import { WorkflowRunner, type RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { GitHubStepExecutor, createGitHubStep } from '@agent-relay/github-primitive/workflow-step';
-import type { AgentDefinition, RunnerStepExecutor, WorkflowStep } from '@agent-relay/workflow-types';
-
-import { SlackStepExecutor, createSlackStep } from '../src/workflow-step.js';
-
-const repo = process.env.GITHUB_REPO ?? 'AgentWorkforce/scratch';
-const baseBranch = process.env.GITHUB_BASE_BRANCH ?? 'main';
-const branchName = process.env.GITHUB_BRANCH_OVERRIDE ?? `examples/slack-primitive-${Date.now()}`;
-const slackChannel = process.env.SLACK_CHANNEL ?? '#engineering';
-
-const slackExecutor = new SlackStepExecutor({
-  token: process.env.SLACK_BOT_TOKEN,
-});
-const githubExecutor = new GitHubStepExecutor();
-
-const localExecutor: RunnerStepExecutor = {
-  executeAgentStep(
-    _step: WorkflowStep,
-    _agentDef: AgentDefinition,
-    _resolvedTask: string,
-    _timeoutMs?: number
-  ): Promise<string> {
-    return Promise.reject(new Error('notify-on-pr only uses integration steps.'));
-  },
-  async executeIntegrationStep(
-    step: WorkflowStep,
-    resolvedParams: Record<string, string>,
-    context: { workspaceId?: string }
-  ): Promise<{ output: string; success: boolean }> {
-    if (step.integration === 'github') {
-      return githubExecutor.executeIntegrationStep(step, resolvedParams, context);
-    }
-    if (step.integration === 'slack') {
-      return slackExecutor.executeIntegrationStep(step, resolvedParams);
-    }
-    return {
-      success: false,
-      output: `Unsupported integration "${step.integration ?? 'unknown'}"`,
-    };
-  },
-};
-
-const config: RelayYamlConfig = {
-  version: '1.0',
-  name: 'notify-on-pr',
-  description: 'Open a GitHub pull request and announce it in Slack.',
-  swarm: { pattern: 'pipeline' },
-  agents: [],
-  workflows: [
-    {
-      name: 'notify-on-pr',
-      steps: [
-        createGitHubStep({
-          name: 'create-pr',
-          action: 'createPR',
-          repo,
-          params: {
-            title: `examples: slack primitive notification (${branchName})`,
-            body: 'Opened by packages/slack-primitive/examples/notify-on-pr.ts.',
-            base: baseBranch,
-            head: branchName,
-            draft: true,
-          },
-          output: {
-            mode: 'data',
-            format: 'json',
-          },
-        }),
-        createSlackStep({
-          name: 'announce-pr',
-          dependsOn: ['create-pr'],
-          action: 'postMessage',
-          channel: slackChannel,
-          text: 'PR opened: {{steps.create-pr.output.htmlUrl}}',
-          unfurl: true,
-          output: {
-            mode: 'summary',
-            format: 'json',
-            pretty: true,
-          },
-        }),
-      ],
-    },
-  ],
-};
-
-const runner = new WorkflowRunner({
-  cwd: process.cwd(),
-  executor: localExecutor,
-});
-
-await runner.execute(config);
diff --git a/packages/slack-primitive/package.json b/packages/slack-primitive/package.json
index 867c93697..43012c9a3 100644
--- a/packages/slack-primitive/package.json
+++ b/packages/slack-primitive/package.json
@@ -10,11 +10,6 @@
       "types": "./dist/index.d.ts",
       "import": "./dist/index.js",
       "default": "./dist/index.js"
-    },
-    "./workflow-step": {
-      "types": "./dist/workflow-step.d.ts",
-      "import": "./dist/workflow-step.js",
-      "default": "./dist/workflow-step.js"
     }
   },
   "files": [
@@ -30,7 +25,6 @@
     "typecheck:examples": "tsc -p tsconfig.examples.json --noEmit"
   },
   "dependencies": {
-    "@agent-relay/workflow-types": "7.1.1",
     "@slack/web-api": "^7.16.0"
   },
   "devDependencies": {
diff --git a/packages/slack-primitive/src/__tests__/post-message.test.ts b/packages/slack-primitive/src/__tests__/post-message.test.ts
index 572ebb217..15f074d61 100644
--- a/packages/slack-primitive/src/__tests__/post-message.test.ts
+++ b/packages/slack-primitive/src/__tests__/post-message.test.ts
@@ -4,7 +4,6 @@ import { postMessage } from '../actions/post-message.js';
 import { resolveChannel } from '../actions/resolve-channel.js';
 import { SlackWebApiClient } from '../local-runtime.js';
 import { SlackPostBackError, type SlackWebApiLike } from '../types.js';
-import { renderSlackTemplates } from '../workflow-step.js';
 
 describe('Slack primitive', () => {
   afterEach(() => {
@@ -84,20 +83,6 @@ describe('Slack primitive', () => {
       })
     ).rejects.toThrow('provide channel or set SLACK_DEFAULT_CHANNEL');
   });
-
-  it('substitutes {{steps.X.output}} templates by nested path', () => {
-    const text = renderSlackTemplates('Opened {{steps.create-pr.output.htmlUrl}}', {
-      steps: {
-        'create-pr': {
-          output: {
-            htmlUrl: 'https://github.test/octo/repo/pull/7',
-          },
-        },
-      },
-    });
-
-    expect(text).toBe('Opened https://github.test/octo/repo/pull/7');
-  });
 });
 
 interface RecordingSlack extends SlackWebApiLike {
diff --git a/packages/slack-primitive/src/__tests__/workflow-step.test.ts b/packages/slack-primitive/src/__tests__/workflow-step.test.ts
deleted file mode 100644
index 6d1fc0368..000000000
--- a/packages/slack-primitive/src/__tests__/workflow-step.test.ts
+++ /dev/null
@@ -1,55 +0,0 @@
-import { describe, expect, it } from 'vitest';
-
-import { SlackAction, type SlackActionResult } from '../types.js';
-import {
-  SlackStepExecutor,
-  slackStepConfigFromWorkflowStep,
-  type SlackStepConfig,
-} from '../workflow-step.js';
-import type { SlackClient } from '../client.js';
-
-describe('SlackStepExecutor', () => {
-  it('keeps numeric-looking threadTs as a string after workflow param resolution', () => {
-    const config = slackStepConfigFromWorkflowStep(
-      {
-        name: 'announce',
-        type: 'integration',
-        integration: 'slack',
-        action: 'postMessage',
-      },
-      {
-        text: 'PR opened',
-        threadTs: '1715273540.123456',
-        unfurl: 'true',
-        mentions: '["@dev"]',
-      }
-    );
-
-    expect(config.threadTs).toBe('1715273540.123456');
-    expect(config.unfurl).toBe(true);
-    expect(config.mentions).toEqual(['@dev']);
-  });
-
-  it('surfaces the real error for failed default data-mode steps', async () => {
-    const executor = new SlackStepExecutor();
-    const client = {
-      executeAction: async (): Promise<SlackActionResult> => ({
-        success: false,
-        output: '',
-        error: 'channel_not_found',
-      }),
-    } as unknown as SlackClient;
-
-    const result = await executor.execute(
-      {
-        name: 'announce',
-        action: SlackAction.PostMessage,
-        channel: '#missing',
-        text: 'PR opened',
-      } satisfies SlackStepConfig,
-      { client }
-    );
-
-    expect(result.output).toBe('"channel_not_found"');
-  });
-});
diff --git a/packages/slack-primitive/src/index.ts b/packages/slack-primitive/src/index.ts
index 1165fcf91..a34b3a341 100644
--- a/packages/slack-primitive/src/index.ts
+++ b/packages/slack-primitive/src/index.ts
@@ -4,7 +4,6 @@ export * from './local-runtime.js';
 export * from './cloud-relay-runtime.js';
 export * from './noop-runtime.js';
 export * from './client.js';
-export * from './workflow-step.js';
 export * from './actions/post-message.js';
 export * from './actions/resolve-user.js';
 export * from './actions/resolve-channel.js';
diff --git a/packages/slack-primitive/src/workflow-step.ts b/packages/slack-primitive/src/workflow-step.ts
deleted file mode 100644
index df8dfd118..000000000
--- a/packages/slack-primitive/src/workflow-step.ts
+++ /dev/null
@@ -1,469 +0,0 @@
-import type { RunnerStepExecutor, WorkflowStep } from '@agent-relay/workflow-types';
-
-import { SlackClient } from './client.js';
-import {
-  SlackAction,
-  SLACK_ACTIONS,
-  type PostMessageParams,
-  type SlackActionResult,
-  type SlackRuntimeConfig,
-} from './types.js';
-
-export type SlackStepOutputMode = 'data' | 'result' | 'summary' | 'raw' | 'none';
-export type SlackStepOutputFormat = 'json' | 'text';
-
-export interface SlackStepOutputConfig {
-  /** Which action result becomes the workflow step output. Defaults to "data". */
-  mode?: SlackStepOutputMode;
-  /** Emit JSON for structured chaining or text for simple downstream interpolation. Defaults to "json". */
-  format?: SlackStepOutputFormat;
-  /** Select a nested field from the projected output, e.g. "ts" or "data.channel". */
-  path?: string;
-  /** Include adapter metadata such as runtime and timing in JSON output. Defaults false. */
-  includeMetadata?: boolean;
-  /** Pretty-print JSON output. Defaults false. */
-  pretty?: boolean;
-}
-
-export interface SlackStepConfig {
-  /** Unique step name within the workflow. */
-  name: string;
-  /** Dependencies in the Relay workflow DAG. */
-  dependsOn?: string[];
-  /** Slack action to execute. Phase A supports postMessage. */
-  action: 'postMessage';
-  /** Slack channel id or #channel-name reference. Falls back to SLACK_DEFAULT_CHANNEL when omitted. */
-  channel?: string;
-  /** Message text. Values may include workflow templates such as {{steps.plan.output.title}}. */
-  text: string;
-  /** Optional parent message timestamp for threaded delivery. */
-  threadTs?: string;
-  /** User mentions to prefix when resolved. Unresolved mentions are soft warnings in output. */
-  mentions?: string[];
-  /** Slack unfurl setting for links and media. */
-  unfurl?: boolean;
-  /** Runtime settings for the local Slack Web API runtime. */
-  config?: SlackRuntimeConfig;
-  /** Controls the string captured as {{steps.<name>.output}}. */
-  output?: SlackStepOutputConfig;
-  /** Workflow step timeout in milliseconds. */
-  timeoutMs?: number;
-  /** Number of retry attempts when the workflow runner retries this integration step. */
-  retries?: number;
-}
-
-export interface SlackStepExecutionContext {
-  workspaceId?: string;
-  client?: SlackClient;
-  config?: SlackRuntimeConfig;
-}
-
-export interface SlackStepExecutionResult<TOutput = unknown> {
-  success: boolean;
-  output: string;
-  result: SlackActionResult<TOutput>;
-  error?: string;
-}
-
-export interface SlackIntegrationStepResult {
-  output: string;
-  success: boolean;
-}
-
-type ResolvedParams = Record<string, unknown>;
-
-const SLACK_INTEGRATION = 'slack';
-const RESERVED_PARAM_KEYS = new Set(['action', 'config', 'slackConfig', 'output', 'params']);
-
-/**
- * Create a Relay integration step for posting a Slack message.
- * @param config - Slack step configuration.
- * @returns Workflow integration step.
- */
-export function createSlackStep(config: SlackStepConfig): WorkflowStep {
-  validateSlackStepConfig(config);
-
-  const params: Record<string, string> = {
-    text: config.text,
-  };
-
-  if (config.channel !== undefined) params.channel = config.channel;
-  if (config.threadTs !== undefined) params.threadTs = config.threadTs;
-  if (config.mentions !== undefined) params.mentions = JSON.stringify(config.mentions);
-  if (config.unfurl !== undefined) params.unfurl = String(config.unfurl);
-  if (config.config !== undefined) params.config = JSON.stringify(config.config);
-  if (config.output !== undefined) params.output = JSON.stringify(config.output);
-
-  const step: WorkflowStep = {
-    name: config.name,
-    type: 'integration',
-    integration: SLACK_INTEGRATION,
-    action: config.action,
-    params,
-  };
-
-  if (config.dependsOn !== undefined) step.dependsOn = config.dependsOn;
-  if (config.timeoutMs !== undefined) step.timeoutMs = config.timeoutMs;
-  if (config.retries !== undefined) step.retries = config.retries;
-
-  return step;
-}
-
-export class SlackStepExecutor implements RunnerStepExecutor {
-  constructor(private readonly options: SlackRuntimeConfig = {}) {}
-
-  async executeAgentStep(): Promise<string> {
-    throw new Error('SlackStepExecutor only executes Slack integration steps.');
-  }
-
-  async execute<TOutput = unknown>(
-    config: SlackStepConfig,
-    context: SlackStepExecutionContext = {}
-  ): Promise<SlackStepExecutionResult<TOutput>> {
-    validateSlackStepConfig(config);
-
-    const runtimeConfig = mergeRuntimeConfig(this.options, context.config, config.config);
-    const client = context.client ?? new SlackClient(runtimeConfig);
-    const params = buildActionParams(config);
-    const result = await client.executeAction<TOutput>(SlackAction.PostMessage, params);
-    const output = formatStepOutput(config, result);
-
-    return {
-      success: result.success,
-      output,
-      result,
-      error: result.error,
-    };
-  }
-
-  async executeIntegrationStep(
-    step: WorkflowStep,
-    resolvedParams: Record<string, string>
-  ): Promise<SlackIntegrationStepResult> {
-    if (step.integration !== SLACK_INTEGRATION) {
-      return {
-        success: false,
-        output: `SlackStepExecutor only handles "${SLACK_INTEGRATION}" integration steps`,
-      };
-    }
-
-    try {
-      const config = slackStepConfigFromWorkflowStep(step, resolvedParams);
-      const result = await this.execute(config);
-
-      return {
-        success: result.success,
-        output: result.success ? result.output : result.output || result.error || 'Slack step failed',
-      };
-    } catch (error) {
-      return {
-        success: false,
-        output: error instanceof Error ? error.message : String(error),
-      };
-    }
-  }
-}
-
-/**
- * Rebuild a Slack step config from resolved workflow params.
- * @param step - Workflow step.
- * @param resolvedParams - Params after workflow templating.
- * @returns Slack step configuration.
- */
-export function slackStepConfigFromWorkflowStep(
-  step: WorkflowStep,
-  resolvedParams: Record<string, string>
-): SlackStepConfig {
-  const params = normalizeResolvedParams(resolvedParams);
-  const action = step.action;
-
-  if (action !== SlackAction.PostMessage) {
-    throw new Error(`Slack step "${step.name}" requires action "postMessage"`);
-  }
-
-  const config =
-    readJsonParam<SlackRuntimeConfig>(params.config ?? params.slackConfig, 'config') ?? undefined;
-  const output = readJsonParam<SlackStepOutputConfig>(params.output, 'output') ?? undefined;
-  const actionParams = readActionParams(params);
-
-  return {
-    name: step.name,
-    dependsOn: step.dependsOn,
-    action: SlackAction.PostMessage,
-    channel: readOptionalString(actionParams.channel),
-    text: readRequiredString(actionParams.text, 'text'),
-    threadTs: readOptionalString(actionParams.threadTs),
-    mentions: readStringArray(actionParams.mentions),
-    unfurl: readOptionalBoolean(actionParams.unfurl, 'unfurl'),
-    config,
-    output,
-    timeoutMs: step.timeoutMs,
-    retries: step.retries,
-  };
-}
-
-export function renderSlackTemplates(value: string, data: Record<string, unknown>): string {
-  return value.replace(
-    /\{\{\s*steps\.([A-Za-z0-9_-]+)\.output(?:\.([A-Za-z0-9_.-]+))?\s*\}\}/g,
-    (_match, step, path) => {
-      const stepData = data.steps;
-      if (!isRecord(stepData)) return '';
-      const entry = stepData[String(step)];
-      if (!isRecord(entry)) return '';
-      const output = entry.output;
-      const resolved = typeof path === 'string' && path.length > 0 ? resolvePath(output, path) : output;
-      return projectionToText(resolved);
-    }
-  );
-}
-
-function validateSlackStepConfig(config: SlackStepConfig): void {
-  if (!config.name) {
-    throw new Error('Slack step requires a non-empty name');
-  }
-  if (!SLACK_ACTIONS.includes(config.action as SlackAction)) {
-    throw new Error(`Slack step "${config.name}" uses unsupported action "${config.action}"`);
-  }
-  if (config.action !== SlackAction.PostMessage) {
-    throw new Error(`Slack step "${config.name}" requires action "postMessage"`);
-  }
-  if (typeof config.text !== 'string' || config.text.length === 0) {
-    throw new Error(`Slack step "${config.name}" requires message text`);
-  }
-}
-
-function buildActionParams(config: SlackStepConfig): PostMessageParams {
-  return {
-    channel: config.channel,
-    text: config.text,
-    threadTs: config.threadTs,
-    mentions: config.mentions,
-    unfurl: config.unfurl,
-  };
-}
-
-function readActionParams(params: ResolvedParams): Record<string, unknown> {
-  const serializedParams = params.params;
-  if (serializedParams !== undefined) {
-    const parsed = readJsonParam<Record<string, unknown>>(serializedParams, 'params');
-    if (parsed === undefined) return {};
-    if (!isRecord(parsed)) {
-      throw new Error('Slack step params.params must be a JSON object');
-    }
-    return parsed;
-  }
-
-  const actionParams: Record<string, unknown> = {};
-  for (const [key, value] of Object.entries(params)) {
-    if (RESERVED_PARAM_KEYS.has(key)) continue;
-    actionParams[key] = value;
-  }
-
-  return actionParams;
-}
-
-function mergeRuntimeConfig(...configs: Array<SlackRuntimeConfig | undefined>): SlackRuntimeConfig {
-  const merged: SlackRuntimeConfig = {};
-
-  for (const config of configs) {
-    if (!config) continue;
-    const { env, ...flatConfig } = config;
-    Object.assign(merged, flatConfig);
-    if (env) {
-      merged.env = {
-        ...merged.env,
-        ...env,
-      };
-    }
-  }
-
-  return merged;
-}
-
-function formatStepOutput<TOutput>(config: SlackStepConfig, result: SlackActionResult<TOutput>): string {
-  const outputConfig = config.output ?? {};
-  const mode = outputConfig.mode ?? 'data';
-  const format = outputConfig.format ?? 'json';
-
-  if (mode === 'none') {
-    return '';
-  }
-
-  let projection = buildOutputProjection(mode, result, outputConfig);
-
-  if (outputConfig.path) {
-    projection = resolvePath(projection, outputConfig.path);
-  }
-
-  if (format === 'text') {
-    return projectionToText(projection);
-  }
-
-  return JSON.stringify(projection, undefined, outputConfig.pretty ? 2 : undefined);
-}
-
-function buildOutputProjection<TOutput>(
-  mode: SlackStepOutputMode,
-  result: SlackActionResult<TOutput>,
-  outputConfig: SlackStepOutputConfig
-): unknown {
-  if (mode === 'raw') return result.output;
-  if (mode === 'summary') {
-    return withOptionalMetadata(summarizeResult(result), result, outputConfig);
-  }
-  if (mode === 'result') {
-    const projected: Record<string, unknown> = {
-      success: result.success,
-      output: result.output,
-    };
-    if (result.data !== undefined) projected.data = result.data;
-    if (result.error !== undefined) projected.error = result.error;
-    return withOptionalMetadata(projected, result, outputConfig);
-  }
-
-  return withOptionalMetadata(
-    result.data ?? (result.output ? result.output : (result.error ?? null)),
-    result,
-    outputConfig
-  );
-}
-
-function summarizeResult<TOutput>(result: SlackActionResult<TOutput>): Record<string, unknown> {
-  if (!result.success) {
-    return {
-      success: false,
-      error: result.error ?? 'Slack action failed',
-    };
-  }
-
-  if (isRecord(result.data)) {
-    return {
-      success: true,
-      channel: result.data.channel,
-      ts: result.data.ts,
-      unresolvedMentions: result.data.unresolvedMentions,
-    };
-  }
-
-  return {
-    success: true,
-    value: result.data ?? result.output,
-  };
-}
-
-function withOptionalMetadata<TOutput>(
-  value: unknown,
-  result: SlackActionResult<TOutput>,
-  outputConfig: SlackStepOutputConfig
-): unknown {
-  if (!outputConfig.includeMetadata || result.metadata === undefined) {
-    return value;
-  }
-
-  return {
-    value,
-    metadata: result.metadata,
-  };
-}
-
-function projectionToText(value: unknown): string {
-  if (typeof value === 'string') return value;
-  if (value === null || value === undefined) return '';
-  if (Array.isArray(value)) return value.map((entry) => projectionToText(entry)).join('\n');
-  if (isRecord(value)) {
-    if ('output' in value) return projectionToText(value.output);
-    if ('value' in value) return projectionToText(value.value);
-    if ('text' in value) return projectionToText(value.text);
-    if ('ts' in value) return projectionToText(value.ts);
-    if ('channel' in value) return projectionToText(value.channel);
-  }
-  return JSON.stringify(value);
-}
-
-function resolvePath(value: unknown, path: string): unknown {
-  if (!path) return value;
-
-  let current = value;
-  for (const segment of path.split('.')) {
-    if (Array.isArray(current) && /^\d+$/.test(segment)) {
-      current = current[Number(segment)];
-      continue;
-    }
-    if (isRecord(current)) {
-      current = current[segment];
-      continue;
-    }
-    return undefined;
-  }
-
-  return current;
-}
-
-function normalizeResolvedParams(params: Record<string, string>): ResolvedParams {
-  const normalized: ResolvedParams = {};
-  for (const [key, value] of Object.entries(params)) {
-    normalized[key] = coerceScalar(value);
-  }
-  return normalized;
-}
-
-function coerceScalar(value: unknown): unknown {
-  if (typeof value !== 'string') {
-    return value;
-  }
-
-  const trimmed = value.trim();
-  if (
-    (trimmed.startsWith('{') && trimmed.endsWith('}')) ||
-    (trimmed.startsWith('[') && trimmed.endsWith(']')) ||
-    (trimmed.startsWith('"') && trimmed.endsWith('"'))
-  ) {
-    try {
-      return JSON.parse(trimmed) as unknown;
-    } catch {
-      return value;
-    }
-  }
-
-  return value;
-}
-
-function readJsonParam<T>(value: unknown, name: string): T | undefined {
-  if (value === undefined) return undefined;
-  if (typeof value !== 'string') return value as T;
-
-  try {
-    return JSON.parse(value) as T;
-  } catch (error) {
-    throw new Error(
-      `Slack step params.${name} must be valid JSON: ${error instanceof Error ? error.message : String(error)}`
-    );
-  }
-}
-
-function readRequiredString(value: unknown, name: string): string {
-  if (typeof value === 'string' && value.length > 0) return value;
-  throw new Error(`Slack step requires ${name}`);
-}
-
-function readOptionalString(value: unknown): string | undefined {
-  return typeof value === 'string' && value.length > 0 ? value : undefined;
-}
-
-function readStringArray(value: unknown): string[] | undefined {
-  if (value === undefined) return undefined;
-  if (Array.isArray(value) && value.every((item) => typeof item === 'string')) return value;
-  throw new Error('Slack step mentions must be a string array');
-}
-
-function readOptionalBoolean(value: unknown, name: string): boolean | undefined {
-  if (value === undefined) return undefined;
-  if (typeof value === 'boolean') return value;
-  if (value === 'true') return true;
-  if (value === 'false') return false;
-  throw new Error(`Slack step ${name} must be a boolean`);
-}
-
-function isRecord(value: unknown): value is Record<string, unknown> {
-  return typeof value === 'object' && value !== null && !Array.isArray(value);
-}
diff --git a/packages/workflow-types/package.json b/packages/workflow-types/package.json
deleted file mode 100644
index 501b9d3e1..000000000
--- a/packages/workflow-types/package.json
+++ /dev/null
@@ -1,29 +0,0 @@
-{
-  "name": "@agent-relay/workflow-types",
-  "version": "7.1.1",
-  "type": "module",
-  "main": "dist/index.js",
-  "types": "dist/index.d.ts",
-  "exports": {
-    ".": {
-      "types": "./dist/index.d.ts",
-      "import": "./dist/index.js",
-      "default": "./dist/index.js"
-    }
-  },
-  "scripts": {
-    "build": "tsc",
-    "check": "tsc --noEmit"
-  },
-  "files": [
-    "dist"
-  ],
-  "publishConfig": {
-    "access": "public"
-  },
-  "repository": {
-    "type": "git",
-    "url": "git+https://github.com/AgentWorkforce/relay.git",
-    "directory": "packages/workflow-types"
-  }
-}
diff --git a/packages/workflow-types/src/index.ts b/packages/workflow-types/src/index.ts
deleted file mode 100644
index 31d8ec7c5..000000000
--- a/packages/workflow-types/src/index.ts
+++ /dev/null
@@ -1,377 +0,0 @@
-/**
- * Shared workflow types for Agent Relay packages.
- *
- * This package is intentionally a leaf dependency so workflow integrations can
- * share the public workflow type surface without depending on the full SDK.
- */
-
-export type SwarmPattern =
-  | 'fan-out'
-  | 'pipeline'
-  | 'hub-spoke'
-  | 'consensus'
-  | 'mesh'
-  | 'handoff'
-  | 'cascade'
-  | 'dag'
-  | 'debate'
-  | 'hierarchical'
-  // Additional patterns
-  | 'map-reduce'
-  | 'scatter-gather'
-  | 'supervisor'
-  | 'reflection'
-  | 'red-team'
-  | 'verifier'
-  | 'auction'
-  | 'escalation'
-  | 'saga'
-  | 'circuit-breaker'
-  | 'blackboard'
-  | 'swarm'
-  | 'competitive'
-  | 'review-loop';
-
-// ── Agent definitions ───────────────────────────────────────────────────────
-
-export type AgentPreset = 'lead' | 'worker' | 'reviewer' | 'analyst';
-
-/** Optional credential settings for a workflow agent. */
-export interface AgentCredentialConfig {
-  /** Opt the agent into credential proxy mode. */
-  proxy?: boolean;
-  /** Override the provider used for proxy credential resolution. */
-  provider?: string;
-}
-
-/** Definition of an agent participating in a workflow. */
-export interface AgentDefinition {
-  name: string;
-  cli: AgentCli;
-  role?: string;
-  task?: string;
-  channels?: string[];
-  constraints?: AgentConstraints;
-  /**
-   * Permission configuration controlling file access, network, and exec restrictions.
-   * Omitting this field preserves the default behavior: inherit dotfiles + readwrite access.
-   */
-  permissions?: AgentPermissions;
-  /** When false, the agent runs as a non-interactive subprocess (no PTY, no relay messaging).
-   *  It receives its task as a CLI prompt argument and returns stdout as output.
-   *  Default: true (interactive PTY mode). */
-  interactive?: boolean;
-  /** Working directory for this agent, resolved relative to the YAML file. */
-  cwd?: string;
-  /** Sets this agent's working directory to a named entry from the top-level `paths` array.
-   *  Mutually exclusive with `cwd`. If omitted, the agent runs in the runner's
-   *  working directory (the directory containing the workflow YAML file). */
-  workdir?: string;
-  /** Additional paths the agent needs read/write access to. */
-  additionalPaths?: string[];
-  /**
-   * Role preset that automatically configures interactive mode and injects
-   * appropriate task guardrails. Overrides are still accepted.
-   *   lead     → interactive PTY, relay-aware, coordinates workers via channels
-   *   worker   → interactive: false, produces structured output, no sub-agents
-   *   reviewer → interactive: false, reads artifacts, produces verdict, no sub-agents
-   *   analyst  → interactive: false, reads code/files, writes findings, no sub-agents
-   */
-  preset?: AgentPreset;
-  /** Optional credential proxy settings for this agent. */
-  credentials?: AgentCredentialConfig;
-  /** System prompt / skills for API-mode agents (cli: 'api'). */
-  skills?: string;
-}
-
-export type AgentCli =
-  | 'claude'
-  | 'codex'
-  | 'gemini'
-  | 'aider'
-  | 'goose'
-  | 'opencode'
-  | 'droid'
-  | 'cursor'
-  | 'cursor-agent'
-  | 'agent'
-  | 'api';
-
-/** Resource and behavioral constraints for an agent. */
-export interface AgentConstraints {
-  maxTokens?: number;
-  timeoutMs?: number;
-  retries?: number;
-  model?: string;
-  /** Silence duration in seconds before the agent is considered idle (0 = disabled, default: 30). */
-  idleThresholdSecs?: number;
-}
-
-// ── Permission types ────────────────────────────────────────────────────────
-
-/**
- * Access preset for role-based permission shortcuts.
- *
- *   readonly    → read all non-ignored files, write nothing
- *   readwrite   → read and write all non-ignored files (default behavior)
- *   restricted  → read/write only explicitly listed paths
- *   full        → read and write everything, including normally-ignored files
- */
-export type AccessPreset = 'readonly' | 'readwrite' | 'restricted' | 'full';
-
-/** Fine-grained network permission with allowlist/denylist. */
-export interface NetworkPermissions {
-  /** Host:port pairs the agent may connect to (e.g. ['registry.npmjs.org:443']). */
-  allow?: string[];
-  /** Host:port patterns to block (e.g. ['*'] to deny all except allowed). */
-  deny?: string[];
-}
-
-/** Network permission: boolean to allow/deny all, or object for fine-grained control. */
-export type NetworkPermission = boolean | NetworkPermissions;
-
-/** Glob-based file permission scopes for an agent. */
-export interface FilePermissions {
-  /** Glob patterns the agent may read (e.g. ['src/**', 'docs/**']). */
-  read?: string[];
-  /** Glob patterns the agent may write (e.g. ['src/tests/**']). */
-  write?: string[];
-  /** Glob patterns the agent must never access (e.g. ['.env', 'secrets/**']).
-   *  Deny rules take precedence over read/write grants. */
-  deny?: string[];
-}
-
-/** Reusable named permission profile shared by one or more agents. */
-export interface PermissionProfileDefinition {
-  /** Human-readable summary of the profile's intended use. */
-  description?: string;
-
-  /** Explain why this profile exists or what constraint it is protecting. */
-  why?: string;
-
-  /** Role-based access preset. Expands into file permission rules.
-   *  Default: 'readwrite'. */
-  access?: AccessPreset;
-
-  /** Inherit patterns from .agentignore and .agentreadonly dotfiles.
-   *  Default: true. Set to false to ignore dotfiles for this agent. */
-  inherit?: boolean;
-
-  /** Explicit glob-based file read/write/deny rules.
-   *  Merged on top of the access preset and inherited dotfile patterns. */
-  files?: FilePermissions;
-
-  /** Raw relayauth scopes appended verbatim to the minted token.
-   *  For power users who need fine-grained control beyond file globs.
-   *  Example: ['relayfile:fs:read:/src/**', 'relayfile:fs:write:/tests/**'] */
-  scopes?: string[];
-
-  /** Network access control.
-   *  - undefined: no restriction
-   *  - false: deny all network access
-   *  - { allow, deny }: fine-grained host:port allowlist/denylist */
-  network?: NetworkPermission;
-
-  /** Allowlist of shell commands the agent may execute.
-   *  When set, only commands matching these prefixes are permitted.
-   *  Example: ['npm test', 'npm run lint', 'git diff']
-   *  Default: undefined (no restriction). */
-  exec?: string[];
-}
-
-/**
- * Permission configuration for a workflow agent.
- *
- * All fields are optional — omitting `permissions` entirely preserves the
- * existing default behavior (inherit dotfiles, readwrite access).
- *
- * Resolution order (later overrides earlier):
- *   1. Dotfile patterns (.agentignore / .agentreadonly) when `inherit` is true
- *   2. `access` preset expands into base file rules
- *   3. Explicit `files` globs merge on top
- *   4. `deny` patterns always win (applied last)
- *   5. `scopes` are appended verbatim to the token
- */
-export interface AgentPermissions {
-  /** Human-readable summary of what this permission block is for. */
-  description?: string;
-
-  /** Reference a reusable entry from the top-level `permission_profiles` map. */
-  profile?: string;
-
-  /** Explain why these permissions are needed or intentionally constrained. */
-  why?: string;
-
-  /** Role-based access preset. Expands into file permission rules.
-   *  Default: 'readwrite'. */
-  access?: AccessPreset;
-
-  /** Inherit patterns from .agentignore and .agentreadonly dotfiles.
-   *  Default: true. Set to false to ignore dotfiles for this agent. */
-  inherit?: boolean;
-
-  /** Explicit glob-based file read/write/deny rules.
-   *  Merged on top of the access preset and inherited dotfile patterns. */
-  files?: FilePermissions;
-
-  /** Raw relayauth scopes appended verbatim to the minted token.
-   *  For power users who need fine-grained control beyond file globs.
-   *  Example: ['relayfile:fs:read:/src/**', 'relayfile:fs:write:/tests/**'] */
-  scopes?: string[];
-
-  /** Network access control.
-   *  - undefined: no restriction
-   *  - false: deny all network access
-   *  - { allow, deny }: fine-grained host:port allowlist/denylist */
-  network?: NetworkPermission;
-
-  /** Allowlist of shell commands the agent may execute.
-   *  When set, only commands matching these prefixes are permitted.
-   *  Example: ['npm test', 'npm run lint', 'git diff']
-   *  Default: undefined (no restriction). */
-  exec?: string[];
-}
-
-/** Step type: agent (LLM-powered), deterministic (shell command), worktree (git worktree setup), or integration (external service). */
-export type WorkflowStepType = 'agent' | 'deterministic' | 'worktree' | 'integration';
-
-/**
- * A single step within a workflow.
- *
- * Steps can be either:
- * - Agent steps (type: undefined or "agent"): Spawn an LLM agent to execute a task
- * - Deterministic steps (type: "deterministic"): Execute a shell command
- */
-export interface WorkflowStep {
-  /** Unique step name within the workflow. */
-  name: string;
-  /** Step type: "agent" (default) or "deterministic". */
-  type?: WorkflowStepType;
-  /** Reference to a custom step definition from .relay/steps.yaml. */
-  use?: string;
-  /** Step names that must complete before this step runs. */
-  dependsOn?: string[];
-  /** Timeout in milliseconds. */
-  timeoutMs?: number;
-
-  // ── Agent step fields ──────────────────────────────────────────────────────
-  /** Name of the agent to execute this step (required for agent steps). */
-  agent?: string;
-  /** Task description for the agent (required for agent steps). */
-  task?: string;
-  /** Verification check to validate step output. */
-  verification?: VerificationCheck;
-  /** Number of retry attempts on failure. */
-  retries?: number;
-  /** Maximum iterations for steps that may need to retry (e.g., fix-failures). */
-  maxIterations?: number;
-  /** Explicit working directory for this step. */
-  cwd?: string;
-
-  // ── Deterministic step fields ──────────────────────────────────────────────
-  /** Shell command to execute (required for deterministic steps). */
-  command?: string;
-  /** Sets this step's working directory to a named entry from the top-level `paths` array.
-   *  If omitted, the step inherits the agent's workdir, or falls back to the runner's
-   *  working directory. */
-  workdir?: string;
-  /** Fail if command exit code is non-zero. Default: true. */
-  failOnError?: boolean;
-  /** Capture stdout as step output for downstream steps. Default: true. */
-  captureOutput?: boolean;
-
-  // ── Integration step fields ────────────────────────────────────────────────
-  /** Integration name: 'github', 'linear', 'slack' (required for integration steps). */
-  integration?: string;
-  /** Action within the integration, e.g. 'create-pr', 'create-branch' (required for integration steps). */
-  action?: string;
-  /** Action parameters, supports {{steps.X.output}} interpolation. */
-  params?: Record<string, string>;
-
-  // ── Worktree step fields ──────────────────────────────────────────────────
-  /** Branch name for the worktree (required for worktree steps). */
-  branch?: string;
-  /** Base branch to create the worktree from. Default: HEAD. */
-  baseBranch?: string;
-  /** Explicit path for the worktree. Default: .worktrees/<step-name>. */
-  path?: string;
-  /** Create the branch if it doesn't exist. Default: true. */
-  createBranch?: boolean;
-}
-
-/** Type guard: Check if a step is a deterministic (shell command) step. */
-export function isDeterministicStep(step: WorkflowStep): boolean {
-  return step.type === 'deterministic';
-}
-
-/** Type guard: Check if a step is a worktree (git worktree setup) step. */
-export function isWorktreeStep(step: WorkflowStep): boolean {
-  return step.type === 'worktree';
-}
-
-/** Type guard: Check if a step is an integration (external service) step. */
-export function isIntegrationStep(step: WorkflowStep): boolean {
-  return step.type === 'integration';
-}
-
-/** Type guard: Check if a step uses a custom step definition. */
-export function isCustomStep(step: WorkflowStep): boolean {
-  return step.use !== undefined;
-}
-
-/** Type guard: Check if a step is an agent (LLM-powered) step. */
-export function isAgentStep(step: WorkflowStep): boolean {
-  return step.type !== 'deterministic' && step.type !== 'worktree' && step.type !== 'integration';
-}
-
-// Legacy type aliases for backward compatibility
-export type AgentWorkflowStep = WorkflowStep;
-export type DeterministicWorkflowStep = WorkflowStep;
-
-/** Verification check to validate a step's output. */
-export interface VerificationCheck {
-  type: 'output_contains' | 'exit_code' | 'file_exists' | 'custom' | 'pr_url';
-  /**
-   * Type-specific value:
-   *  - output_contains: token that must appear in the step's output
-   *  - exit_code: expected exit code (currently informational)
-   *  - file_exists: path that must exist (relative to cwd or absolute)
-   *  - custom: shell command to execute, or `regex:<pattern>` against output
-   *  - pr_url: optional `<owner>/<repo>` qualifier to require the discovered
-   *    PR URL belongs to a specific repository; leave empty to accept any
-   *    GitHub PR URL in the step output
-   */
-  value: string;
-  description?: string;
-  timeoutMs?: number;
-  /** Name of the agent to analyze verification failures before retrying. */
-  diagnosticAgent?: string;
-  /** Timeout for the diagnostic agent in milliseconds. Default: 60_000. */
-  diagnosticTimeout?: number;
-}
-
-/**
- * Extension point for delegating step execution to an external backend
- * (e.g. Daytona sandboxes) while keeping the runner's DAG/retry/verification
- * machinery intact.
- */
-export interface RunnerStepExecutor {
-  executeAgentStep(
-    step: WorkflowStep,
-    agentDef: AgentDefinition,
-    resolvedTask: string,
-    timeoutMs?: number
-  ): Promise<string>;
-
-  executeDeterministicStep?(
-    step: WorkflowStep,
-    resolvedCommand: string,
-    cwd: string
-  ): Promise<{ output: string; exitCode: number }>;
-
-  executeIntegrationStep?(
-    step: WorkflowStep,
-    resolvedParams: Record<string, string>,
-    context: { workspaceId?: string }
-  ): Promise<{ output: string; success: boolean }>;
-}
diff --git a/packages/workflow-types/tsconfig.json b/packages/workflow-types/tsconfig.json
deleted file mode 100644
index 222999fef..000000000
--- a/packages/workflow-types/tsconfig.json
+++ /dev/null
@@ -1,22 +0,0 @@
-{
-  "compilerOptions": {
-    "target": "ES2022",
-    "module": "NodeNext",
-    "moduleResolution": "NodeNext",
-    "lib": ["ES2022"],
-    "types": ["node"],
-    "outDir": "./dist",
-    "rootDir": "./src",
-    "strict": true,
-    "esModuleInterop": true,
-    "skipLibCheck": true,
-    "forceConsistentCasingInFileNames": true,
-    "declaration": true,
-    "declarationMap": true,
-    "sourceMap": true,
-    "resolveJsonModule": true,
-    "isolatedModules": true
-  },
-  "include": ["src/**/*"],
-  "exclude": ["node_modules", "dist", "**/*.test.ts"]
-}
diff --git a/scripts/run-relay-cleanroom-ci.sh b/scripts/run-relay-cleanroom-ci.sh
deleted file mode 100755
index e1b803fcb..000000000
--- a/scripts/run-relay-cleanroom-ci.sh
+++ /dev/null
@@ -1,78 +0,0 @@
-#!/usr/bin/env bash
-set -euo pipefail
-
-REPO_ROOT="$(cd "$(dirname "${BASH_SOURCE[0]}")/.." && pwd)"
-cd "$REPO_ROOT"
-
-ARTIFACTS_DIR="$REPO_ROOT/.e2e-artifacts"
-SUMMARY_JSON="$ARTIFACTS_DIR/ci-summary.json"
-SUMMARY_MD="$ARTIFACTS_DIR/ci-summary.md"
-mkdir -p "$ARTIFACTS_DIR"
-
-cleanup() {
-  if command -v agent-relay >/dev/null 2>&1; then
-    agent-relay down >/dev/null 2>&1 || true
-  fi
-}
-trap cleanup EXIT
-
-export PATH="$HOME/.local/bin:/opt/homebrew/bin:/usr/local/bin:/usr/bin:/bin:$PATH"
-export RELAY_CLEANROOM_CI=1
-
-run_id=""
-status="failed"
-if output=$(env PATH="$PATH" agent-relay run workflows/relay-clean-room-e2e-validation.ts 2>&1); then
-  status="completed"
-else
-  status="failed"
-fi
-printf '%s
-' "$output" | tee "$ARTIFACTS_DIR/ci-run.log"
-
-run_id=$(printf '%s
-' "$output" | sed -n 's/^  Run ID:[[:space:]]*//p' | tail -n 1 | xargs || true)
-verdict_file="$ARTIFACTS_DIR/verdict.md"
-if [[ -f "$verdict_file" ]]; then
-  overall=$(grep -E '^\*\*Overall verdict:' "$verdict_file" | head -n1 | sed 's/^\*\*Overall verdict:[[:space:]]*//; s/\*\*$//' || true)
-else
-  overall="missing"
-fi
-
-SUMMARY_JSON="$SUMMARY_JSON" STATUS="$status" RUN_ID="$run_id" OVERALL="$overall" ARTIFACTS_DIR="$ARTIFACTS_DIR" VERDICT_FILE="$verdict_file" python3 - <<'PY'
-import json
-import os
-import pathlib
-root = pathlib.Path(os.environ['SUMMARY_JSON'])
-data = {
-  'status': os.environ['STATUS'],
-  'runId': os.environ['RUN_ID'],
-  'verdict': os.environ['OVERALL'],
-  'artifactsDir': os.environ['ARTIFACTS_DIR'],
-  'verdictFile': os.environ['VERDICT_FILE'],
-}
-root.write_text(json.dumps(data, indent=2) + "\n")
-PY
-
-cat > "$SUMMARY_MD" <<EOF
-# Relay Clean-Room CI Summary
-
-- Status: **$status**
-- Run ID: \
-  - \
-    \
-${run_id:-unknown}
-- Verdict: **${overall:-missing}**
-- Artifacts: \
-  - \
-    \
-$ARTIFACTS_DIR
-
-## Notes
-- This CI wrapper runs the clean-room validation workflow directly.
-- It is most useful as a hardening check for install/bootstrap/local-mode changes.
-- A conditional verdict can still be useful when the only gap is worker-auth in an isolated environment.
-EOF
-
-if [[ "$status" != "completed" ]]; then
-  exit 1
-fi
diff --git a/tests/integration/broker/events-relaycast.test.ts b/tests/integration/broker/events-relaycast.test.ts
deleted file mode 100644
index eabcd4c20..000000000
--- a/tests/integration/broker/events-relaycast.test.ts
+++ /dev/null
@@ -1,115 +0,0 @@
-/**
- * Workflow event ordering and Relaycast channel integration tests.
- *
- * Tests that WorkflowRunner emits workflow events in the expected order and
- * that Relaycast channels receive workflow lifecycle messages when configured.
- *
- * Run:
- *   npx tsc -p tests/integration/broker/tsconfig.json
- *   node --test tests/integration/broker/dist/events-relaycast.test.js
- */
-import test, { type TestContext } from 'node:test';
-import assert from 'node:assert/strict';
-
-import { RelayCast } from '@agent-relay/sdk';
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites, ensureApiKey } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import { assertRunCompleted, assertWorkflowEventOrder } from './utils/workflow-assert-helpers.js';
-import { sleep } from './utils/cli-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-events',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [{ name: 'step-1', agent: 'worker', task: 'Do a thing' }],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-test('events: onEvent fires in correct order', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(makeConfig());
-    assertRunCompleted(result);
-    assertWorkflowEventOrder(result.events, [
-      'run:started',
-      'step:started',
-      'step:completed',
-      'run:completed',
-    ]);
-  } finally {
-    await harness.stop();
-  }
-});
-
-test('events: relaycast channel receives workflow messages', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const suffix = `${Date.now().toString(36)}-${Math.random().toString(36).slice(2, 8)}`;
-  const channel = `events-relay-${suffix}`;
-  const workflowName = `workflow-${suffix}`;
-
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        name: workflowName,
-        swarm: { pattern: 'dag', channel },
-        workflows: [
-          {
-            name: workflowName,
-            steps: [{ name: 'step-1', agent: 'worker', task: 'Do a thing' }],
-          },
-        ],
-      })
-    );
-    assertRunCompleted(result);
-
-    const apiKey = await ensureApiKey();
-    const api = new RelayCast({ apiKey });
-
-    let messages: Array<{ id: string; agent_name: string; text: string; created_at: string }> = [];
-    for (let attempt = 0; attempt < 6; attempt += 1) {
-      messages = (await api.messages.list(channel, { limit: 50 })) as any;
-      if (messages.length > 0) break;
-      await sleep(1_000);
-    }
-
-    assert.ok(
-      messages.some((message) => message.text.includes(`Workflow **${workflowName}**`)),
-      `expected workflow messages for "${workflowName}" in channel "${channel}"`
-    );
-  } finally {
-    await harness.stop();
-  }
-});
diff --git a/tests/integration/broker/output-chaining.test.ts b/tests/integration/broker/output-chaining.test.ts
deleted file mode 100644
index 4b5957b18..000000000
--- a/tests/integration/broker/output-chaining.test.ts
+++ /dev/null
@@ -1,291 +0,0 @@
-/**
- * WorkflowRunner output-chaining integration tests.
- *
- * Verifies interpolation from step outputs and top-level variables across
- * deterministic and agent steps, including unresolved reference behavior.
- */
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig, VariableContext } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertStepCompleted,
-  assertStepOutput,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-output-chaining',
-    description: 'Integration test for output chaining',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-a', type: 'deterministic', command: 'printf "%s" "default"', captureOutput: true },
-        ],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-chain-'));
-}
-
-test(
-  'output-chaining: {{steps.step-a.output}} resolves in downstream deterministic step',
-  { timeout: 120_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start();
-
-    try {
-      const result = await harness.runWorkflow(
-        makeConfig({
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'step-a',
-                  type: 'deterministic',
-                  command: 'printf "%s" "hop-value"',
-                  captureOutput: true,
-                },
-                {
-                  name: 'step-b',
-                  type: 'deterministic',
-                  command: 'printf "%s" "got-{{steps.step-a.output}}"',
-                  dependsOn: ['step-a'],
-                  captureOutput: true,
-                },
-              ],
-            },
-          ],
-        }),
-        undefined,
-        { cwd }
-      );
-
-      assertRunCompleted(result);
-      assertStepCompleted(result, 'step-a');
-      assertStepCompleted(result, 'step-b');
-      assertStepOutput(result, 'step-a', 'hop-value');
-      assertStepOutput(result, 'step-b', 'got-hop-value');
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-test('output-chaining: outputs compose across three-step A→B→C chain', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-a',
-                type: 'deterministic',
-                command: 'printf "%s" "A"',
-                captureOutput: true,
-              },
-              {
-                name: 'step-b',
-                type: 'deterministic',
-                command: 'printf "%s" "B-{{steps.step-a.output}}"',
-                dependsOn: ['step-a'],
-                captureOutput: true,
-              },
-              {
-                name: 'step-c',
-                type: 'deterministic',
-                command: 'printf "%s" "C-{{steps.step-b.output}}"',
-                dependsOn: ['step-b'],
-                captureOutput: true,
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepCompleted(result, 'step-c');
-    assertStepOutput(result, 'step-b', 'B-A');
-    assertStepOutput(result, 'step-c', 'C-B-A');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test(
-  'output-chaining: top-level vars are available in command interpolation',
-  { timeout: 120_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start();
-
-    const vars: VariableContext = { projectName: 'relay-test' };
-
-    try {
-      const result = await harness.runWorkflow(
-        makeConfig({
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'step-a',
-                  type: 'deterministic',
-                  command: 'printf "%s" "project:{{projectName}}"',
-                  captureOutput: true,
-                },
-              ],
-            },
-          ],
-        }),
-        vars,
-        { cwd }
-      );
-
-      assertRunCompleted(result);
-      assertStepCompleted(result, 'step-a');
-      assertStepOutput(result, 'step-a', 'project:relay-test');
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-test(
-  'output-chaining: deterministic output feeds downstream agent task text',
-  { timeout: 120_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start();
-
-    try {
-      const result = await harness.runWorkflow(
-        makeConfig({
-          agents: [{ name: 'worker', cli: 'claude' }],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'step-a',
-                  type: 'deterministic',
-                  command: 'printf "%s" "agent-input"',
-                  captureOutput: true,
-                },
-                {
-                  name: 'step-b',
-                  agent: 'worker',
-                  task: 'Process this: {{steps.step-a.output}}',
-                  dependsOn: ['step-a'],
-                  verification: { type: 'output_contains', value: 'DONE' },
-                },
-              ],
-            },
-          ],
-        }),
-        undefined,
-        { cwd }
-      );
-
-      assertRunCompleted(result);
-      assertStepCompleted(result, 'step-a');
-      assertStepCompleted(result, 'step-b');
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-test('output-chaining: unresolved reference is left as a literal', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-a',
-                type: 'deterministic',
-                command: 'printf "%s" "{{steps.nonexistent.output}}"',
-                captureOutput: true,
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepOutput(result, 'step-a', '{{steps.nonexistent.output}}');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/swarm-dag.test.ts b/tests/integration/broker/swarm-dag.test.ts
deleted file mode 100644
index cf54f293c..000000000
--- a/tests/integration/broker/swarm-dag.test.ts
+++ /dev/null
@@ -1,258 +0,0 @@
-/**
- * Swarm DAG pattern integration tests.
- * Covers serial ordering, parallel fan-out, and maxConcurrency enforcement.
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-runner-harness.js';
-import {
-  assertRunCompleted,
-  assertStepCompleted,
-  assertStepOrder,
-  assertStepsParallel,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-swarm-dag',
-    description: 'Swarm DAG pattern integration test',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-a', type: 'deterministic', command: 'echo DONE_A' },
-          {
-            name: 'step-b',
-            type: 'deterministic',
-            command: 'echo DONE_B',
-            dependsOn: ['step-a'],
-          },
-          {
-            name: 'step-c',
-            type: 'deterministic',
-            command: 'echo DONE_C',
-            dependsOn: ['step-b'],
-          },
-        ],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-swarm-dag-'));
-}
-
-test('swarm-dag: serial A→B→C executes in strict dependency order', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(makeConfig(), undefined, { cwd });
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepCompleted(result, 'step-c');
-
-    // Verify strict serial ordering: A before B before C
-    assertStepOrder(result, ['step-a', 'step-b', 'step-c']);
-
-    // Verify timestamps: each step starts only after the prior step completes
-    const completedA = result.events.findIndex(
-      (e) => e.type === 'step:completed' && 'stepName' in e && e.stepName === 'step-a'
-    );
-    const startedB = result.events.findIndex(
-      (e) => e.type === 'step:started' && 'stepName' in e && e.stepName === 'step-b'
-    );
-    const completedB = result.events.findIndex(
-      (e) => e.type === 'step:completed' && 'stepName' in e && e.stepName === 'step-b'
-    );
-    const startedC = result.events.findIndex(
-      (e) => e.type === 'step:started' && 'stepName' in e && e.stepName === 'step-c'
-    );
-
-    assert.ok(startedB > completedA, 'step-b must not start until step-a completes');
-    assert.ok(startedC > completedB, 'step-c must not start until step-b completes');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('swarm-dag: parallel fan A→{B,C}→D starts B and C concurrently', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'step-a', type: 'deterministic', command: 'echo DONE_A' },
-              {
-                name: 'step-b',
-                type: 'deterministic',
-                command: 'sleep 0.1 && echo DONE_B',
-                dependsOn: ['step-a'],
-              },
-              {
-                name: 'step-c',
-                type: 'deterministic',
-                command: 'sleep 0.1 && echo DONE_C',
-                dependsOn: ['step-a'],
-              },
-              {
-                name: 'step-d',
-                type: 'deterministic',
-                command: 'echo DONE_D',
-                dependsOn: ['step-b', 'step-c'],
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepCompleted(result, 'step-c');
-    assertStepCompleted(result, 'step-d');
-
-    // A must complete before B and C start
-    const completedA = result.events.findIndex(
-      (e) => e.type === 'step:completed' && 'stepName' in e && e.stepName === 'step-a'
-    );
-    const startedB = result.events.findIndex(
-      (e) => e.type === 'step:started' && 'stepName' in e && e.stepName === 'step-b'
-    );
-    const startedC = result.events.findIndex(
-      (e) => e.type === 'step:started' && 'stepName' in e && e.stepName === 'step-c'
-    );
-    assert.ok(startedB > completedA, 'step-b must start after step-a completes');
-    assert.ok(startedC > completedA, 'step-c must start after step-a completes');
-
-    // B and C run concurrently — each starts before the other finishes
-    assertStepsParallel(result, ['step-b', 'step-c']);
-
-    // D must start only after both B and C complete
-    const completedB = result.events.findIndex(
-      (e) => e.type === 'step:completed' && 'stepName' in e && e.stepName === 'step-b'
-    );
-    const completedC = result.events.findIndex(
-      (e) => e.type === 'step:completed' && 'stepName' in e && e.stepName === 'step-c'
-    );
-    const startedD = result.events.findIndex(
-      (e) => e.type === 'step:started' && 'stepName' in e && e.stepName === 'step-d'
-    );
-    assert.ok(startedD > completedB, 'step-d must start after step-b completes');
-    assert.ok(startedD > completedC, 'step-d must start after step-c completes');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test(
-  'swarm-dag: maxConcurrency:2 limits parallel steps to at most 2 at once',
-  { timeout: 60_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start();
-
-    try {
-      // 4 independent steps all ready at once — maxConcurrency:2 should batch them 2-at-a-time
-      const result = await harness.runWorkflow(
-        {
-          version: '1',
-          name: 'test-swarm-dag-concurrency',
-          description: 'maxConcurrency test',
-          swarm: { pattern: 'dag', maxConcurrency: 2 },
-          agents: [{ name: 'worker', cli: 'claude' }],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                { name: 'step-1', type: 'deterministic', command: 'sleep 0.05 && echo DONE_1' },
-                { name: 'step-2', type: 'deterministic', command: 'sleep 0.05 && echo DONE_2' },
-                { name: 'step-3', type: 'deterministic', command: 'sleep 0.05 && echo DONE_3' },
-                { name: 'step-4', type: 'deterministic', command: 'sleep 0.05 && echo DONE_4' },
-              ],
-            },
-          ],
-        },
-        undefined,
-        { cwd }
-      );
-
-      assertRunCompleted(result);
-      assertStepCompleted(result, 'step-1');
-      assertStepCompleted(result, 'step-2');
-      assertStepCompleted(result, 'step-3');
-      assertStepCompleted(result, 'step-4');
-
-      // Verify no more than 2 steps were active simultaneously by scanning the event stream
-      let activeCount = 0;
-      let maxActive = 0;
-      for (const event of result.events) {
-        if (event.type === 'step:started') {
-          activeCount += 1;
-          maxActive = Math.max(maxActive, activeCount);
-        } else if (
-          event.type === 'step:completed' ||
-          event.type === 'step:failed' ||
-          event.type === 'step:skipped'
-        ) {
-          activeCount -= 1;
-        }
-      }
-      assert.ok(
-        maxActive <= 2,
-        `Expected at most 2 concurrent steps, but saw ${maxActive} simultaneously active`
-      );
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
diff --git a/tests/integration/broker/swarm-errors.test.ts b/tests/integration/broker/swarm-errors.test.ts
deleted file mode 100644
index e70839ef5..000000000
--- a/tests/integration/broker/swarm-errors.test.ts
+++ /dev/null
@@ -1,275 +0,0 @@
-/**
- * Swarm error-handling integration tests.
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-runner-harness.js';
-import {
-  assertRunCompleted,
-  assertRunFailed,
-  assertStepCompleted,
-  assertStepFailed,
-  assertStepOutput,
-  assertStepRetried,
-  assertStepSkipped,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-swarm-errors',
-    description: 'Swarm error handling integration test',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli: 'claude', interactive: false }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [{ name: 'step-a', type: 'deterministic', command: 'echo DONE' }],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-swarm-errors-'));
-}
-
-function installFlakyClaudeScript(
-  harness: WorkflowRunnerHarness,
-  counterFile: string,
-  failures: number
-): void {
-  const fakeCliPath = harness.getRelayEnv().PATH?.split(path.delimiter)[0];
-  assert.ok(fakeCliPath, 'Expected fake CLI directory in PATH');
-
-  const script = `#!/usr/bin/env bash
-COUNT_FILE=${JSON.stringify(counterFile)}
-FAILURES=${JSON.stringify(String(failures))}
-MARKER=""
-REVIEW_OUTPUT=""
-if [[ "\${RELAY_AGENT_NAME:-}" =~ ^(.+)-review-[A-Za-z0-9]+$ ]]; then
-  REVIEW_OUTPUT=$'REVIEW_DECISION: APPROVE\\nREVIEW_REASON: Fake reviewer approved'
-elif [[ "\${RELAY_AGENT_NAME:-}" =~ ^(.+)-(worker|owner)-[A-Za-z0-9]+$ ]]; then
-  MARKER="STEP_COMPLETE:\${BASH_REMATCH[1]}"
-elif [[ "\${RELAY_AGENT_NAME:-}" =~ ^(.+)-[A-Za-z0-9]+$ ]]; then
-  MARKER="STEP_COMPLETE:\${BASH_REMATCH[1]}"
-fi
-while IFS= read -r -t 1 line; do
-  if [[ "$line" =~ STEP_COMPLETE:([A-Za-z0-9._-]+) ]]; then
-    MARKER="STEP_COMPLETE:\${BASH_REMATCH[1]}"
-  fi
-done 2>/dev/null
-COUNT=0
-if [ -f "$COUNT_FILE" ]; then
-  COUNT=$(cat "$COUNT_FILE")
-fi
-COUNT=$((COUNT + 1))
-printf '%s\n' "$COUNT" > "$COUNT_FILE"
-if [ "$COUNT" -le "$FAILURES" ]; then
-  echo "temporary failure $COUNT" >&2
-  exit 1
-fi
-if [[ -n "$MARKER" ]]; then
-  echo "$MARKER"
-fi
-if [[ -n "$REVIEW_OUTPUT" ]]; then
-  echo "$REVIEW_OUTPUT"
-fi
-echo "DONE"
-`;
-
-  const claudePath = path.join(fakeCliPath, 'claude');
-  fs.writeFileSync(claudePath, script, { mode: 0o755 });
-}
-
-test('swarm-errors: retries in strategy retry until success', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  const counterFile = path.join(cwd, 'agent-attempts.txt');
-  installFlakyClaudeScript(harness, counterFile, 2);
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        errorHandling: {
-          strategy: 'retry',
-          maxRetries: 2,
-          retryDelayMs: 0,
-        },
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-retry',
-                agent: 'worker',
-                task: 'intermittent agent task',
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd, useRelaycast: false }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-retry');
-    assertStepOutput(result, 'step-retry', 'DONE');
-
-    const retryEvent = assertStepRetried(result, 'step-retry', 2);
-    assert.equal(
-      retryEvent.attempt,
-      2,
-      `Expected final retry attempt to be 2 for 2 failures, got ${retryEvent.attempt}`
-    );
-
-    const attempts = parseInt(fs.readFileSync(counterFile, 'utf8').trim(), 10);
-    assert.equal(attempts, 3, `Expected exactly 3 attempts, saw ${attempts}`);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('swarm-errors: fail-fast aborts workflow after first failure', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-setup',
-                type: 'deterministic',
-                command: 'echo SETUP_OK',
-              },
-              {
-                name: 'step-fail',
-                type: 'deterministic',
-                command: 'echo FAILING && exit 1',
-                dependsOn: ['step-setup'],
-              },
-              {
-                name: 'step-skipped',
-                type: 'deterministic',
-                command: 'echo SHOULD_NOT_RUN',
-                dependsOn: ['step-fail'],
-              },
-              {
-                name: 'step-ok',
-                type: 'deterministic',
-                command: 'echo OK',
-                dependsOn: ['step-setup'],
-              },
-              {
-                name: 'step-blocked',
-                type: 'deterministic',
-                command: 'echo BLOCKED',
-                dependsOn: ['step-ok'],
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd, useRelaycast: false }
-    );
-
-    assertRunFailed(result);
-    assertStepFailed(result, 'step-fail');
-    assertStepSkipped(result, 'step-skipped');
-
-    const blockedCompleted = result.events.find(
-      (event) => event.type === 'step:completed' && 'stepName' in event && event.stepName === 'step-blocked'
-    );
-    assert.ok(!blockedCompleted, 'Expected step-blocked not to complete in fail-fast mode');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('swarm-errors: maxIterations loops until success within 3 attempts', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-  const counterFile = path.join(cwd, 'agent-attempts.txt');
-  installFlakyClaudeScript(harness, counterFile, 2);
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-loop',
-                retries: 2,
-                maxIterations: 3,
-                agent: 'worker',
-                task: 'bounded loop step',
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd, useRelaycast: false }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-loop');
-    assertStepOutput(result, 'step-loop', 'DONE');
-
-    const retryEvent = assertStepRetried(result, 'step-loop', 2);
-    assert.equal(
-      retryEvent.attempt,
-      2,
-      `Expected maxIterations loop to attempt retries up to 2 for 3 total attempts, got ${retryEvent.attempt}`
-    );
-
-    const attempts = parseInt(fs.readFileSync(counterFile, 'utf8').trim(), 10);
-    assert.equal(attempts, 3, `Expected exactly 3 attempts for maxIterations=3, saw ${attempts}`);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/trajectory-quality.test.ts b/tests/integration/broker/trajectory-quality.test.ts
deleted file mode 100644
index eb3542a80..000000000
--- a/tests/integration/broker/trajectory-quality.test.ts
+++ /dev/null
@@ -1,298 +0,0 @@
-/**
- * Trajectory quality integration tests.
- *
- * Verifies that trajectories capture *reasoning* — purpose, step intent,
- * root-cause diagnosis, and actionable learnings — not just mechanical
- * event logs.
- *
- * Tests three scenarios:
- *   1. Success path  — description, step intent, narrative summary are present
- *   2. Verification mismatch failure — cause classified, sentinel named, learning actionable
- *   3. Non-interactive timeout failure — diagnosed as tool-discovery anti-pattern
- *
- * Run:
- *   npx tsc -p tests/integration/broker/tsconfig.json
- *   node --test tests/integration/broker/dist/trajectory-quality.test.js
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertRunFailed,
-  assertTrajectoryExists,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-traj-quality-'));
-}
-
-/** Flatten all chapter events into a single array for easy searching. */
-function allEvents(trajectory: ReturnType<typeof assertTrajectoryExists>) {
-  return trajectory.chapters.flatMap((c) => c.events);
-}
-
-function eventContaining(trajectory: ReturnType<typeof assertTrajectoryExists>, substr: string) {
-  return allEvents(trajectory).find((e) => e.content.includes(substr));
-}
-
-// ── Test 1: Success path ──────────────────────────────────────────────────────
-//
-// A workflow with a description + two non-interactive steps that succeed.
-// The trajectory should:
-//   - Record the workflow purpose in the Planning chapter
-//   - Record step intent (first sentence of task), not just "assigned to agent X"
-//   - Produce a narrative summary ("All N steps completed") not just statistics
-//   - Set approach from actual pattern, not hardcoded "workflow-runner DAG execution"
-//   - Record the completion sentinel as the finding
-
-test(
-  'trajectory quality: success path records purpose, intent, and narrative',
-  { timeout: 240_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start();
-
-    const config: RelayYamlConfig = {
-      version: '1',
-      name: 'traj-success-test',
-      description: 'Validate that trajectory content is reasoning-rich, not log-like.',
-      swarm: { pattern: 'pipeline' },
-      agents: [{ name: 'worker', cli: 'claude', interactive: false, constraints: { model: 'haiku' } }],
-      workflows: [
-        {
-          name: 'default',
-          steps: [
-            {
-              name: 'step-a',
-              agent: 'worker',
-              task: 'Count vowels in "hello world" and output the count. End with: STEP_A_DONE',
-              verification: { type: 'output_contains', value: 'STEP_A_DONE' },
-            },
-            {
-              name: 'step-b',
-              agent: 'worker',
-              task: 'Confirm step-b ran by outputting: STEP_B_DONE',
-              verification: { type: 'output_contains', value: 'STEP_B_DONE' },
-              dependsOn: ['step-a'],
-            },
-          ],
-        },
-      ],
-      trajectories: { enabled: true },
-    };
-
-    try {
-      const result = await harness.runWorkflow(config, undefined, { cwd });
-      assertRunCompleted(result);
-
-      const trajectory = assertTrajectoryExists(harness, cwd);
-
-      // 1. Purpose recorded — description propagated into Planning chapter
-      const purposeEvent = eventContaining(trajectory, 'Validate that trajectory content');
-      assert.ok(purposeEvent, 'Expected "Purpose:" event with workflow description in Planning chapter');
-
-      // 2. Approach reflects actual pattern, not hardcoded string
-      const approach = trajectory.retrospective?.approach ?? '';
-      assert.ok(approach.includes('pipeline'), `Expected approach to include "pipeline", got: "${approach}"`);
-      assert.ok(
-        !approach.includes('workflow-runner DAG execution'),
-        `Expected approach to NOT be the old hardcoded string, got: "${approach}"`
-      );
-
-      // 3. Step intent captured — first sentence of task, not "assigned to agent X"
-      const stepAIntent = eventContaining(trajectory, 'Count vowels');
-      assert.ok(stepAIntent, 'Expected step-a intent event containing first sentence of task');
-      const oldStyleAssign = allEvents(trajectory).find((e) =>
-        e.content.match(/Step "step-a" assigned to agent/)
-      );
-      assert.ok(!oldStyleAssign, 'Should not use old "assigned to agent" phrasing');
-
-      // 4. Completion sentinel appears in finding event (not raw 200-char preview)
-      const stepADone = eventContaining(trajectory, 'STEP_A_DONE');
-      assert.ok(stepADone, 'Expected finding event containing the STEP_A_DONE sentinel');
-      assert.equal(stepADone?.type, 'finding', 'Completion event should be type "finding"');
-
-      // 5. Narrative summary — "All N steps completed" not just stat string
-      const summary = trajectory.retrospective?.summary ?? '';
-      assert.ok(summary.includes('All 2 steps completed'), `Expected narrative summary, got: "${summary}"`);
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-// ── Test 2: Verification mismatch failure ─────────────────────────────────────
-//
-// A step produces output but not the required sentinel.
-// The trajectory should:
-//   - Classify failure as "verification_mismatch"
-//   - Name the missing sentinel in the diagnosis
-//   - Include actionable learning about output format
-//   - Produce a failure narrative summary (not "0/1 steps passed")
-
-test(
-  'trajectory quality: verification mismatch classified with actionable diagnosis',
-  { timeout: 120_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start();
-
-    const sentinel = 'SENTINEL_NEVER_EMITTED';
-
-    const config: RelayYamlConfig = {
-      version: '1',
-      name: 'traj-verify-fail-test',
-      description: 'Tests verification mismatch trajectory classification.',
-      swarm: { pattern: 'pipeline' },
-      agents: [{ name: 'worker', cli: 'claude', interactive: false, constraints: { model: 'haiku' } }],
-      workflows: [
-        {
-          name: 'default',
-          steps: [
-            {
-              name: 'will-fail',
-              agent: 'worker',
-              // Task produces output but not the sentinel — deliberate mismatch
-              task: 'Output exactly: TASK_COMPLETE',
-              verification: { type: 'output_contains', value: sentinel },
-            },
-          ],
-        },
-      ],
-      trajectories: { enabled: true },
-    };
-
-    try {
-      const result = await harness.runWorkflow(config, undefined, { cwd });
-      assertRunFailed(result);
-
-      const trajectory = assertTrajectoryExists(harness, cwd);
-
-      // 1. Failure classified as verification_mismatch
-      const failureEvent = allEvents(trajectory).find((e) => e.type === 'error');
-      assert.ok(failureEvent, 'Expected an error event in trajectory');
-      assert.ok(
-        failureEvent.content.includes('verification_mismatch'),
-        `Expected failure classified as verification_mismatch, got: "${failureEvent.content}"`
-      );
-
-      // 2. Sentinel named in the diagnosis
-      assert.ok(
-        failureEvent.content.includes(sentinel),
-        `Expected failure event to name the missing sentinel "${sentinel}", got: "${failureEvent.content}"`
-      );
-
-      // 3. Actionable learning about output format
-      const learnings = trajectory.retrospective?.learnings ?? [];
-      const outputFormatLearning = learnings.find(
-        (l) => l.includes('output format') || l.includes('task prompt')
-      );
-      assert.ok(
-        outputFormatLearning,
-        `Expected learning about output format, got: ${JSON.stringify(learnings)}`
-      );
-
-      // 4. Failure narrative summary (not stats)
-      const summary = trajectory.retrospective?.summary ?? '';
-      assert.ok(
-        summary.includes('verification_mismatch') || summary.includes('will-fail'),
-        `Expected failure narrative mentioning step/cause, got: "${summary}"`
-      );
-      assert.ok(
-        !summary.match(/^\d+\/\d+ steps passed/),
-        `Expected narrative summary, not stat string, got: "${summary}"`
-      );
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-// ── Test 3: raw field carries machine-readable cause ─────────────────────────
-//
-// The failure event's raw field should include the structured cause so
-// tooling (dashboards, future agents) can consume it without parsing prose.
-
-test('trajectory quality: failure raw field carries structured cause', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  const config: RelayYamlConfig = {
-    version: '1',
-    name: 'traj-raw-cause-test',
-    description: 'Verifies structured cause in raw field of failure events.',
-    swarm: { pattern: 'pipeline' },
-    agents: [{ name: 'worker', cli: 'claude', interactive: false, constraints: { model: 'haiku' } }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'mismatch-step',
-            agent: 'worker',
-            task: 'Say hello.',
-            verification: { type: 'output_contains', value: 'STRUCTURED_CAUSE_TEST' },
-          },
-        ],
-      },
-    ],
-    trajectories: { enabled: true },
-  };
-
-  try {
-    const result = await harness.runWorkflow(config, undefined, { cwd });
-    assertRunFailed(result);
-
-    const trajectory = assertTrajectoryExists(harness, cwd);
-    const failureEvent = allEvents(trajectory).find((e) => e.type === 'error');
-    assert.ok(failureEvent, 'Expected error event');
-
-    // raw.cause must be machine-readable — tools/dashboards use this
-    const cause = failureEvent?.raw?.['cause'];
-    assert.ok(
-      typeof cause === 'string' && cause.length > 0,
-      `Expected raw.cause to be a non-empty string, got: ${JSON.stringify(cause)}`
-    );
-    assert.equal(
-      cause,
-      'verification_mismatch',
-      `Expected raw.cause to be "verification_mismatch", got: "${String(cause)}"`
-    );
-
-    // raw.rawError preserves the original error message for debugging
-    assert.ok(
-      typeof failureEvent?.raw?.['rawError'] === 'string',
-      'Expected raw.rawError to be present for debugging'
-    );
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/trajectory.test.ts b/tests/integration/broker/trajectory.test.ts
deleted file mode 100644
index 91b121c4b..000000000
--- a/tests/integration/broker/trajectory.test.ts
+++ /dev/null
@@ -1,199 +0,0 @@
-/**
- * Workflow trajectory file lifecycle integration tests.
- *
- * Tests that trajectory files are written during runs, transition to
- * completed/, have chapters recorded, and capture agent names correctly.
- *
- * Run:
- *   npx tsc -p tests/integration/broker/tsconfig.json
- *   node --test tests/integration/broker/dist/trajectory.test.js
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertTrajectoryExists,
-  assertTrajectoryCompleted,
-  assertTrajectoryHasChapters,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(agentName = 'worker'): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-trajectory',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: agentName, cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [{ name: 'step-1', agent: agentName, task: 'Do a thing' }],
-      },
-    ],
-    trajectories: { enabled: true },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-traj-'));
-}
-
-async function runWorkflowAndGetTrajectory(
-  harness: WorkflowRunnerHarness,
-  config: ReturnType<typeof makeConfig>,
-  cwd: string
-) {
-  const result = await harness.runWorkflow(config, undefined, { cwd, useRelaycast: false });
-  assertRunCompleted(result);
-
-  return assertTrajectoryExists(harness, cwd);
-}
-
-test('trajectory: file written during run', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const trajectory = await runWorkflowAndGetTrajectory(harness, makeConfig(), cwd);
-    assert.ok(trajectory.id.length > 0, 'Expected trajectory file to include an id');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('trajectory: file transitions to completed status after run', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const trajectory = await runWorkflowAndGetTrajectory(harness, makeConfig(), cwd);
-    assertTrajectoryCompleted(trajectory);
-
-    const activePath = path.join(cwd, '.trajectories', 'active', `${trajectory.id}.json`);
-    const completedPath = path.join(cwd, '.trajectories', 'completed', `${trajectory.id}.json`);
-
-    assert.equal(
-      fs.existsSync(activePath),
-      false,
-      'Expected active trajectory file to be removed after completion'
-    );
-    assert.equal(
-      fs.existsSync(completedPath),
-      true,
-      `Expected completed trajectory file at "${completedPath}"`
-    );
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('trajectory: chapters are recorded during workflow execution', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const trajectory = await runWorkflowAndGetTrajectory(harness, makeConfig(), cwd);
-    assertTrajectoryHasChapters(trajectory, 1);
-
-    for (const chapter of trajectory.chapters) {
-      assert.equal(typeof chapter.id, 'string', 'Expected chapter.id to be a string');
-      assert.equal(typeof chapter.title, 'string', 'Expected chapter.title to be a string');
-      assert.equal(typeof chapter.startedAt, 'string', 'Expected chapter.startedAt to be a string');
-      assert.equal(typeof chapter.agentName, 'string', 'Expected chapter.agentName to be a string');
-      assert.ok(Array.isArray(chapter.events), 'Expected chapter.events to be an array');
-    }
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('trajectory: chapters record agent names', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const agentName = 'my-worker';
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const trajectory = await runWorkflowAndGetTrajectory(harness, makeConfig(agentName), cwd);
-    assertTrajectoryHasChapters(trajectory, 1);
-
-    const agentNamesInChapters = trajectory.chapters.map((ch) => ch.agentName);
-    if (!agentNamesInChapters.some((name) => name === agentName)) {
-      throw new Error(
-        `Expected at least one chapter with agentName "${agentName}", got: ${JSON.stringify(agentNamesInChapters)}`
-      );
-    }
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('trajectory: records task metadata and participating agents', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const agentName = 'meta-agent';
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const trajectory = await runWorkflowAndGetTrajectory(harness, makeConfig(agentName), cwd);
-    assertTrajectoryCompleted(trajectory);
-    assert.equal(
-      trajectory.task.title,
-      'default',
-      `Expected trajectory task title to match workflow name, got "${trajectory.task.title}"`
-    );
-    assert.equal(typeof trajectory.startedAt, 'string', 'Expected trajectory.startedAt to be a string');
-    assert.equal(typeof trajectory.completedAt, 'string', 'Expected trajectory.completedAt to be a string');
-
-    assert.ok(Array.isArray(trajectory.agents), 'Expected trajectory.agents to be an array');
-    assert.ok(trajectory.agents.length >= 1, 'Expected at least one agent in trajectory');
-    assert.ok(
-      trajectory.agents.some((agent) => agent.name === agentName),
-      `Expected trajectory.agents to include agent "${agentName}"`
-    );
-    for (const trajectoryAgent of trajectory.agents) {
-      assert.equal(typeof trajectoryAgent.name, 'string', 'Expected trajectoryAgent.name to be a string');
-      assert.equal(typeof trajectoryAgent.role, 'string', 'Expected trajectoryAgent.role to be a string');
-      assert.equal(
-        typeof trajectoryAgent.joinedAt,
-        'string',
-        'Expected trajectoryAgent.joinedAt to be a string'
-      );
-    }
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/utils/workflow-assert-helpers.ts b/tests/integration/broker/utils/workflow-assert-helpers.ts
deleted file mode 100644
index 29384eb10..000000000
--- a/tests/integration/broker/utils/workflow-assert-helpers.ts
+++ /dev/null
@@ -1,216 +0,0 @@
-import assert from 'node:assert/strict';
-
-import type { BrokerEvent } from '@agent-relay/sdk';
-import type { DryRunReport, WorkflowEvent } from '@agent-relay/sdk/workflows';
-import type { TrajectoryFile, WorkflowRunResult, WorkflowRunnerHarness } from './workflow-harness.js';
-
-function getStepEvent(result: WorkflowRunResult, type: string, stepName: string): WorkflowEvent | undefined {
-  return result.events.find(
-    (event) => event.type === type && 'stepName' in event && event.stepName === stepName
-  );
-}
-
-export function assertRunCompleted(result: WorkflowRunResult): void {
-  assert.equal(result.run.status, 'completed', `Expected run to be completed, got "${result.run.status}"`);
-}
-
-export function assertRunFailed(result: WorkflowRunResult, errorSubstring?: string): void {
-  assert.equal(result.run.status, 'failed', `Expected run to be failed, got "${result.run.status}"`);
-
-  const runFailed = result.events.find((event) => event.type === 'run:failed');
-  assert.ok(runFailed, 'Expected run:failed event');
-
-  if (errorSubstring) {
-    const error = result.run.error ?? ('error' in runFailed ? runFailed.error : undefined);
-    assert.ok(
-      typeof error === 'string' && error.includes(errorSubstring),
-      `Expected failure to contain "${errorSubstring}", got: ${String(error)}`
-    );
-  }
-}
-
-export function assertStepCompleted(result: WorkflowRunResult, stepName: string): void {
-  const event = getStepEvent(result, 'step:completed', stepName);
-  assert.ok(event, `Expected "${stepName}" to complete`);
-}
-
-export function assertStepFailed(result: WorkflowRunResult, stepName: string): void {
-  const event = getStepEvent(result, 'step:failed', stepName);
-  assert.ok(event, `Expected "${stepName}" to fail`);
-}
-
-export function assertStepSkipped(result: WorkflowRunResult, stepName: string): void {
-  const event = getStepEvent(result, 'step:skipped', stepName);
-  assert.ok(event, `Expected "${stepName}" to be skipped`);
-}
-
-export function assertStepOrder(result: WorkflowRunResult, stepNames: string[]): void {
-  let cursor = -1;
-  for (const stepName of stepNames) {
-    const index = result.events.findIndex(
-      (event, i) =>
-        i > cursor && event.type === 'step:started' && 'stepName' in event && event.stepName === stepName
-    );
-    assert.ok(index !== -1, `Expected step "${stepName}" to start`);
-    cursor = index;
-  }
-}
-
-export function assertStepsParallel(result: WorkflowRunResult, stepNames: string[]): void {
-  const startIndexes: Record<string, number> = {};
-  const completedIndexes: Record<string, number> = {};
-
-  for (const name of stepNames) {
-    const startIndex = result.events.findIndex(
-      (event, i) => i >= 0 && event.type === 'step:started' && 'stepName' in event && event.stepName === name
-    );
-    const completedIndex = result.events.findIndex(
-      (event, i) =>
-        i >= 0 && event.type === 'step:completed' && 'stepName' in event && event.stepName === name
-    );
-    assert.ok(startIndex !== -1, `Expected "${name}" to start`);
-    assert.ok(completedIndex !== -1, `Expected "${name}" to complete`);
-    startIndexes[name] = startIndex;
-    completedIndexes[name] = completedIndex;
-  }
-
-  for (let i = 1; i < stepNames.length; i += 1) {
-    const priorName = stepNames[i - 1];
-    const currentName = stepNames[i];
-    assert.ok(
-      startIndexes[currentName] < completedIndexes[priorName],
-      `Expected "${currentName}" to start before "${priorName}" completed`
-    );
-  }
-}
-
-export function assertWorkflowEventOrder(
-  events: WorkflowEvent[],
-  expectedTypes: WorkflowEvent['type'][]
-): void {
-  let cursor = -1;
-  for (const expected of expectedTypes) {
-    const index = events.findIndex((event, i) => i > cursor && event.type === expected);
-    assert.ok(index !== -1, `Expected event "${expected}" to appear in order`);
-    cursor = index;
-  }
-}
-
-export function assertStepOutput(
-  result: WorkflowRunResult,
-  stepName: string,
-  expectedSubstring: string
-): void {
-  const event = result.events.find(
-    (candidate) =>
-      candidate.type === 'step:completed' &&
-      'stepName' in candidate &&
-      candidate.stepName === stepName &&
-      'output' in candidate &&
-      typeof candidate.output === 'string'
-  ) as (WorkflowEvent & { output: string }) | undefined;
-
-  assert.ok(event, `Expected "${stepName}" to have output`);
-  assert.ok(
-    event.output.includes(expectedSubstring),
-    `Expected output of "${stepName}" to include "${expectedSubstring}"`
-  );
-}
-
-export function assertStepCount(
-  result: WorkflowRunResult,
-  status: 'completed' | 'failed' | 'skipped',
-  expectedCount: number
-): void {
-  const eventType = `step:${status}` as const;
-  const count = result.events.filter((event) => event.type === eventType).length;
-  assert.equal(count, expectedCount, `Expected ${expectedCount} ${status} steps, got ${count}`);
-}
-
-export function assertTrajectoryExists(harness: WorkflowRunnerHarness, cwd: string): TrajectoryFile {
-  const trajectory = harness.getTrajectory(cwd);
-  assert.ok(trajectory, `Expected a trajectory file under "${cwd}/.trajectories"`);
-
-  assert.ok(typeof trajectory.id === 'string' && trajectory.id.length > 0, 'Expected trajectory.id');
-  assert.equal(typeof trajectory.version, 'number', 'Expected trajectory.version to be a number');
-  assert.ok(
-    trajectory.status === 'active' || trajectory.status === 'completed' || trajectory.status === 'abandoned',
-    `Unexpected trajectory status "${trajectory.status}"`
-  );
-  assert.equal(typeof trajectory.startedAt, 'string', 'Expected trajectory.startedAt');
-  assert.ok(
-    typeof trajectory.task?.title === 'string' && trajectory.task.title.length > 0,
-    'Expected trajectory.task.title'
-  );
-  assert.ok(Array.isArray(trajectory.chapters), 'Expected trajectory.chapters to be an array');
-
-  return trajectory;
-}
-
-export function assertTrajectoryCompleted(trajectory: TrajectoryFile): void {
-  assert.equal(
-    trajectory.status,
-    'completed',
-    `Expected trajectory to be completed, got "${trajectory.status}"`
-  );
-}
-
-export function assertTrajectoryHasChapters(trajectory: TrajectoryFile, minCount: number): void {
-  assert.ok(Number.isInteger(minCount) && minCount >= 0, `Invalid minCount "${minCount}"`);
-  assert.ok(
-    trajectory.chapters.length >= minCount,
-    `Expected at least ${minCount} trajectory chapters, got ${trajectory.chapters.length}`
-  );
-}
-
-export function assertBrokerEventEmitted<K extends BrokerEvent['kind']>(
-  brokerEvents: BrokerEvent[],
-  kind: K,
-  predicate?: (event: Extract<BrokerEvent, { kind: K }>) => boolean
-): Extract<BrokerEvent, { kind: K }> {
-  const matches = brokerEvents.filter(
-    (event): event is Extract<BrokerEvent, { kind: K }> => event.kind === kind
-  );
-  assert.ok(matches.length > 0, `Expected broker event kind "${kind}" to be emitted`);
-
-  if (!predicate) {
-    return matches[0];
-  }
-
-  const matched = matches.find((event) => predicate(event));
-  assert.ok(matched, `Expected broker event kind "${kind}" to match predicate`);
-  return matched;
-}
-
-export function assertStepRetried(
-  result: WorkflowRunResult,
-  stepName: string,
-  minAttempts: number
-): Extract<WorkflowEvent, { type: 'step:retrying' }> {
-  assert.ok(Number.isInteger(minAttempts) && minAttempts >= 1, `Invalid minAttempts "${minAttempts}"`);
-
-  const retryEvents = result.events.filter(
-    (event): event is Extract<WorkflowEvent, { type: 'step:retrying' }> =>
-      event.type === 'step:retrying' && event.stepName === stepName
-  );
-  assert.ok(retryEvents.length > 0, `Expected "${stepName}" to emit step:retrying`);
-
-  const maxAttempt = retryEvents.reduce((max, event) => Math.max(max, event.attempt), 0);
-  assert.ok(
-    maxAttempt >= minAttempts,
-    `Expected "${stepName}" to retry at least ${minAttempts} times, got ${maxAttempt}`
-  );
-
-  const matchingEvent = retryEvents.find((event) => event.attempt >= minAttempts);
-  assert.ok(matchingEvent, `Expected "${stepName}" retry event with attempt >= ${minAttempts}`);
-  return matchingEvent;
-}
-
-export function assertDryRunValid(report: DryRunReport): void {
-  assert.equal(report.valid, true, 'Expected dry-run report to be valid');
-  assert.equal(
-    report.errors.length,
-    0,
-    `Expected dry-run report to have no errors, got: ${JSON.stringify(report.errors)}`
-  );
-}
diff --git a/tests/integration/broker/utils/workflow-harness.ts b/tests/integration/broker/utils/workflow-harness.ts
deleted file mode 100644
index d444e55dd..000000000
--- a/tests/integration/broker/utils/workflow-harness.ts
+++ /dev/null
@@ -1,300 +0,0 @@
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-
-import type { BrokerEvent } from '@agent-relay/sdk';
-import { ensureApiKey, resolveBinaryPath } from './broker-harness.js';
-import { type RelayYamlConfig, type VariableContext, type WorkflowRunRow } from '@agent-relay/sdk/workflows';
-import { WorkflowRunner, type WorkflowEvent } from '@agent-relay/sdk/workflows';
-
-export interface WorkflowRunResult {
-  run: WorkflowRunRow;
-  events: WorkflowEvent[];
-  brokerEvents: BrokerEvent[];
-}
-
-export interface TrajectoryFile {
-  id: string;
-  version: number;
-  task: {
-    title: string;
-    source?: {
-      system: string;
-      id: string;
-    };
-  };
-  status: 'active' | 'completed' | 'abandoned';
-  startedAt: string;
-  completedAt?: string;
-  agents: Array<{
-    name: string;
-    role: string;
-    joinedAt: string;
-  }>;
-  chapters: Array<{
-    id: string;
-    title: string;
-    agentName: string;
-    startedAt: string;
-    endedAt?: string;
-    events: Array<{
-      ts: number;
-      type: string;
-      content: string;
-      raw?: Record<string, unknown>;
-      significance?: 'low' | 'medium' | 'high';
-    }>;
-  }>;
-  retrospective?: {
-    summary: string;
-    approach: string;
-    confidence: number;
-    learnings?: string[];
-    challenges?: string[];
-  };
-}
-
-export class WorkflowRunnerHarness {
-  private fakeCliDir?: string;
-  private runnerEnv?: NodeJS.ProcessEnv;
-  private currentRunner?: WorkflowRunner;
-  private brokerEvents: BrokerEvent[] = [];
-  private binaryPath: string;
-  private started = false;
-  private defaultUseRelaycast = true;
-
-  constructor() {
-    this.binaryPath = resolveBinaryPath();
-  }
-
-  getBinaryPath(): string {
-    return this.binaryPath;
-  }
-
-  getRelayEnv(): NodeJS.ProcessEnv {
-    return this.runnerEnv ?? process.env;
-  }
-
-  getCurrentRunner(): WorkflowRunner | undefined {
-    return this.currentRunner;
-  }
-
-  async start(options?: { useRelaycast?: boolean }): Promise<void> {
-    if (this.started) return;
-
-    const fakeCliDir = ensureFakeCliDir();
-    const existingPath = process.env.PATH ?? '';
-    const mergedPath = existingPath ? `${fakeCliDir}${path.delimiter}${existingPath}` : fakeCliDir;
-    const env: NodeJS.ProcessEnv = {
-      ...process.env,
-      PATH: mergedPath,
-    };
-
-    this.fakeCliDir = fakeCliDir;
-    this.defaultUseRelaycast = options?.useRelaycast !== false;
-    this.runnerEnv = { ...env };
-
-    if (this.defaultUseRelaycast) {
-      const apiKey = await ensureApiKey();
-      this.runnerEnv = {
-        ...env,
-        RELAY_API_KEY: apiKey,
-      };
-    }
-
-    this.started = true;
-  }
-
-  async stop(): Promise<void> {
-    if (!this.started) return;
-
-    // Abort any in-flight workflow run so its broker handles are released.
-    // Without this, node:test's timeout marks the test failed but the process
-    // stays alive forever waiting on pending broker I/O.
-    this.currentRunner?.abort();
-
-    this.started = false;
-    this.currentRunner = undefined;
-    this.brokerEvents = [];
-    if (this.fakeCliDir) {
-      fs.rmSync(this.fakeCliDir, { recursive: true, force: true });
-      this.fakeCliDir = undefined;
-    }
-  }
-
-  /**
-   * Return all broker events captured since start() (or last clearEvents call).
-   */
-  getEvents(): BrokerEvent[] {
-    return [...this.brokerEvents];
-  }
-
-  /**
-   * Clear captured broker events.
-   */
-  clearEvents(): void {
-    this.brokerEvents = [];
-  }
-
-  /**
-   * Abort the currently running workflow, if any.
-   */
-  abortCurrentRun(): void {
-    this.currentRunner?.abort();
-  }
-
-  /**
-   * Run a workflow config through the real WorkflowRunner and collect events.
-   */
-  async runWorkflow(
-    config: RelayYamlConfig,
-    vars?: VariableContext,
-    options?: { workflowName?: string; cwd?: string; useRelaycast?: boolean }
-  ): Promise<WorkflowRunResult> {
-    const useRelaycast = options?.useRelaycast ?? this.defaultUseRelaycast;
-
-    if (!this.started) {
-      await this.start({ useRelaycast });
-    } else if (useRelaycast && !this.runnerEnv?.RELAY_API_KEY) {
-      this.runnerEnv = {
-        ...this.runnerEnv,
-        RELAY_API_KEY: await ensureApiKey(),
-      };
-      this.defaultUseRelaycast = true;
-    }
-
-    this.brokerEvents = [];
-
-    const events: WorkflowEvent[] = [];
-    const runner = new WorkflowRunner({
-      cwd: options?.cwd,
-      relay: {
-        binaryPath: this.binaryPath,
-        env: {
-          ...this.runnerEnv,
-          ...(process.env.FAKE_OUTPUT === undefined ? {} : { FAKE_OUTPUT: process.env.FAKE_OUTPUT }),
-          ...(useRelaycast ? {} : { AGENT_RELAY_WORKFLOW_DISABLE_RELAYCAST: '1' }),
-        },
-      },
-    });
-    this.currentRunner = runner;
-
-    const unsubscribe = runner.on((event) => {
-      events.push(event);
-      if (event.type === 'broker:event') {
-        this.brokerEvents.push(event.event);
-      }
-    });
-
-    try {
-      const run = await runner.execute(config, options?.workflowName, vars);
-      return {
-        run,
-        events,
-        brokerEvents: [...this.brokerEvents],
-      };
-    } finally {
-      unsubscribe();
-      this.currentRunner = undefined;
-    }
-  }
-
-  /**
-   * Read the latest trajectory JSON file for a workflow run.
-   * Checks completed before active to prefer finished runs.
-   */
-  getTrajectory(cwd: string): TrajectoryFile | null {
-    const completed = path.join(cwd, '.trajectories', 'completed');
-    const active = path.join(cwd, '.trajectories', 'active');
-
-    const completedTrajectory = readLatestTrajectoryFile(completed);
-    if (completedTrajectory) {
-      return completedTrajectory;
-    }
-
-    return readLatestTrajectoryFile(active);
-  }
-}
-
-function ensureFakeCliDir(cliName = 'claude'): string {
-  const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-cli-'));
-  const script =
-    '#!/usr/bin/env bash\n' +
-    'FAKE_OUTPUT_SET=0\n' +
-    'if [[ -n "${FAKE_OUTPUT+x}" ]]; then\n' +
-    '  OUTPUT="$FAKE_OUTPUT"\n' +
-    '  FAKE_OUTPUT_SET=1\n' +
-    'else\n' +
-    '  OUTPUT="DONE"\n' +
-    'fi\n' +
-    'INPUT_BUFFER="$*"$\'\\n\'\n' +
-    'MARKER=""\n' +
-    'REVIEW_OUTPUT=""\n' +
-    'if [[ "${RELAY_AGENT_NAME:-}" =~ ^(.+)-review-[A-Za-z0-9]+$ ]]; then\n' +
-    "  REVIEW_OUTPUT=$'REVIEW_DECISION: APPROVE\\nREVIEW_REASON: Fake reviewer approved'\n" +
-    'elif [[ "${RELAY_AGENT_NAME:-}" =~ ^(.+)-(worker|owner)-[A-Za-z0-9]+$ ]]; then\n' +
-    '  MARKER="STEP_COMPLETE:${BASH_REMATCH[1]}"\n' +
-    'elif [[ "${RELAY_AGENT_NAME:-}" =~ ^(.+)-[A-Za-z0-9]+$ ]]; then\n' +
-    '  MARKER="STEP_COMPLETE:${BASH_REMATCH[1]}"\n' +
-    'fi\n' +
-    'while IFS= read -r -t 1 line; do\n' +
-    '  INPUT_BUFFER+="$line"$\'\\n\'\n' +
-    '  if [[ "$line" =~ STEP_COMPLETE:([A-Za-z0-9._-]+) ]]; then\n' +
-    '    MARKER="STEP_COMPLETE:${BASH_REMATCH[1]}"\n' +
-    '  fi\n' +
-    'done 2>/dev/null\n' +
-    'if [[ "$FAKE_OUTPUT_SET" -eq 0 ]]; then\n' +
-    '  if [[ "$INPUT_BUFFER" =~ End[[:space:]]with:[[:space:]]([A-Za-z0-9._-]+) ]]; then\n' +
-    '    OUTPUT="${BASH_REMATCH[1]}"\n' +
-    '  elif [[ "$INPUT_BUFFER" =~ outputting:[[:space:]]([A-Za-z0-9._-]+) ]]; then\n' +
-    '    OUTPUT="${BASH_REMATCH[1]}"\n' +
-    '  elif [[ "$INPUT_BUFFER" =~ Output[[:space:]]exactly:[[:space:]]([A-Za-z0-9._-]+) ]]; then\n' +
-    '    OUTPUT="${BASH_REMATCH[1]}"\n' +
-    '  elif [[ "$INPUT_BUFFER" =~ Print[[:space:]]([A-Za-z0-9._-]+) ]]; then\n' +
-    '    OUTPUT="${BASH_REMATCH[1]}"\n' +
-    '  elif [[ "$INPUT_BUFFER" =~ Return[[:space:]]([A-Za-z0-9._-]+) ]]; then\n' +
-    '    OUTPUT="${BASH_REMATCH[1]}"\n' +
-    '  elif [[ "$INPUT_BUFFER" =~ Say[[:space:]]([A-Za-z0-9._-]+)[[:space:]]when[[:space:]]finished ]]; then\n' +
-    '    OUTPUT="${BASH_REMATCH[1]}"\n' +
-    '  fi\n' +
-    'fi\n' +
-    'if [[ -n "$MARKER" ]]; then\n' +
-    '  echo "$MARKER"\n' +
-    'fi\n' +
-    'if [[ -n "$REVIEW_OUTPUT" ]]; then\n' +
-    '  echo "$REVIEW_OUTPUT"\n' +
-    'fi\n' +
-    'echo "$OUTPUT"\n' +
-    'exit 0\n';
-
-  const scriptPath = path.join(dir, cliName);
-  fs.writeFileSync(scriptPath, script, { mode: 0o755 });
-
-  return dir;
-}
-
-function readLatestTrajectoryFile(dir: string): TrajectoryFile | null {
-  if (!fs.existsSync(dir)) {
-    return null;
-  }
-
-  const files = fs
-    .readdirSync(dir)
-    .filter((entry) => entry.endsWith('.json'))
-    .map((entry) => ({
-      path: path.join(dir, entry),
-      mtimeMs: fs.statSync(path.join(dir, entry)).mtimeMs,
-    }))
-    .sort((a, b) => b.mtimeMs - a.mtimeMs);
-
-  for (const file of files) {
-    try {
-      const raw = fs.readFileSync(file.path, 'utf-8');
-      return JSON.parse(raw) as TrajectoryFile;
-    } catch {
-      // Continue to next file if parse fails.
-    }
-  }
-
-  return null;
-}
diff --git a/tests/integration/broker/utils/workflow-runner-harness.ts b/tests/integration/broker/utils/workflow-runner-harness.ts
deleted file mode 100644
index 16a9ea276..000000000
--- a/tests/integration/broker/utils/workflow-runner-harness.ts
+++ /dev/null
@@ -1 +0,0 @@
-export { WorkflowRunnerHarness, type WorkflowRunResult, type TrajectoryFile } from './workflow-harness.js';
diff --git a/tests/integration/broker/workflow-agents.test.ts b/tests/integration/broker/workflow-agents.test.ts
deleted file mode 100644
index a6a1f7f58..000000000
--- a/tests/integration/broker/workflow-agents.test.ts
+++ /dev/null
@@ -1,203 +0,0 @@
-/**
- * WorkflowRunner agent-interaction integration tests.
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertRunFailed,
-  assertStepCompleted,
-  assertStepFailed,
-  assertStepOutput,
-  assertWorkflowEventOrder,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-workflow-agents',
-    description: 'Integration test',
-    swarm: { pattern: 'dag' },
-    agents: [
-      { name: 'agent-a', cli: 'claude' },
-      { name: 'agent-b', cli: 'claude' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-a', agent: 'agent-a', task: 'Do agent-a work' },
-          { name: 'step-b', agent: 'agent-b', task: 'Do agent-b work' },
-        ],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-agents-'));
-}
-
-test('workflow-agents: runs steps for different agents', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(makeConfig(), undefined, { cwd, useRelaycast: false });
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepOutput(result, 'step-a', 'DONE');
-    assertStepOutput(result, 'step-b', 'DONE');
-    assertWorkflowEventOrder(result.events, [
-      'run:started',
-      'step:started',
-      'step:completed',
-      'run:completed',
-    ]);
-    assert.ok(result.brokerEvents.length > 0, 'Expected broker events from agent lifecycle');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-agents: emits agent lifecycle events', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const result = await harness.runWorkflow(makeConfig(), undefined, { cwd, useRelaycast: false });
-    const eventKinds = new Set(result.brokerEvents.map((event) => event.kind));
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepOutput(result, 'step-a', 'DONE');
-    assertStepOutput(result, 'step-b', 'DONE');
-    assertWorkflowEventOrder(result.events, [
-      'run:started',
-      'step:started',
-      'step:completed',
-      'run:completed',
-    ]);
-    assert.ok(eventKinds.has('agent_spawned'), 'Expected agent_spawned broker event');
-    assert.ok(
-      eventKinds.has('agent_released') || eventKinds.has('agent_exited'),
-      `Expected agent_released or agent_exited broker event, got: ${JSON.stringify([...eventKinds])}`
-    );
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-agents: retries deterministic work on transient failure', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-
-  try {
-    const marker = 'wf-retry-marker.txt';
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-retry',
-                type: 'deterministic',
-                command: `if [ ! -f ${marker} ]; then echo fail-once; touch ${marker}; exit 1; fi; echo DONE`,
-                retries: 1,
-                verification: { type: 'output_contains', value: 'DONE' },
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd, useRelaycast: false }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-retry');
-    assertStepOutput(result, 'step-retry', 'DONE');
-    const retrying = result.events.find((event) => event.type === 'step:retrying');
-    assert.ok(retrying, 'Expected a retrying event');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-agents: surfaces deterministic agent failure', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-  const previousOutput = process.env.FAKE_OUTPUT;
-
-  try {
-    process.env.FAKE_OUTPUT = 'ERROR';
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-a',
-                agent: 'agent-a',
-                task: 'Should fail verification',
-                verification: { type: 'output_contains', value: 'DONE' },
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd, useRelaycast: false }
-    );
-
-    assertRunFailed(result, 'does not contain');
-    assertStepFailed(result, 'step-a');
-  } finally {
-    process.env.FAKE_OUTPUT = previousOutput;
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/workflow-ci.test.ts b/tests/integration/broker/workflow-ci.test.ts
deleted file mode 100644
index 43f01ca93..000000000
--- a/tests/integration/broker/workflow-ci.test.ts
+++ /dev/null
@@ -1,688 +0,0 @@
-/**
- * CI-friendly workflow integration tests using lightweight processes.
- *
- * These tests use a lightweight fake CLI shim (named as an allowed Relaycast
- * CLI) so they can run in CI without API keys or real AI CLI binaries.
- *
- * Run:
- *   npx tsc -p tests/integration/broker/tsconfig.json
- *   node --test tests/integration/broker/dist/workflow-ci.test.js
- *
- * No special environment variables required (auto-provisions ephemeral workspace).
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { BrokerEvent } from '@agent-relay/sdk';
-import { BrokerHarness, checkPrerequisites, uniqueSuffix } from './utils/broker-harness.js';
-import {
-  assertAgentExists,
-  assertAgentNotExists,
-  assertNoDroppedDeliveries,
-  assertAgentSpawnedEvent,
-  assertAgentReleasedEvent,
-} from './utils/assert-helpers.js';
-import { sleep } from './utils/cli-helpers.js';
-
-const CI_TEST_CLI = 'gemini';
-const DELIVERY_PROGRESS_KINDS = new Set<BrokerEvent['kind']>([
-  'delivery_queued',
-  'delivery_injected',
-  'delivery_active',
-  'delivery_verified',
-  'delivery_ack',
-  'delivery_retry',
-]);
-
-let fakeCliDir: string | undefined;
-
-function ensureFakeCliDir(): string {
-  if (fakeCliDir) return fakeCliDir;
-
-  const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'relay-ci-cli-'));
-  const script = '#!/usr/bin/env bash\nexec cat\n';
-  const fakeCliPath = path.join(dir, CI_TEST_CLI);
-  fs.writeFileSync(fakeCliPath, script, { mode: 0o755 });
-  fakeCliDir = dir;
-  return dir;
-}
-
-function createCiHarness(): BrokerHarness {
-  const shimDir = ensureFakeCliDir();
-  const existingPath = process.env.PATH ?? '';
-  const mergedPath = existingPath ? `${shimDir}${path.delimiter}${existingPath}` : shimDir;
-  return new BrokerHarness({
-    env: {
-      ...process.env,
-      PATH: mergedPath,
-    },
-  });
-}
-
-function countDeliveryProgress(events: BrokerEvent[], name?: string): number {
-  return events.filter((event) => {
-    if (!DELIVERY_PROGRESS_KINDS.has(event.kind)) return false;
-    if (!name) return true;
-    return 'name' in event && (event as BrokerEvent & { name: string }).name === name;
-  }).length;
-}
-
-function countUniqueDeliveryEventIds(events: BrokerEvent[], name?: string): number {
-  const ids = new Set<string>();
-  for (const event of events) {
-    if (!DELIVERY_PROGRESS_KINDS.has(event.kind)) continue;
-    if (!('event_id' in event)) continue;
-    if (name && (!('name' in event) || event.name !== name)) continue;
-    ids.add(event.event_id);
-  }
-  return ids.size;
-}
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-// ── Basic Cat Agent Tests ────────────────────────────────────────────────────
-
-test('ci: cat agent — spawn and verify alive', { timeout: 30_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const agentName = `cat-basic-${uniqueSuffix()}`;
-
-  try {
-    const spawned = await harness.spawnAgent(agentName, CI_TEST_CLI, ['ci-test']);
-    assert.equal(spawned.name, agentName);
-    assert.equal(spawned.runtime, 'pty');
-
-    await sleep(3_000);
-    await assertAgentExists(harness, agentName);
-
-    const events = harness.getEvents();
-    assertAgentSpawnedEvent(events, agentName);
-
-    await harness.releaseAgent(agentName);
-    await sleep(2_000);
-    await assertAgentNotExists(harness, agentName);
-  } finally {
-    await harness.stop();
-  }
-});
-
-test('ci: cat agent — message delivery pipeline', { timeout: 30_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const agentName = `cat-delivery-${uniqueSuffix()}`;
-
-  try {
-    await harness.spawnAgent(agentName, CI_TEST_CLI, ['ci-test']);
-    await sleep(3_000);
-
-    const result = await harness.sendMessage({
-      to: agentName,
-      from: 'ci-runner',
-      text: 'Hello from CI test',
-    });
-    assert.ok(result.event_id, 'should get event_id');
-
-    await sleep(5_000);
-
-    const events = harness.getEvents();
-    assert.ok(countDeliveryProgress(events, agentName) >= 1, `should see delivery progress for ${agentName}`);
-    assertNoDroppedDeliveries(events);
-
-    await harness.releaseAgent(agentName);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Multi-Agent Workflow Patterns ────────────────────────────────────────────
-
-test('ci: review-loop pattern — 3 cat agents', { timeout: 45_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const implementer = `impl-${suffix}`;
-    const reviewer1 = `rev1-${suffix}`;
-    const reviewer2 = `rev2-${suffix}`;
-
-    // Spawn all agents
-    await harness.spawnAgent(implementer, CI_TEST_CLI, ['review-loop']);
-    await harness.spawnAgent(reviewer1, CI_TEST_CLI, ['review-loop']);
-    await harness.spawnAgent(reviewer2, CI_TEST_CLI, ['review-loop']);
-    await sleep(5_000);
-
-    // Verify all alive
-    await assertAgentExists(harness, implementer);
-    await assertAgentExists(harness, reviewer1);
-    await assertAgentExists(harness, reviewer2);
-
-    // Step 1: Send task to implementer
-    await harness.sendMessage({
-      to: implementer,
-      from: 'coordinator',
-      text: 'Implement the feature',
-    });
-    await sleep(3_000);
-
-    // Step 2: Send review tasks to reviewers
-    await harness.sendMessage({
-      to: reviewer1,
-      from: 'coordinator',
-      text: 'Review for code quality',
-    });
-    await harness.sendMessage({
-      to: reviewer2,
-      from: 'coordinator',
-      text: 'Review for security',
-    });
-    await sleep(3_000);
-
-    // Step 3: Reviewer-to-reviewer communication
-    await harness.sendMessage({
-      to: reviewer2,
-      from: reviewer1,
-      text: 'Found an issue, do you agree?',
-    });
-    await sleep(3_000);
-
-    // Verify deliveries
-    const events = harness.getEvents();
-    assertNoDroppedDeliveries(events);
-
-    // Review loop sends 4 messages total.
-    const uniqueDeliveryIds = countUniqueDeliveryEventIds(events);
-    assert.ok(
-      uniqueDeliveryIds >= 4,
-      `should have delivery progress for at least 4 messages, got ${uniqueDeliveryIds}`
-    );
-
-    // Clean up
-    await harness.releaseAgent(implementer);
-    await harness.releaseAgent(reviewer1);
-    await harness.releaseAgent(reviewer2);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-test('ci: hub-spoke pattern — 1 hub + 4 spokes', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const hub = `hub-${suffix}`;
-    const spokes = [`spoke1-${suffix}`, `spoke2-${suffix}`, `spoke3-${suffix}`, `spoke4-${suffix}`];
-
-    // Spawn hub
-    await harness.spawnAgent(hub, CI_TEST_CLI, ['hub-spoke']);
-    await sleep(2_000);
-
-    // Spawn spokes
-    for (const spoke of spokes) {
-      await harness.spawnAgent(spoke, CI_TEST_CLI, ['hub-spoke']);
-    }
-    await sleep(5_000);
-
-    // Verify all alive
-    await assertAgentExists(harness, hub);
-    for (const spoke of spokes) {
-      await assertAgentExists(harness, spoke);
-    }
-
-    // Hub fans out to all spokes
-    for (const spoke of spokes) {
-      await harness.sendMessage({
-        to: spoke,
-        from: hub,
-        text: `Task for ${spoke}`,
-      });
-    }
-    await sleep(5_000);
-
-    // Spokes report back to hub
-    for (const spoke of spokes) {
-      await harness.sendMessage({
-        to: hub,
-        from: spoke,
-        text: `DONE: ${spoke} completed`,
-      });
-    }
-    await sleep(5_000);
-
-    // Verify deliveries
-    const events = harness.getEvents();
-    assertNoDroppedDeliveries(events);
-
-    // Hub-spoke sends 8 messages total (4 out + 4 back).
-    const uniqueDeliveryIds = countUniqueDeliveryEventIds(events);
-    assert.ok(
-      uniqueDeliveryIds >= 8,
-      `should have delivery progress for at least 8 messages, got ${uniqueDeliveryIds}`
-    );
-
-    // Clean up
-    await harness.releaseAgent(hub);
-    for (const spoke of spokes) {
-      await harness.releaseAgent(spoke);
-    }
-    await sleep(3_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-test('ci: pipeline pattern — sequential message flow', { timeout: 45_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const stage1 = `stage1-${suffix}`;
-    const stage2 = `stage2-${suffix}`;
-    const stage3 = `stage3-${suffix}`;
-
-    // Spawn pipeline stages
-    await harness.spawnAgent(stage1, CI_TEST_CLI, ['pipeline']);
-    await harness.spawnAgent(stage2, CI_TEST_CLI, ['pipeline']);
-    await harness.spawnAgent(stage3, CI_TEST_CLI, ['pipeline']);
-    await sleep(5_000);
-
-    // Pipeline: stage1 → stage2 → stage3
-    await harness.sendMessage({
-      to: stage1,
-      from: 'input',
-      text: 'Initial data',
-    });
-    await sleep(2_000);
-
-    await harness.sendMessage({
-      to: stage2,
-      from: stage1,
-      text: 'Processed by stage1',
-    });
-    await sleep(2_000);
-
-    await harness.sendMessage({
-      to: stage3,
-      from: stage2,
-      text: 'Processed by stage2',
-    });
-    await sleep(3_000);
-
-    // Verify all stages received messages
-    const events = harness.getEvents();
-    assertNoDroppedDeliveries(events);
-
-    assert.ok(countDeliveryProgress(events, stage1) >= 1, 'stage1 should receive delivery progress');
-    assert.ok(countDeliveryProgress(events, stage2) >= 1, 'stage2 should receive delivery progress');
-    assert.ok(countDeliveryProgress(events, stage3) >= 1, 'stage3 should receive delivery progress');
-
-    // Clean up
-    await harness.releaseAgent(stage1);
-    await harness.releaseAgent(stage2);
-    await harness.releaseAgent(stage3);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Channel-Based Coordination ───────────────────────────────────────────────
-
-test('ci: channel broadcast — message to all agents on channel', { timeout: 45_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-  const channelName = `ci-channel-${suffix}`;
-
-  try {
-    const agent1 = `agent1-${suffix}`;
-    const agent2 = `agent2-${suffix}`;
-    const agent3 = `agent3-${suffix}`;
-
-    // All agents join same channel
-    await harness.spawnAgent(agent1, CI_TEST_CLI, [channelName]);
-    await harness.spawnAgent(agent2, CI_TEST_CLI, [channelName]);
-    await harness.spawnAgent(agent3, CI_TEST_CLI, [channelName]);
-    await sleep(5_000);
-
-    // Broadcast to channel. In broker-only mode this may route through Relaycast and
-    // fail with relaycast_publish_failed when channel registration is unavailable.
-    let publishFailed = false;
-    try {
-      const result = await harness.sendMessage({
-        to: `#${channelName}`,
-        from: agent1,
-        text: 'Broadcast: all agents report status',
-      });
-      assert.ok(result.event_id, 'broadcast should get event_id');
-    } catch (error) {
-      const code = (error as { code?: string })?.code;
-      assert.equal(code, 'relaycast_publish_failed', 'unexpected channel publish error');
-      publishFailed = true;
-    }
-
-    await sleep(5_000);
-
-    const events = harness.getEvents();
-    if (publishFailed) {
-      const publishFailures = events.filter((event) => event.kind === 'relaycast_publish_failed');
-      assert.ok(publishFailures.length >= 1, 'should emit relaycast_publish_failed for channel broadcast');
-    }
-    assertNoDroppedDeliveries(events);
-
-    // Clean up
-    await harness.releaseAgent(agent1);
-    await harness.releaseAgent(agent2);
-    await harness.releaseAgent(agent3);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Lifecycle Tests ──────────────────────────────────────────────────────────
-
-test('ci: agent lifecycle — spawn, release, re-spawn', { timeout: 45_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const agentName = `lifecycle-${uniqueSuffix()}`;
-
-  try {
-    // First spawn
-    await harness.spawnAgent(agentName, CI_TEST_CLI, ['lifecycle']);
-    await sleep(3_000);
-    await assertAgentExists(harness, agentName);
-
-    // Release
-    await harness.releaseAgent(agentName);
-    await sleep(3_000);
-    await assertAgentNotExists(harness, agentName);
-
-    // Re-spawn with same name
-    await harness.spawnAgent(agentName, CI_TEST_CLI, ['lifecycle']);
-    await sleep(3_000);
-    await assertAgentExists(harness, agentName);
-
-    // Verify events
-    const events = harness.getEvents();
-    const spawnEvents = events.filter(
-      (e) =>
-        e.kind === 'agent_spawned' && 'name' in e && (e as BrokerEvent & { name: string }).name === agentName
-    );
-    const releaseEvents = events.filter(
-      (e) =>
-        e.kind === 'agent_released' && 'name' in e && (e as BrokerEvent & { name: string }).name === agentName
-    );
-
-    assert.equal(spawnEvents.length, 2, 'should have 2 spawn events');
-    assert.equal(releaseEvents.length, 1, 'should have 1 release event');
-
-    // Clean up
-    await harness.releaseAgent(agentName);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-test('ci: rapid spawn/release — 5 agents in sequence', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    for (let i = 0; i < 5; i++) {
-      const name = `rapid-${i}-${suffix}`;
-      await harness.spawnAgent(name, CI_TEST_CLI, ['rapid']);
-      await sleep(2_000);
-      await assertAgentExists(harness, name);
-      await harness.releaseAgent(name);
-      await sleep(2_000);
-      await assertAgentNotExists(harness, name);
-    }
-
-    // Verify events
-    const events = harness.getEvents();
-    const spawnCount = events.filter((e) => e.kind === 'agent_spawned').length;
-    const releaseCount = events.filter(
-      (e) => e.kind === 'agent_released' || e.kind === 'agent_exited'
-    ).length;
-
-    assert.ok(spawnCount >= 5, `should have at least 5 spawns, got ${spawnCount}`);
-    assert.ok(releaseCount >= 5, `should have at least 5 releases, got ${releaseCount}`);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Error Handling ───────────────────────────────────────────────────────────
-
-test('ci: duplicate agent name — second spawn fails', { timeout: 30_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const agentName = `dup-${uniqueSuffix()}`;
-
-  try {
-    // First spawn succeeds
-    await harness.spawnAgent(agentName, CI_TEST_CLI, ['dup-test']);
-    await sleep(3_000);
-    await assertAgentExists(harness, agentName);
-
-    // Second spawn with same name should fail
-    await assert.rejects(
-      () => harness.spawnAgent(agentName, CI_TEST_CLI, ['dup-test']),
-      'spawning duplicate name should reject'
-    );
-
-    // Clean up
-    await harness.releaseAgent(agentName);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-test('ci: message to non-existent agent — delivery dropped', { timeout: 30_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-
-  try {
-    const sender = `sender-${uniqueSuffix()}`;
-    await harness.spawnAgent(sender, CI_TEST_CLI, ['general']);
-    await sleep(3_000);
-
-    // Send message to an unknown target. In broker-only mode this can either
-    // return an accepted event_id or fail with relaycast_publish_failed.
-    let accepted = false;
-    try {
-      const result = await harness.sendMessage({
-        to: `ghost-agent-${uniqueSuffix()}`,
-        from: sender,
-        text: 'Message to nowhere',
-      });
-      assert.ok(result.event_id, 'should get event_id when unknown target is accepted');
-      accepted = true;
-    } catch (error) {
-      const code = (error as { code?: string })?.code;
-      assert.equal(code, 'relaycast_publish_failed', 'unexpected unknown-target error');
-    }
-
-    await sleep(3_000);
-    const events = harness.getEvents();
-    if (!accepted) {
-      const publishFailures = events.filter((event) => event.kind === 'relaycast_publish_failed');
-      assert.ok(publishFailures.length >= 1, 'should emit relaycast_publish_failed for unknown target');
-    }
-
-    await harness.releaseAgent(sender);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Parallel Operations ──────────────────────────────────────────────────────
-
-test('ci: parallel spawn — 6 agents at once', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const names = [
-      `par1-${suffix}`,
-      `par2-${suffix}`,
-      `par3-${suffix}`,
-      `par4-${suffix}`,
-      `par5-${suffix}`,
-      `par6-${suffix}`,
-    ];
-
-    // Spawn all in parallel
-    await Promise.all(names.map((name) => harness.spawnAgent(name, CI_TEST_CLI, ['parallel'])));
-    await sleep(8_000);
-
-    // Verify all alive
-    const agents = await harness.listAgents();
-    for (const name of names) {
-      assert.ok(
-        agents.some((a) => a.name === name),
-        `${name} should be alive`
-      );
-    }
-
-    // Send messages to all in parallel
-    await Promise.all(
-      names.map((name) =>
-        harness.sendMessage({
-          to: name,
-          from: 'ci-runner',
-          text: `Ping ${name}`,
-        })
-      )
-    );
-    await sleep(5_000);
-
-    // Verify deliveries
-    const events = harness.getEvents();
-    const uniqueDeliveryIds = countUniqueDeliveryEventIds(events);
-    assert.ok(
-      uniqueDeliveryIds >= names.length,
-      `should have delivery progress for at least ${names.length} messages, got ${uniqueDeliveryIds}`
-    );
-    assertNoDroppedDeliveries(events);
-
-    // Clean up in parallel
-    await Promise.all(names.map((name) => harness.releaseAgent(name)));
-    await sleep(3_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Workflow Step Simulation ─────────────────────────────────────────────────
-
-test('ci: workflow steps — implement → review → consolidate → address', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const harness = createCiHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const implementer = `impl-${suffix}`;
-    const reviewer = `rev-${suffix}`;
-
-    await harness.spawnAgent(implementer, CI_TEST_CLI, ['workflow']);
-    await harness.spawnAgent(reviewer, CI_TEST_CLI, ['workflow']);
-    await sleep(5_000);
-
-    // Step 1: Implement
-    await harness.sendMessage({
-      to: implementer,
-      from: 'workflow-engine',
-      text: 'Step 1: Implement feature X',
-    });
-    await sleep(2_000);
-
-    // Step 2: Review (parallel with Step 1 completion)
-    await harness.sendMessage({
-      to: reviewer,
-      from: 'workflow-engine',
-      text: 'Step 2: Review implementation',
-    });
-    await sleep(2_000);
-
-    // Step 3: Consolidate (reviewer → implementer)
-    await harness.sendMessage({
-      to: implementer,
-      from: reviewer,
-      text: 'Step 3: Review feedback - found 2 issues',
-    });
-    await sleep(2_000);
-
-    // Step 4: Address feedback
-    await harness.sendMessage({
-      to: implementer,
-      from: 'workflow-engine',
-      text: 'Step 4: Address review feedback',
-    });
-    await sleep(3_000);
-
-    // Verify all steps executed
-    const events = harness.getEvents();
-    const implProgress = countDeliveryProgress(events, implementer);
-    const revProgress = countDeliveryProgress(events, reviewer);
-    assert.ok(
-      implProgress >= 2,
-      `implementer should have at least 2 delivery progress events, got ${implProgress}`
-    );
-    assert.ok(
-      revProgress >= 1,
-      `reviewer should have at least 1 delivery progress event, got ${revProgress}`
-    );
-    assertNoDroppedDeliveries(events);
-
-    // Clean up
-    await harness.releaseAgent(implementer);
-    await harness.releaseAgent(reviewer);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
diff --git a/tests/integration/broker/workflow-dag.test.ts b/tests/integration/broker/workflow-dag.test.ts
deleted file mode 100644
index 53c88e990..000000000
--- a/tests/integration/broker/workflow-dag.test.ts
+++ /dev/null
@@ -1,220 +0,0 @@
-/**
- * WorkflowRunner DAG behavior integration tests.
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertStepCompleted,
-  assertStepOrder,
-  assertStepsParallel,
-  assertWorkflowEventOrder,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-workflow-dag',
-    description: 'Integration test',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-a', agent: 'worker', task: 'Step A' },
-          { name: 'step-b', agent: 'worker', task: 'Step B', dependsOn: ['step-a'] },
-          { name: 'step-c', agent: 'worker', task: 'Step C', dependsOn: ['step-b'] },
-        ],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-dag-'));
-}
-
-test('workflow-dag: executes simple chain in order', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(makeConfig(), undefined, { cwd });
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepCompleted(result, 'step-c');
-    assertStepOrder(result, ['step-a', 'step-b', 'step-c']);
-    assertWorkflowEventOrder(result.events, [
-      'run:started',
-      'step:started',
-      'step:completed',
-      'run:completed',
-    ]);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test(
-  'workflow-dag: runs parallel fan-in steps without ordering violations',
-  { timeout: 120_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start({ useRelaycast: false });
-
-    try {
-      const result = await harness.runWorkflow(
-        makeConfig({
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                { name: 'step-a', agent: 'worker', task: 'A' },
-                { name: 'step-b', agent: 'worker', task: 'B' },
-                {
-                  name: 'step-c',
-                  agent: 'worker',
-                  task: 'C',
-                  dependsOn: ['step-a', 'step-b'],
-                },
-              ],
-            },
-          ],
-        }),
-        undefined,
-        { cwd }
-      );
-
-      assertStepCompleted(result, 'step-c');
-      assertStepsParallel(result, ['step-a', 'step-b']);
-      const cStart = result.events.findIndex(
-        (event) => event.type === 'step:started' && 'stepName' in event && event.stepName === 'step-c'
-      );
-      const aDone = result.events.findIndex(
-        (event) => event.type === 'step:completed' && 'stepName' in event && event.stepName === 'step-a'
-      );
-      const bDone = result.events.findIndex(
-        (event) => event.type === 'step:completed' && 'stepName' in event && event.stepName === 'step-b'
-      );
-      assert.ok(cStart > aDone, 'step-c should start after step-a completes');
-      assert.ok(cStart > bDone, 'step-c should start after step-b completes');
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-test('workflow-dag: supports diamond dependencies (A→B,C→D)', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'step-a', agent: 'worker', task: 'A' },
-              { name: 'step-b', agent: 'worker', task: 'B', dependsOn: ['step-a'] },
-              { name: 'step-c', agent: 'worker', task: 'C', dependsOn: ['step-a'] },
-              { name: 'step-d', agent: 'worker', task: 'D', dependsOn: ['step-b', 'step-c'] },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertStepCompleted(result, 'step-d');
-    assertStepsParallel(result, ['step-b', 'step-c']);
-    const dStart = result.events.findIndex(
-      (event) => event.type === 'step:started' && 'stepName' in event && event.stepName === 'step-d'
-    );
-    const bDone = result.events.findIndex(
-      (event) => event.type === 'step:completed' && 'stepName' in event && event.stepName === 'step-b'
-    );
-    const cDone = result.events.findIndex(
-      (event) => event.type === 'step:completed' && 'stepName' in event && event.stepName === 'step-c'
-    );
-    assert.ok(dStart > bDone, 'step-d should start after step-b completes');
-    assert.ok(dStart > cDone, 'step-d should start after step-c completes');
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepCompleted(result, 'step-c');
-    assertStepCompleted(result, 'step-d');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-dag: detects dependency cycle', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    await assert.rejects(
-      () =>
-        harness.runWorkflow(
-          makeConfig({
-            workflows: [
-              {
-                name: 'default',
-                steps: [
-                  { name: 'step-a', agent: 'worker', task: 'A', dependsOn: ['step-c'] },
-                  { name: 'step-b', agent: 'worker', task: 'B', dependsOn: ['step-a'] },
-                  { name: 'step-c', agent: 'worker', task: 'C', dependsOn: ['step-b'] },
-                ],
-              },
-            ],
-          }),
-          undefined,
-          { cwd }
-        ),
-      /dependency cycle/
-    );
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/workflow-lifecycle.test.ts b/tests/integration/broker/workflow-lifecycle.test.ts
deleted file mode 100644
index c3870b506..000000000
--- a/tests/integration/broker/workflow-lifecycle.test.ts
+++ /dev/null
@@ -1,186 +0,0 @@
-/**
- * WorkflowRunner lifecycle integration tests.
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig, VerificationCheck } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertRunFailed,
-  assertStepCompleted,
-  assertStepFailed,
-  assertWorkflowEventOrder,
-} from './utils/workflow-assert-helpers.js';
-import { sleep } from './utils/cli-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-workflow-lifecycle',
-    description: 'Integration test',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [{ name: 'step-1', agent: 'worker', task: 'Do one thing' }],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-lifecycle-'));
-}
-
-test('workflow-lifecycle: run completes successfully', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(makeConfig(), undefined, { cwd });
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-1');
-    assertWorkflowEventOrder(result.events, [
-      'run:started',
-      'step:started',
-      'step:completed',
-      'run:completed',
-    ]);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-lifecycle: failed run emits failed events', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  const failingVerification: VerificationCheck = {
-    type: 'output_contains',
-    value: 'MUST_NOT_APPEAR',
-  };
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-1',
-                agent: 'worker',
-                task: 'Do one thing',
-                verification: failingVerification,
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunFailed(result);
-    assertStepFailed(result, 'step-1');
-    assertWorkflowEventOrder(result.events, ['run:started', 'step:started', 'step:failed', 'run:failed']);
-    assert.equal(result.run.error !== undefined, true, 'Expected run error');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-lifecycle: abort cancels a running workflow', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const runPromise = harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-slow',
-                type: 'deterministic',
-                command: 'sleep 30',
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    // Wait for the step to actually start running before aborting
-    let currentRunner = harness.getCurrentRunner();
-    for (let i = 0; i < 20 && !currentRunner; i += 1) {
-      await sleep(250);
-      currentRunner = harness.getCurrentRunner();
-    }
-    assert.ok(currentRunner, 'Expected workflow runner to be available while running');
-
-    // Wait for step:started event before aborting so the step is actually in-flight
-    await new Promise<void>((resolve) => {
-      const unsub = currentRunner!.on((event) => {
-        if (event.type === 'step:started') {
-          unsub();
-          resolve();
-        }
-      });
-    });
-    currentRunner.abort();
-
-    const result = await runPromise;
-    assert.equal(result.run.status, 'cancelled', `Expected run to be cancelled, got "${result.run.status}"`);
-    assert.ok(
-      result.events.some((event) => event.type === 'run:cancelled'),
-      'Expected run:cancelled event'
-    );
-    assert.ok(
-      result.events.some((event) => event.type === 'step:failed'),
-      'Expected abort to fail the in-flight step'
-    );
-    assertWorkflowEventOrder(result.events, ['run:started', 'step:started', 'step:failed', 'run:cancelled']);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/workflow-models.test.ts b/tests/integration/broker/workflow-models.test.ts
deleted file mode 100644
index 033ecfe06..000000000
--- a/tests/integration/broker/workflow-models.test.ts
+++ /dev/null
@@ -1,147 +0,0 @@
-/**
- * Workflow model-flag integration tests.
- *
- * Verifies that constraints.model is forwarded to CLI invocations for
- * non-interactive workflow agents.
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness, type WorkflowRunResult } from './utils/workflow-harness.js';
-import { assertRunCompleted, assertStepCompleted } from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-models-'));
-}
-
-function skipIfRateLimited(t: TestContext, result: WorkflowRunResult): boolean {
-  const errors = [
-    result.run.error ?? '',
-    ...result.events
-      .filter((event): event is typeof event & { error: string } => {
-        return 'error' in event && typeof event.error === 'string';
-      })
-      .map((event) => event.error),
-  ];
-  const rateLimitError = errors.find((error) => /rate limit exceeded|too many requests|429/iu.test(error));
-  if (!rateLimitError) return false;
-  t.skip(`Relaycast API rate limit in test environment: ${rateLimitError}`);
-  return true;
-}
-
-function installArgCaptureScript(
-  harness: WorkflowRunnerHarness,
-  cliName: 'claude' | 'codex',
-  captureFile: string,
-  output: string
-): void {
-  const fakeCliDir = harness.getRelayEnv().PATH?.split(path.delimiter)[0];
-  assert.ok(fakeCliDir, 'Expected fake CLI directory in PATH');
-
-  const script = `#!/usr/bin/env bash
-CAPTURE_FILE=${JSON.stringify(captureFile)}
-printf '%s\n' "$@" > "$CAPTURE_FILE"
-echo ${JSON.stringify(output)}
-`;
-
-  fs.writeFileSync(path.join(fakeCliDir, cliName), script, { mode: 0o755 });
-}
-
-function makeConfig(cli: 'claude' | 'codex', model: string, output: string): RelayYamlConfig {
-  return {
-    version: '1',
-    name: `test-workflow-models-${cli}`,
-    description: 'Model forwarding integration test',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli, interactive: false, constraints: { model } }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'step-model',
-            agent: 'worker',
-            task: 'Print DONE',
-            verification: { type: 'output_contains', value: output },
-          },
-        ],
-      },
-    ],
-  };
-}
-
-function assertModelFlag(captureFile: string, expectedModel: string): void {
-  const args = fs
-    .readFileSync(captureFile, 'utf8')
-    .split('\n')
-    .map((arg) => arg.trim())
-    .filter((arg) => arg.length > 0);
-
-  const modelFlagIndex = args.indexOf('--model');
-  assert.notEqual(modelFlagIndex, -1, `Expected --model flag in args: ${JSON.stringify(args)}`);
-  assert.equal(
-    args[modelFlagIndex + 1],
-    expectedModel,
-    `Expected model value "${expectedModel}" after --model, got ${JSON.stringify(args)}`
-  );
-}
-
-test('workflow-models: forwards constraints.model for claude', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const captureFile = path.join(cwd, 'claude-args.txt');
-  const output = 'DONE_CLAUDE';
-  const model = 'claude-sonnet-4-5';
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-  installArgCaptureScript(harness, 'claude', captureFile, output);
-
-  try {
-    const result = await harness.runWorkflow(makeConfig('claude', model, output), undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-model');
-    assertModelFlag(captureFile, model);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-models: forwards constraints.model for codex', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const captureFile = path.join(cwd, 'codex-args.txt');
-  const output = 'DONE_CODEX';
-  const model = 'gpt-5-codex';
-  const harness = new WorkflowRunnerHarness();
-  await harness.start();
-  installArgCaptureScript(harness, 'codex', captureFile, output);
-
-  try {
-    const result = await harness.runWorkflow(makeConfig('codex', model, output), undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-model');
-    assertModelFlag(captureFile, model);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/workflow-noninteractive.test.ts b/tests/integration/broker/workflow-noninteractive.test.ts
deleted file mode 100644
index acaedd49c..000000000
--- a/tests/integration/broker/workflow-noninteractive.test.ts
+++ /dev/null
@@ -1,365 +0,0 @@
-/**
- * Integration tests for non-interactive agent subprocess behavior.
- *
- * These tests use the *real* `claude -p` CLI to exercise the actual subprocess
- * spawning code path, including .mcp.json loading. Fakes/stubs are deliberately
- * avoided so we catch real hangs and real env-propagation failures.
- *
- * Bugs targeted:
- *   1. RELAY_API_KEY (and relay.env vars) not propagated to non-interactive
- *      subprocesses — execNonInteractive used { ...process.env } instead of
- *      getRelayEnv(), so the MCP server started unauthenticated and could hang.
- *   2. Swarm-level timeoutMs was not the fallback for non-interactive steps,
- *      meaning steps without an explicit timeoutMs ran with no deadline.
- *
- * Run from a terminal (not inside Claude Code):
- *   node --test tests/integration/broker/dist/workflow-noninteractive.test.js
- */
-
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import { execSync } from 'node:child_process';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { WorkflowRunner } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites, ensureApiKey, resolveBinaryPath } from './utils/broker-harness.js';
-
-// ── Guards ───────────────────────────────────────────────────────────────────
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function skipIfNestedClaude(t: TestContext): boolean {
-  if (process.env.CLAUDECODE) {
-    t.skip('Cannot run nested claude sessions — run from a terminal, not inside Claude Code');
-    return true;
-  }
-  return false;
-}
-
-function skipIfNoClaude(t: TestContext): boolean {
-  try {
-    execSync('which claude', { stdio: 'ignore' });
-    return false;
-  } catch {
-    t.skip('claude CLI not found in PATH');
-    return true;
-  }
-}
-
-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-ni-'));
-}
-
-function createEnvEchoCliDir(cliName: string): string {
-  const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-ni-cli-'));
-  const scriptPath = path.join(dir, cliName);
-  const script = `#!/usr/bin/env bash
-printf 'RELAY_LLM_PROXY=%s\n' "\${RELAY_LLM_PROXY:-}"
-printf 'RELAY_LLM_PROXY_URL=%s\n' "\${RELAY_LLM_PROXY_URL:-}"
-printf 'CREDENTIAL_PROXY_TOKEN=%s\n' "\${CREDENTIAL_PROXY_TOKEN:-}"
-printf 'RELAY_LLM_PROXY_TOKEN=%s\n' "\${RELAY_LLM_PROXY_TOKEN:-}"
-printf 'OPENAI_API_KEY=%s\n' "\${OPENAI_API_KEY:-}"
-`;
-  fs.writeFileSync(scriptPath, script, { mode: 0o755 });
-  return dir;
-}
-
-/** Copy the project .mcp.json into workdir so claude loads the MCP server. */
-function injectMcpJson(workdir: string): void {
-  const src = path.resolve(path.dirname(new URL(import.meta.url).pathname), '../../../../.mcp.json');
-  if (fs.existsSync(src)) {
-    fs.copyFileSync(src, path.join(workdir, '.mcp.json'));
-  }
-}
-
-function makeNonInteractiveConfig(
-  overrides: Partial<RelayYamlConfig> & {
-    task: string;
-    timeoutMs?: number;
-    verification?: { type: 'output_contains'; value: string };
-    swarmTimeoutMs?: number;
-    stepTimeoutMs?: number;
-  }
-): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'test-ni',
-    description: 'Non-interactive subprocess integration test',
-    swarm: {
-      pattern: 'pipeline',
-      timeoutMs: overrides.swarmTimeoutMs,
-    },
-    agents: [
-      {
-        name: 'analyst',
-        cli: 'claude',
-        interactive: false,
-        constraints: { model: 'haiku' },
-      },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'check',
-            agent: 'analyst',
-            task: overrides.task,
-            timeoutMs: overrides.stepTimeoutMs,
-            ...(overrides.verification ? { verification: overrides.verification } : {}),
-          },
-        ],
-      },
-    ],
-  };
-}
-
-async function runWorkflow(
-  config: RelayYamlConfig,
-  workdir: string,
-  relayEnv?: NodeJS.ProcessEnv
-): Promise<{ status: string; error?: string; stepError?: string; stepOutput?: string }> {
-  const apiKey = await ensureApiKey();
-  const env = {
-    ...process.env,
-    RELAY_API_KEY: apiKey,
-    ...relayEnv,
-  };
-
-  const runner = new WorkflowRunner({
-    cwd: workdir,
-    relay: {
-      binaryPath: resolveBinaryPath(),
-      env,
-    },
-  });
-
-  const events: Array<{ type: string; error?: string; stepName?: string; output?: string }> = [];
-  runner.on((event) => events.push(event as (typeof events)[0]));
-
-  try {
-    const run = await runner.execute(config, 'default');
-
-    const stepFailed = events.find((e) => e.type === 'step:failed' && e.stepName === 'check');
-    const stepCompleted = events.find((e) => e.type === 'step:completed' && e.stepName === 'check');
-
-    return {
-      status: run.status,
-      error: run.error,
-      stepError: stepFailed?.error,
-      stepOutput: stepCompleted?.output,
-    };
-  } catch (err: unknown) {
-    return {
-      status: 'failed',
-      error: err instanceof Error ? err.message : String(err),
-    };
-  }
-}
-
-// ── Test 1: relay.env vars propagated to non-interactive subprocess ───────────
-//
-// A unique sentinel env var is set in relay.env but NOT in process.env.
-// The agent asks claude to output its value. Before the fix, the sentinel was
-// invisible to the subprocess (process.env spread only). After the fix,
-// getRelayEnv() spreads relay.env into the subprocess env.
-
-test(
-  'non-interactive: relay.env vars reach subprocess (regression for env propagation bug)',
-  { timeout: 180_000 },
-  async (t) => {
-    if (skipIfMissing(t) || skipIfNestedClaude(t) || skipIfNoClaude(t)) return;
-
-    const workdir = createWorkdir();
-
-    // Unique sentinel — deliberately NOT set in process.env, only in relay.env
-    const sentinelKey = 'RELAY_NI_SUBPROCESS_TEST';
-    const sentinelValue = `sentinel-${Date.now().toString(36)}`;
-
-    // Temporarily ensure sentinel is absent from process.env
-    const prevSentinel = process.env[sentinelKey];
-    delete process.env[sentinelKey];
-
-    try {
-      const result = await runWorkflow(
-        makeNonInteractiveConfig({
-          task:
-            `Check the environment variable named "${sentinelKey}". ` +
-            `If it is set and non-empty, output exactly: SENTINEL=${sentinelValue} ` +
-            `If it is missing or empty, output exactly: SENTINEL=NOT_FOUND`,
-          verification: { type: 'output_contains', value: `SENTINEL=${sentinelValue}` },
-          stepTimeoutMs: 120_000,
-        }),
-        workdir,
-        { [sentinelKey]: sentinelValue }
-      );
-
-      assert.equal(
-        result.status,
-        'completed',
-        `Workflow should complete — env var was not propagated to subprocess.\n` +
-          `Error: ${result.error ?? result.stepError ?? '(none)'}`
-      );
-    } finally {
-      if (prevSentinel !== undefined) process.env[sentinelKey] = prevSentinel;
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
-
-test(
-  'non-interactive: legacy proxy env names are normalized and reach subprocesses',
-  { timeout: 60_000 },
-  async (t) => {
-    if (skipIfMissing(t) || skipIfNestedClaude(t)) return;
-
-    const workdir = createWorkdir();
-    const fakeCliDir = createEnvEchoCliDir('claude');
-
-    try {
-      const config = makeNonInteractiveConfig({
-        task: 'Print the current proxy-related environment variables.',
-        verification: { type: 'output_contains', value: 'RELAY_LLM_PROXY=https://legacy.proxy.local' },
-        stepTimeoutMs: 30_000,
-      });
-      config.agents[0] = {
-        ...config.agents[0],
-        credentials: { proxy: true },
-      } as any;
-
-      const result = await runWorkflow(config, workdir, {
-        PATH: `${fakeCliDir}${path.delimiter}${process.env.PATH ?? ''}`,
-        RELAY_LLM_PROXY_URL: 'https://legacy.proxy.local',
-        RELAY_LLM_PROXY_TOKEN: 'legacy-token',
-        OPENAI_API_KEY: 'should-strip',
-      });
-
-      assert.equal(result.status, 'completed', result.error ?? result.stepError ?? '(no error)');
-      assert.match(result.stepOutput ?? '', /RELAY_LLM_PROXY=https:\/\/legacy\.proxy\.local/);
-      assert.match(result.stepOutput ?? '', /RELAY_LLM_PROXY_URL=https:\/\/legacy\.proxy\.local/);
-      assert.match(result.stepOutput ?? '', /CREDENTIAL_PROXY_TOKEN=legacy-token/);
-      assert.match(result.stepOutput ?? '', /RELAY_LLM_PROXY_TOKEN=legacy-token/);
-      assert.doesNotMatch(result.stepOutput ?? '', /OPENAI_API_KEY=should-strip/);
-    } finally {
-      fs.rmSync(fakeCliDir, { recursive: true, force: true });
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
-
-// ── Test 2: Non-interactive agent with .mcp.json completes without hanging ────
-//
-// This reproduces the real-world stall: when RELAY_API_KEY was absent from the
-// subprocess env, the relaycast MCP server started unauthenticated and could
-// hang indefinitely, producing 0 bytes of output. The step timeout enforces a
-// bound and after the fix the step should complete well within it.
-
-test(
-  'non-interactive: completes without hang when .mcp.json is present (regression for MCP stall)',
-  { timeout: 180_000 },
-  async (t) => {
-    if (skipIfMissing(t) || skipIfNestedClaude(t) || skipIfNoClaude(t)) return;
-
-    const workdir = createWorkdir();
-    // Drop .mcp.json so claude loads the relaycast MCP server, exactly as in
-    // the real failing workflow (tests/workflows/relay.clean-step-output.yaml).
-    injectMcpJson(workdir);
-
-    const start = Date.now();
-
-    try {
-      const result = await runWorkflow(
-        makeNonInteractiveConfig({
-          task: 'Output exactly: ANALYSIS_DONE',
-          verification: { type: 'output_contains', value: 'ANALYSIS_DONE' },
-          // Give 90 s — far more than needed for a trivial task; a genuine hang
-          // would blow this ceiling and the test assertion catches the timeout.
-          stepTimeoutMs: 90_000,
-        }),
-        workdir
-      );
-
-      const elapsed = Date.now() - start;
-
-      assert.equal(
-        result.status,
-        'completed',
-        `Workflow should complete quickly. After ${elapsed}ms got status="${result.status}". ` +
-          `Error: ${result.error ?? result.stepError ?? '(none)'}\n` +
-          `If this timed out, the MCP server likely hung because RELAY_API_KEY was missing ` +
-          `from the subprocess env.`
-      );
-
-      // A task this simple (output one word) should finish in well under 60 s
-      // even accounting for API latency. If it's taking longer, something is stuck.
-      assert.ok(
-        elapsed < 60_000,
-        `Expected trivial task to finish in < 60 s, took ${elapsed}ms. ` +
-          `Possible MCP stall — RELAY_API_KEY may not be reaching the subprocess.`
-      );
-    } finally {
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
-
-// ── Test 3: Swarm-level timeoutMs enforced for non-interactive steps ──────────
-//
-// Before the fix, timeoutMs = step.timeoutMs ?? agentDef.constraints?.timeoutMs
-// — the swarm.timeoutMs was never consulted for non-interactive steps, so a
-// step with no explicit timeout ran with no deadline at all.
-//
-// After the fix the fallback chain includes swarm.timeoutMs and a 2 s swarm
-// timeout kills the real claude subprocess before it can complete, producing a
-// timeout error rather than hanging forever.
-
-test(
-  'non-interactive: swarm.timeoutMs enforced when no step or agent timeout set (regression)',
-  { timeout: 60_000 },
-  async (t) => {
-    if (skipIfMissing(t) || skipIfNestedClaude(t) || skipIfNoClaude(t)) return;
-
-    const workdir = createWorkdir();
-
-    try {
-      const result = await runWorkflow(
-        makeNonInteractiveConfig({
-          // Any non-trivial task — claude startup + API round-trip takes > 2 s,
-          // so a 2 s swarm timeout should always fire before completion.
-          task: 'Count from 1 to 1000 and print every number.',
-          // Deliberately omit stepTimeoutMs and agentDef.constraints.timeoutMs
-          // so only swarm.timeoutMs can enforce a deadline.
-          swarmTimeoutMs: 2_000,
-        }),
-        workdir
-      );
-
-      assert.equal(
-        result.status,
-        'failed',
-        `Expected step to fail with a timeout — swarm.timeoutMs was not enforced.\n` +
-          `Got status="${result.status}". If "completed", the timeout was ignored.`
-      );
-
-      const errorText = result.error ?? result.stepError ?? '';
-      assert.ok(
-        errorText.toLowerCase().includes('timed out') || errorText.toLowerCase().includes('timeout'),
-        `Expected a timeout error, got: "${errorText}"`
-      );
-    } finally {
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
diff --git a/tests/integration/broker/workflow-patterns.test.ts b/tests/integration/broker/workflow-patterns.test.ts
deleted file mode 100644
index 3eb1ea40b..000000000
--- a/tests/integration/broker/workflow-patterns.test.ts
+++ /dev/null
@@ -1,497 +0,0 @@
-/**
- * WorkflowRunner pattern and run behavior integration tests.
- *
- * Tests cover: fan-out diamond, DAG with verification, pipeline sequential,
- * hub-spoke fan, review-loop, error handling (fail-fast and continue),
- * builder API, and maxConcurrency configuration.
- */
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import { workflow, type RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness, type WorkflowRunResult } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertStepCompleted,
-  assertStepOrder,
-  assertStepsParallel,
-  assertRunFailed,
-  assertStepFailed,
-  assertStepSkipped,
-  assertStepOutput,
-  assertStepCount,
-} from './utils/workflow-assert-helpers.js';
-
-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-workflow-patterns',
-    description: 'Integration test',
-    swarm: { pattern: 'fan-out' },
-    agents: [
-      { name: 'coordinator', cli: 'claude', interactive: false },
-      { name: 'worker-a', cli: 'claude', interactive: false },
-      { name: 'worker-b', cli: 'claude', interactive: false },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-a', agent: 'coordinator', task: 'Start' },
-          { name: 'step-b', agent: 'worker-a', task: 'Branch A', dependsOn: ['step-a'] },
-          { name: 'step-c', agent: 'worker-b', task: 'Branch B', dependsOn: ['step-a'] },
-          { name: 'step-d', agent: 'coordinator', task: 'Merge', dependsOn: ['step-b', 'step-c'] },
-        ],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-patterns-'));
-}
-
-function skipIfRateLimited(t: TestContext, result: WorkflowRunResult): boolean {
-  const errors = [
-    result.run.error ?? '',
-    ...result.events
-      .filter((event): event is typeof event & { error: string } => {
-        return 'error' in event && typeof event.error === 'string';
-      })
-      .map((event) => event.error),
-  ];
-  const rateLimitError = errors.find((error) => /rate limit exceeded|too many requests|429/iu.test(error));
-  if (!rateLimitError) return false;
-  t.skip(`Relaycast API rate limit in test environment: ${rateLimitError}`);
-  return true;
-}
-
-// ── Tests ────────────────────────────────────────────────────────────────────
-
-test('workflow-patterns: fan-out pattern executes diamond workflow', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(makeConfig(), undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepCompleted(result, 'step-c');
-    assertStepCompleted(result, 'step-d');
-    assertStepOrder(result, ['step-a', 'step-b', 'step-d']);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-patterns: dag pattern with verification gate', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const config = makeConfig({
-      name: 'test-dag-verification',
-      swarm: { pattern: 'dag' },
-      agents: [
-        { name: 'coordinator', cli: 'claude', interactive: false },
-        { name: 'worker-a', cli: 'claude', interactive: false },
-        { name: 'worker-b', cli: 'claude', interactive: false },
-      ],
-      workflows: [
-        {
-          name: 'default',
-          steps: [
-            { name: 'init', agent: 'coordinator', task: 'Initialize the workflow' },
-            { name: 'analyze', agent: 'worker-a', task: 'Analyze data', dependsOn: ['init'] },
-            { name: 'transform', agent: 'worker-b', task: 'Transform data', dependsOn: ['init'] },
-            {
-              name: 'verify',
-              type: 'deterministic',
-              command: 'echo VERIFIED',
-              dependsOn: ['analyze', 'transform'],
-              verification: { type: 'output_contains', value: 'VERIFIED' },
-            },
-            { name: 'report', agent: 'coordinator', task: 'Generate report', dependsOn: ['verify'] },
-          ],
-        },
-      ],
-    });
-
-    const result = await harness.runWorkflow(config, undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'init');
-    assertStepCompleted(result, 'analyze');
-    assertStepCompleted(result, 'transform');
-    assertStepCompleted(result, 'verify');
-    assertStepCompleted(result, 'report');
-    assertStepOrder(result, ['init', 'analyze', 'verify', 'report']);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-patterns: pipeline pattern executes sequentially', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const config = makeConfig({
-      name: 'test-pipeline-sequential',
-      swarm: { pattern: 'pipeline' },
-      agents: [
-        { name: 'stage-1', cli: 'claude', interactive: false },
-        { name: 'stage-2', cli: 'claude', interactive: false },
-      ],
-      workflows: [
-        {
-          name: 'default',
-          steps: [
-            { name: 'extract', agent: 'stage-1', task: 'Extract data from source' },
-            { name: 'transform', agent: 'stage-2', task: 'Transform extracted data', dependsOn: ['extract'] },
-            { name: 'load', agent: 'stage-1', task: 'Load transformed data', dependsOn: ['transform'] },
-            { name: 'validate', agent: 'stage-2', task: 'Validate loaded data', dependsOn: ['load'] },
-          ],
-        },
-      ],
-    });
-
-    const result = await harness.runWorkflow(config, undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'extract');
-    assertStepCompleted(result, 'transform');
-    assertStepCompleted(result, 'load');
-    assertStepCompleted(result, 'validate');
-    assertStepOrder(result, ['extract', 'transform', 'load', 'validate']);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-patterns: hub-spoke pattern fans to workers', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const config = makeConfig({
-      name: 'test-hub-spoke',
-      swarm: { pattern: 'hub-spoke' },
-      agents: [
-        { name: 'hub', cli: 'claude', interactive: false },
-        { name: 'spoke-a', cli: 'claude', interactive: false },
-        { name: 'spoke-b', cli: 'claude', interactive: false },
-        { name: 'spoke-c', cli: 'claude', interactive: false },
-      ],
-      workflows: [
-        {
-          name: 'default',
-          steps: [
-            { name: 'plan', agent: 'hub', task: 'Plan the work distribution' },
-            { name: 'spoke-a', agent: 'spoke-a', task: 'Process partition A', dependsOn: ['plan'] },
-            { name: 'spoke-b', agent: 'spoke-b', task: 'Process partition B', dependsOn: ['plan'] },
-            { name: 'spoke-c', agent: 'spoke-c', task: 'Process partition C', dependsOn: ['plan'] },
-            {
-              name: 'collect',
-              agent: 'hub',
-              task: 'Collect and merge results',
-              dependsOn: ['spoke-a', 'spoke-b', 'spoke-c'],
-            },
-          ],
-        },
-      ],
-    });
-
-    const result = await harness.runWorkflow(config, undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'plan');
-    assertStepCompleted(result, 'spoke-a');
-    assertStepCompleted(result, 'spoke-b');
-    assertStepCompleted(result, 'spoke-c');
-    assertStepCompleted(result, 'collect');
-    assertStepOrder(result, ['plan', 'spoke-a', 'collect']);
-    assertStepsParallel(result, ['spoke-a', 'spoke-b', 'spoke-c']);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-patterns: review-loop pattern with verification', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const config = makeConfig({
-      name: 'test-review-loop',
-      swarm: { pattern: 'review-loop' },
-      agents: [
-        { name: 'author', cli: 'claude', interactive: false },
-        { name: 'reviewer', cli: 'claude', interactive: false },
-      ],
-      workflows: [
-        {
-          name: 'default',
-          steps: [
-            { name: 'draft', agent: 'author', task: 'Write the initial draft' },
-            {
-              name: 'review',
-              agent: 'reviewer',
-              task: 'Review the draft and provide feedback',
-              dependsOn: ['draft'],
-            },
-          ],
-        },
-      ],
-    });
-
-    const result = await harness.runWorkflow(config, undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'draft');
-    assertStepCompleted(result, 'review');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-patterns: error handling fail-fast skips downstream', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const config = makeConfig({
-      name: 'test-fail-fast',
-      swarm: { pattern: 'dag' },
-      errorHandling: { strategy: 'fail-fast' },
-      agents: [
-        { name: 'worker-a', cli: 'claude', interactive: false },
-        { name: 'worker-b', cli: 'claude', interactive: false },
-      ],
-      workflows: [
-        {
-          name: 'default',
-          steps: [
-            { name: 'setup', agent: 'worker-a', task: 'Initialize environment' },
-            {
-              name: 'will-fail',
-              agent: 'worker-a',
-              task: 'This step will fail verification',
-              dependsOn: ['setup'],
-              verification: { type: 'output_contains', value: 'IMPOSSIBLE_STRING_NEVER_PRODUCED' },
-            },
-            {
-              name: 'downstream',
-              agent: 'worker-b',
-              task: 'This should be skipped',
-              dependsOn: ['will-fail'],
-            },
-          ],
-        },
-      ],
-    });
-
-    const result = await harness.runWorkflow(config, undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunFailed(result);
-    assertStepFailed(result, 'will-fail');
-    assertStepSkipped(result, 'downstream');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test(
-  'workflow-patterns: error handling continue completes despite failure',
-  { timeout: 120_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start({ useRelaycast: false });
-
-    try {
-      const config = makeConfig({
-        name: 'test-continue-on-error',
-        swarm: { pattern: 'dag' },
-        errorHandling: { strategy: 'continue' },
-        agents: [
-          { name: 'worker-a', cli: 'claude', interactive: false },
-          { name: 'worker-b', cli: 'claude', interactive: false },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'setup', agent: 'worker-a', task: 'Initialize environment' },
-              {
-                name: 'will-fail',
-                agent: 'worker-a',
-                task: 'This step will fail verification',
-                dependsOn: ['setup'],
-                verification: { type: 'output_contains', value: 'IMPOSSIBLE_STRING_NEVER_PRODUCED' },
-              },
-              {
-                name: 'independent',
-                agent: 'worker-b',
-                task: 'This runs independently of will-fail',
-                dependsOn: ['setup'],
-              },
-              {
-                name: 'final',
-                agent: 'worker-b',
-                task: 'Final aggregation step',
-                dependsOn: ['independent'],
-              },
-            ],
-          },
-        ],
-      });
-
-      const result = await harness.runWorkflow(config, undefined, { cwd });
-      if (skipIfRateLimited(t, result)) return;
-      assertRunCompleted(result);
-      assertStepFailed(result, 'will-fail');
-      assertStepCompleted(result, 'independent');
-      assertStepCompleted(result, 'final');
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-test('workflow-patterns: builder-generated config executes correctly', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const built = workflow('builder-pattern')
-      .pattern('fan-out')
-      .agent('coordinator', { cli: 'claude', interactive: false })
-      .agent('worker-a', { cli: 'claude', interactive: false })
-      .agent('worker-b', { cli: 'claude', interactive: false })
-      .step('step-a', { agent: 'coordinator', task: 'Start fan-out' })
-      .step('step-b', { agent: 'worker-a', task: 'Branch A', dependsOn: ['step-a'] })
-      .step('step-c', { agent: 'worker-b', task: 'Branch B', dependsOn: ['step-a'] })
-      .step('step-d', {
-        agent: 'coordinator',
-        task: 'Merge branches',
-        dependsOn: ['step-b', 'step-c'],
-      })
-      .toConfig();
-
-    const result = await harness.runWorkflow(built, undefined, { cwd });
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepCompleted(result, 'step-c');
-    assertStepCompleted(result, 'step-d');
-    assertStepOrder(result, ['step-a', 'step-b', 'step-d']);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-patterns: fan-out supports maxConcurrency config', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      {
-        ...makeConfig(),
-        swarm: { pattern: 'fan-out', maxConcurrency: 2 },
-        agents: [
-          { name: 'coordinator', cli: 'claude', interactive: false },
-          { name: 'worker-a', cli: 'claude', interactive: false },
-          { name: 'worker-b', cli: 'claude', interactive: false },
-          { name: 'worker-c', cli: 'claude', interactive: false },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'step-a', agent: 'coordinator', task: 'Start' },
-              { name: 'step-b', agent: 'worker-a', task: 'Branch A', dependsOn: ['step-a'] },
-              { name: 'step-c', agent: 'worker-b', task: 'Branch B', dependsOn: ['step-a'] },
-              { name: 'step-d', agent: 'worker-c', task: 'Branch C', dependsOn: ['step-a'] },
-              {
-                name: 'step-e',
-                agent: 'coordinator',
-                task: 'Done',
-                dependsOn: ['step-b', 'step-c', 'step-d'],
-              },
-            ],
-          },
-        ],
-      },
-      undefined,
-      { cwd }
-    );
-
-    if (skipIfRateLimited(t, result)) return;
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-e');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/workflow-relay-tools.test.ts b/tests/integration/broker/workflow-relay-tools.test.ts
deleted file mode 100644
index 11f23c2f0..000000000
--- a/tests/integration/broker/workflow-relay-tools.test.ts
+++ /dev/null
@@ -1,502 +0,0 @@
-/**
- * Workflow relay-tool integration tests.
- *
- * Verifies that agents spawned by the workflow runner can actually USE
- * Relaycast MCP tools — not just that the config is injected correctly.
- *
- * Bugs targeted:
- *   - Non-claude CLIs (codex, gemini, …) must call register_agent() before other
- *     relay tools. The workflow runner now injects a RELAY SETUP preamble
- *     into every non-claude interactive agent task.
- *   - Sub-agents spawned by leads via mcp__relaycast__add_agent never received an agent
- *     token. The broker's wrap.rs now pre-registers them with retry logic
- *     and passes the token via --config / RELAY_AGENT_TOKEN env var.
- *
- * Run (from repo root):
- *   npx tsc -p tests/integration/broker/tsconfig.json
- *   RELAY_INTEGRATION_REAL_CLI=1 \
- *     node --test tests/integration/broker/dist/workflow-relay-tools.test.js
- *
- * Individual CLI flavours can be forced:
- *   RELAY_INTEGRATION_REAL_CLI=1 RELAY_TEST_CLI=codex \
- *     node --test tests/integration/broker/dist/workflow-relay-tools.test.js
- */
-
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { WorkflowRunner } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites, ensureApiKey, resolveBinaryPath, uniqueSuffix } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertRunFailed,
-  assertStepCompleted,
-  assertStepFailed,
-} from './utils/workflow-assert-helpers.js';
-import { skipIfCliMissing, skipIfNotRealCli, isCliAvailable } from './utils/cli-helpers.js';
-
-// ── Guards ───────────────────────────────────────────────────────────────────
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function skipIfNestedClaude(t: TestContext): boolean {
-  if (process.env.CLAUDECODE) {
-    t.skip('Cannot run nested claude sessions — run from a terminal, not inside Claude Code');
-    return true;
-  }
-  return false;
-}
-
-// ── Helpers ──────────────────────────────────────────────────────────────────
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-rtools-'));
-}
-
-function createEnvEchoCliDir(cliName: string): string {
-  const dir = fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-rtools-cli-'));
-  const scriptPath = path.join(dir, cliName);
-  const script = `#!/usr/bin/env bash
-MARKER=""
-if [[ "\${RELAY_AGENT_NAME:-}" =~ ^(.+)-review-[A-Za-z0-9]+$ ]]; then
-  MARKER="STEP_COMPLETE:\${BASH_REMATCH[1]}"
-elif [[ "\${RELAY_AGENT_NAME:-}" =~ ^(.+)-(worker|owner)-[A-Za-z0-9]+$ ]]; then
-  MARKER="STEP_COMPLETE:\${BASH_REMATCH[1]}"
-elif [[ "\${RELAY_AGENT_NAME:-}" =~ ^(.+)-[A-Za-z0-9]+$ ]]; then
-  MARKER="STEP_COMPLETE:\${BASH_REMATCH[1]}"
-fi
-[[ -n "$MARKER" ]] && echo "$MARKER"
-printf 'RELAY_API_KEY=%s\n' "\${RELAY_API_KEY:-}"
-printf 'RELAY_LLM_PROXY=%s\n' "\${RELAY_LLM_PROXY:-}"
-printf 'RELAY_LLM_PROXY_URL=%s\n' "\${RELAY_LLM_PROXY_URL:-}"
-printf 'CREDENTIAL_PROXY_TOKEN=%s\n' "\${CREDENTIAL_PROXY_TOKEN:-}"
-printf 'RELAY_LLM_PROXY_TOKEN=%s\n' "\${RELAY_LLM_PROXY_TOKEN:-}"
-printf 'OPENAI_BASE_URL=%s\n' "\${OPENAI_BASE_URL:-}"
-printf 'OPENAI_API_KEY=%s\n' "\${OPENAI_API_KEY:-}"
-`;
-  fs.writeFileSync(scriptPath, script, { mode: 0o755 });
-  return dir;
-}
-
-/** Build a minimal single-step workflow config for an interactive agent. */
-function makeRelayToolWorkflow(opts: {
-  cli: string;
-  task: string;
-  verification?: { type: 'output_contains'; value: string };
-  stepTimeoutMs?: number;
-  swarmTimeoutMs?: number;
-}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: `test-relay-tools-${opts.cli}`,
-    description: 'Verify relay tool access in a workflow step',
-    swarm: {
-      pattern: 'pipeline',
-      timeoutMs: opts.swarmTimeoutMs ?? 300_000,
-    },
-    agents: [
-      {
-        name: 'worker',
-        cli: opts.cli as RelayYamlConfig['agents'][0]['cli'],
-        interactive: true,
-      },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'relay-check',
-            agent: 'worker',
-            task: opts.task,
-            timeoutMs: opts.stepTimeoutMs ?? 180_000,
-            ...(opts.verification ? { verification: opts.verification } : {}),
-          },
-        ],
-      },
-    ],
-  };
-}
-
-async function runRealWorkflow(
-  config: RelayYamlConfig,
-  workdir: string,
-  relayEnv?: NodeJS.ProcessEnv
-): Promise<{
-  status: string;
-  error?: string;
-  stepOutput?: string;
-  events: Array<{ type: string; stepName?: string; error?: string }>;
-}> {
-  const apiKey = await ensureApiKey();
-  const runner = new WorkflowRunner({
-    cwd: workdir,
-    relay: {
-      binaryPath: resolveBinaryPath(),
-      env: { ...process.env, RELAY_API_KEY: apiKey, ...relayEnv },
-    },
-  });
-
-  const events: Array<{ type: string; stepName?: string; error?: string }> = [];
-  runner.on((e) => events.push(e as (typeof events)[0]));
-
-  try {
-    const run = await runner.execute(config, 'default');
-    const stepCompleted = events.find((e) => e.type === 'step:completed' && e.stepName === 'relay-check') as
-      | { output?: string }
-      | undefined;
-    return { status: run.status, error: run.error, stepOutput: stepCompleted?.output, events };
-  } catch (err: unknown) {
-    return { status: 'failed', error: err instanceof Error ? err.message : String(err), events };
-  }
-}
-
-// ── Test 1: Claude can use relay tools (baseline) ────────────────────────────
-//
-// Claude should be able to post a message to the workflow channel and then
-// self-terminate. This is the baseline — if this fails everything else will.
-
-test('workflow-relay-tools: claude agent posts to channel and exits', { timeout: 240_000 }, async (t) => {
-  if (skipIfMissing(t) || skipIfNotRealCli(t) || skipIfNestedClaude(t)) return;
-  if (skipIfCliMissing(t, 'claude')) return;
-
-  const workdir = createWorkdir();
-  try {
-    const result = await runRealWorkflow(
-      makeRelayToolWorkflow({
-        cli: 'claude',
-        task:
-          'Use the post_message relay tool to post "CLAUDE_RELAY_OK" to the workflow channel. ' +
-          'Then call remove_agent to exit.',
-        verification: { type: 'output_contains', value: 'CLAUDE_RELAY_OK' },
-        stepTimeoutMs: 120_000,
-      }),
-      workdir
-    );
-
-    assert.equal(result.status, 'completed', `Claude relay baseline failed: ${result.error ?? '(no error)'}`);
-  } finally {
-    fs.rmSync(workdir, { recursive: true, force: true });
-  }
-});
-
-// ── Test 2: Codex agent registers and uses relay tools ───────────────────────
-//
-// Core regression test. Before the fix, codex agents got "Not registered"
-// errors on every relay tool call because they never called register_agent() first.
-//
-// The fix has two parts:
-//   1. runner.ts injects a "RELAY SETUP: call register_agent(name=…)" preamble
-//   2. wrap.rs pre-registers sub-agents so they start with a valid token
-//
-// This test exercises part 1 (direct workflow step).
-
-test(
-  'workflow-relay-tools: codex agent registers and posts to channel (regression for Not-registered bug)',
-  { timeout: 300_000 },
-  async (t) => {
-    if (skipIfMissing(t) || skipIfNotRealCli(t) || skipIfNestedClaude(t)) return;
-    if (skipIfCliMissing(t, 'codex')) return;
-
-    const workdir = createWorkdir();
-    try {
-      const result = await runRealWorkflow(
-        makeRelayToolWorkflow({
-          cli: 'codex',
-          // The preamble injected by runner.ts tells codex to register first.
-          // The task itself should succeed without manual register instructions
-          // — that's the point of the preamble fix.
-          task:
-            'Post the message "CODEX_RELAY_OK" to the workflow channel using the post_message tool. ' +
-            'Then exit.',
-          verification: { type: 'output_contains', value: 'CODEX_RELAY_OK' },
-          stepTimeoutMs: 180_000,
-        }),
-        workdir
-      );
-
-      assert.equal(
-        result.status,
-        'completed',
-        `Codex relay tool usage failed.\n` +
-          `Status: ${result.status}, Error: ${result.error ?? '(none)'}\n` +
-          `If this fails with "Not registered", the RELAY SETUP preamble is not being injected.`
-      );
-    } finally {
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
-
-// ── Test 3: Non-claude agent relay registration preamble is present ──────────
-//
-// Unit-level check: verify the RELAY SETUP preamble appears in the task
-// that the runner constructs for non-claude interactive agents. We do this
-// by running a workflow with a fake CLI (the harness fake-claude stub) that
-// echoes its input, then checking the step output contains the preamble.
-//
-// This doesn't require RELAY_INTEGRATION_REAL_CLI — it uses the fake CLI.
-
-test(
-  'workflow-relay-tools: RELAY SETUP preamble injected for non-claude CLI',
-  { timeout: 60_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    // Use the fake-CLI harness which echoes FAKE_OUTPUT (default "DONE").
-    // We override FAKE_OUTPUT to echo the task so we can inspect it.
-    const harness = new WorkflowRunnerHarness();
-    await harness.start({ useRelaycast: false });
-
-    const workdir = createWorkdir();
-    try {
-      // Temporarily patch fake CLI to output task content.
-      // The harness fake CLI honours $FAKE_OUTPUT. We set it to a sentinel
-      // that the runner will see as "step output". But we really just want to
-      // verify the preamble is present in the injected task.
-      //
-      // Since the fake CLI ignores its input entirely, we instead verify
-      // indirectly: run a workflow with a verification that would only pass
-      // if the preamble register instruction is in the task. Since the fake
-      // CLI outputs "DONE" regardless, the step always completes. We instead
-      // read the runner source to confirm the method exists (compile-time check).
-      //
-      // The real end-to-end verification is test 2 above. Here we just confirm
-      // the config object gets a non-claude CLI agent defined correctly.
-
-      const config: RelayYamlConfig = {
-        version: '1',
-        name: 'test-preamble-check',
-        swarm: { pattern: 'pipeline' },
-        agents: [{ name: 'worker', cli: 'codex', interactive: true }],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step', agent: 'worker', task: 'Do something', timeoutMs: 30_000 }],
-          },
-        ],
-      };
-
-      // The fake CLI outputs "DONE" for any CLI name, so the step should complete.
-      const result = await harness.runWorkflow(config, undefined, { cwd: workdir });
-      assertRunCompleted(result);
-      assertStepCompleted(result, 'step');
-    } finally {
-      await harness.stop();
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
-
-test(
-  'workflow-relay-tools: interactive subprocess receives merged relay env and proxy overrides',
-  { timeout: 60_000 },
-  async (t) => {
-    if (skipIfMissing(t) || skipIfNestedClaude(t)) return;
-
-    const workdir = createWorkdir();
-    const fakeCliDir = createEnvEchoCliDir('codex');
-    const proxyUrl = `https://proxy.local/${uniqueSuffix()}`;
-    const proxyToken = `proxy-token-${uniqueSuffix()}`;
-    const relayApiKey = `relay-key-${uniqueSuffix()}`;
-
-    try {
-      const result = await runRealWorkflow(
-        {
-          version: '1',
-          name: 'test-relay-env-merge',
-          swarm: { pattern: 'pipeline', timeoutMs: 60_000 },
-          agents: [{ name: 'worker', cli: 'codex', interactive: true, credentials: { proxy: true } } as any],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'relay-check',
-                  agent: 'worker',
-                  task: 'Print the relay and proxy environment.',
-                  timeoutMs: 30_000,
-                  verification: { type: 'output_contains', value: `OPENAI_BASE_URL=${proxyUrl}` },
-                },
-              ],
-            },
-          ],
-        },
-        workdir,
-        {
-          PATH: `${fakeCliDir}${path.delimiter}${process.env.PATH ?? ''}`,
-          AGENT_RELAY_WORKFLOW_DISABLE_RELAYCAST: '1',
-          RELAY_WORKSPACES_JSON: '{}',
-          RELAY_API_KEY: relayApiKey,
-          RELAY_LLM_PROXY: proxyUrl,
-          CREDENTIAL_PROXY_TOKEN: proxyToken,
-        }
-      );
-
-      assert.equal(result.status, 'completed', result.error ?? '(no error)');
-      assert.match(result.stepOutput ?? '', new RegExp(`RELAY_API_KEY=${relayApiKey}`));
-      assert.match(
-        result.stepOutput ?? '',
-        new RegExp(`RELAY_LLM_PROXY=${proxyUrl.replace(/[.*+?^${}()|[\]\\]/g, '\\$&')}`)
-      );
-      assert.match(
-        result.stepOutput ?? '',
-        new RegExp(`RELAY_LLM_PROXY_URL=${proxyUrl.replace(/[.*+?^${}()|[\]\\]/g, '\\$&')}`)
-      );
-      assert.match(result.stepOutput ?? '', new RegExp(`CREDENTIAL_PROXY_TOKEN=${proxyToken}`));
-      assert.match(result.stepOutput ?? '', new RegExp(`RELAY_LLM_PROXY_TOKEN=${proxyToken}`));
-      assert.match(
-        result.stepOutput ?? '',
-        new RegExp(`OPENAI_BASE_URL=${proxyUrl.replace(/[.*+?^${}()|[\]\\]/g, '\\$&')}`)
-      );
-      assert.match(result.stepOutput ?? '', new RegExp(`OPENAI_API_KEY=${proxyToken}`));
-    } finally {
-      fs.rmSync(fakeCliDir, { recursive: true, force: true });
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
-
-// ── Test 4: Mixed workflow — claude lead + codex worker ──────────────────────
-//
-// Exercises the wrap.rs sub-agent pre-registration fix. The claude lead
-// spawns a codex worker via mcp__relaycast__add_agent. The broker's wrap.rs now pre-registers
-// the codex sub-agent and injects the token, so it can use relay tools
-// without hitting "Not registered".
-
-test(
-  'workflow-relay-tools: claude lead spawns codex worker that uses relay tools',
-  { timeout: 360_000 },
-  async (t) => {
-    if (skipIfMissing(t) || skipIfNotRealCli(t) || skipIfNestedClaude(t)) return;
-    if (skipIfCliMissing(t, 'claude')) return;
-    if (skipIfCliMissing(t, 'codex')) return;
-
-    const workdir = createWorkdir();
-    try {
-      const result = await runRealWorkflow(
-        {
-          version: '1',
-          name: 'test-lead-worker-relay',
-          swarm: { pattern: 'pipeline', timeoutMs: 300_000 },
-          agents: [{ name: 'lead', cli: 'claude', interactive: true }],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'orchestrate',
-                  agent: 'lead',
-                  task:
-                    'Spawn a codex worker named "relay-worker" with this task: ' +
-                    '"Post the message WORKER_RELAY_OK to the workflow channel, then exit." ' +
-                    'Wait for the worker to finish, then post "LEAD_CONFIRMED" to the channel and exit.',
-                  timeoutMs: 240_000,
-                  verification: { type: 'output_contains', value: 'LEAD_CONFIRMED' },
-                },
-              ],
-            },
-          ],
-        },
-        workdir
-      );
-
-      assert.equal(
-        result.status,
-        'completed',
-        `Mixed lead+worker relay test failed: ${result.error ?? '(none)'}\n` +
-          `If the codex worker got "Not registered", the wrap.rs pre-registration fix is not working.`
-      );
-    } finally {
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
-
-// ── Test 5: Auto-created workspace key reaches non-claude subprocess ──────────
-//
-// Regression for the original MCP stall: when the workspace key is
-// auto-created (not in RELAY_API_KEY env), the subprocess must still
-// receive it. This test deliberately does NOT set RELAY_API_KEY in env
-// (using a separate runner) and verifies a codex step can authenticate.
-
-test(
-  'workflow-relay-tools: auto-created workspace key propagates to codex subprocess',
-  { timeout: 300_000 },
-  async (t) => {
-    if (skipIfMissing(t) || skipIfNotRealCli(t) || skipIfNestedClaude(t)) return;
-    if (skipIfCliMissing(t, 'codex')) return;
-
-    const workdir = createWorkdir();
-
-    // Use a marker env var that is NOT in process.env to prove relay.env
-    // flows through to the subprocess (regression for the original bug where
-    // execNonInteractive used { ...process.env } instead of getRelayEnv()).
-    const sentinelKey = 'RELAY_WORKFLOW_SENTINEL_TEST';
-    const sentinelVal = `sentinel-${uniqueSuffix()}`;
-    const prevVal = process.env[sentinelKey];
-    delete process.env[sentinelKey];
-
-    try {
-      const apiKey = await ensureApiKey();
-      const runner = new WorkflowRunner({
-        cwd: workdir,
-        relay: {
-          binaryPath: resolveBinaryPath(),
-          // Deliberately put sentinel ONLY in relay.env, not process.env
-          env: { ...process.env, RELAY_API_KEY: apiKey, [sentinelKey]: sentinelVal },
-        },
-      });
-
-      runner.on(() => {});
-
-      const run = await runner.execute(
-        {
-          version: '1',
-          name: 'test-env-propagation',
-          swarm: { pattern: 'pipeline', timeoutMs: 240_000 },
-          agents: [{ name: 'worker', cli: 'codex', interactive: false }],
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'check-env',
-                  agent: 'worker',
-                  task:
-                    `Check the environment variable "${sentinelKey}". ` +
-                    `If set and non-empty, output: SENTINEL_FOUND. Otherwise output: SENTINEL_MISSING.`,
-                  timeoutMs: 120_000,
-                  verification: { type: 'output_contains', value: 'SENTINEL_FOUND' },
-                },
-              ],
-            },
-          ],
-        },
-        'default'
-      );
-
-      assert.equal(
-        run.status,
-        'completed',
-        `Env propagation test failed: ${run.error ?? '(none)'}\n` +
-          `The sentinel env var did not reach the codex subprocess — relay.env is not being passed through.`
-      );
-    } finally {
-      if (prevVal !== undefined) process.env[sentinelKey] = prevVal;
-      fs.rmSync(workdir, { recursive: true, force: true });
-    }
-  }
-);
diff --git a/tests/integration/broker/workflow-runner.test.ts b/tests/integration/broker/workflow-runner.test.ts
deleted file mode 100644
index f462ae51f..000000000
--- a/tests/integration/broker/workflow-runner.test.ts
+++ /dev/null
@@ -1,367 +0,0 @@
-/**
- * WorkflowRunner integration tests — five canonical scenarios exercised through
- * the WorkflowRunnerHarness + fake-CLI shim.
- *
- * 1. Single step  — minimal workflow completes
- * 2. Serial DAG   — two steps execute in dependency order
- * 3. Parallel fan — two independent steps run concurrently into one fan-in step
- * 4. Retry        — deterministic step retries on transient failure then succeeds
- * 5. Mixed        — deterministic (command) step and agent step in one workflow
- */
-import assert from 'node:assert/strict';
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertRunFailed,
-  assertStepCompleted,
-  assertStepCount,
-  assertStepOrder,
-  assertStepOutput,
-  assertStepRetried,
-  assertStepsParallel,
-  assertWorkflowEventOrder,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-workflow-runner',
-    description: 'WorkflowRunner integration test',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [{ name: 'step-a', agent: 'worker', task: 'Do work' }],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-runner-'));
-}
-
-// ── Test 1: Single step ────────────────────────────────────────────────────
-
-test('workflow-runner: single step completes', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(makeConfig(), undefined, { cwd });
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepOutput(result, 'step-a', 'DONE');
-    assertWorkflowEventOrder(result.events, [
-      'run:started',
-      'step:started',
-      'step:completed',
-      'run:completed',
-    ]);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-runner: failed run transitions to failed status', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-a',
-                agent: 'worker',
-                task: 'Intentional failure',
-                verification: {
-                  type: 'output_contains',
-                  value: 'MUST_NOT_EXIST',
-                },
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunFailed(result, 'MUST_NOT_EXIST');
-    assert.equal(result.run.status, 'failed');
-    assertWorkflowEventOrder(result.events, ['run:started', 'step:started', 'step:failed', 'run:failed']);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-// ── Test 2: Serial DAG ────────────────────────────────────────────────────
-
-test('workflow-runner: serial dag executes steps in dependency order', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'step-a', agent: 'worker', task: 'Step A' },
-              { name: 'step-b', agent: 'worker', task: 'Step B', dependsOn: ['step-a'] },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-a');
-    assertStepCompleted(result, 'step-b');
-    assertStepOrder(result, ['step-a', 'step-b']);
-    assertStepCount(result, 'completed', 2);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-// ── Test 3: Parallel fan ──────────────────────────────────────────────────
-
-test('workflow-runner: parallel fan-out steps converge into fan-in step', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'fan-a', agent: 'worker', task: 'Fan A' },
-              { name: 'fan-b', agent: 'worker', task: 'Fan B' },
-              {
-                name: 'merge',
-                agent: 'worker',
-                task: 'Merge results',
-                dependsOn: ['fan-a', 'fan-b'],
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunCompleted(result);
-    assertStepsParallel(result, ['fan-a', 'fan-b']);
-    assertStepCompleted(result, 'merge');
-
-    // merge must start after both fan steps complete
-    const mergeStart = result.events.findIndex(
-      (event) => event.type === 'step:started' && 'stepName' in event && event.stepName === 'merge'
-    );
-    const fanADone = result.events.findIndex(
-      (event) => event.type === 'step:completed' && 'stepName' in event && event.stepName === 'fan-a'
-    );
-    const fanBDone = result.events.findIndex(
-      (event) => event.type === 'step:completed' && 'stepName' in event && event.stepName === 'fan-b'
-    );
-
-    assert.ok(mergeStart > fanADone, 'merge must start after fan-a completes');
-    assert.ok(mergeStart > fanBDone, 'merge must start after fan-b completes');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-// ── Test 4: Retry on transient failure ────────────────────────────────────
-
-test('workflow-runner: deterministic step retries on transient failure', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const marker = path.join(cwd, 'retry-marker.txt');
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-retry',
-                type: 'deterministic',
-                command: `if [ ! -f ${marker} ]; then touch ${marker}; exit 1; fi; echo DONE`,
-                retries: 1,
-                verification: { type: 'output_contains', value: 'DONE' },
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-retry');
-    assertStepRetried(result, 'step-retry', 1);
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-// ── Test 5: Deterministic + agent mix ────────────────────────────────────
-
-test(
-  'workflow-runner: mixes deterministic and agent steps in one workflow',
-  { timeout: 120_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start({ useRelaycast: false });
-
-    try {
-      const result = await harness.runWorkflow(
-        makeConfig({
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'prep',
-                  type: 'deterministic',
-                  command: 'echo PREPARED',
-                  verification: { type: 'output_contains', value: 'PREPARED' },
-                },
-                {
-                  name: 'agent-work',
-                  agent: 'worker',
-                  task: 'Do agent work after deterministic prep',
-                  dependsOn: ['prep'],
-                },
-              ],
-            },
-          ],
-        }),
-        undefined,
-        { cwd }
-      );
-
-      assertRunCompleted(result);
-      assertStepCompleted(result, 'prep');
-      assertStepCompleted(result, 'agent-work');
-      assertStepOrder(result, ['prep', 'agent-work']);
-      assertStepOutput(result, 'agent-work', 'DONE');
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-// ── Test 6: Workflow selection ────────────────────────────────────────────
-
-test('workflow-runner: runs only the selected workflow by name', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'workflow-a',
-            steps: [{ name: 'step-a', agent: 'worker', task: 'Workflow A task' }],
-          },
-          {
-            name: 'workflow-b',
-            steps: [{ name: 'step-b', agent: 'worker', task: 'Workflow B task' }],
-          },
-        ],
-      }),
-      undefined,
-      { workflowName: 'workflow-b', cwd }
-    );
-
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-b');
-    assertStepCount(result, 'completed', 1);
-    assertStepCount(result, 'failed', 0);
-    assert.equal(
-      result.events.filter(
-        (event) =>
-          (event.type === 'step:started' ||
-            event.type === 'step:completed' ||
-            event.type === 'step:failed' ||
-            event.type === 'step:skipped') &&
-          'stepName' in event &&
-          event.stepName === 'step-a'
-      ).length,
-      0,
-      'Expected workflow A to be skipped when workflow-b is selected'
-    );
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/integration/broker/workflow-templates.test.ts b/tests/integration/broker/workflow-templates.test.ts
deleted file mode 100644
index 65771705e..000000000
--- a/tests/integration/broker/workflow-templates.test.ts
+++ /dev/null
@@ -1,727 +0,0 @@
-/**
- * Workflow template integration tests.
- *
- * Tests that built-in workflow templates (review-loop, code-review, etc.)
- * work correctly with real CLI agents. Verifies multi-agent coordination,
- * message delivery, and workflow step sequencing.
- *
- * These tests are gated behind RELAY_INTEGRATION_REAL_CLI=1 to avoid
- * running resource-heavy tests in regular CI.
- *
- * Run:
- *   npx tsc -p tests/integration/broker/tsconfig.json
- *   RELAY_INTEGRATION_REAL_CLI=1 node --test tests/integration/broker/dist/workflow-templates.test.js
- *
- * Requires:
- *   RELAY_API_KEY — Relaycast workspace key (auto-provisioned if missing)
- *   RELAY_INTEGRATION_REAL_CLI=1 — opt-in for real CLI tests
- *   AGENT_RELAY_BIN (optional) — path to agent-relay binary
- */
-import assert from 'node:assert/strict';
-import test, { type TestContext } from 'node:test';
-
-import type { BrokerEvent } from '@agent-relay/sdk';
-import { BrokerHarness, checkPrerequisites, uniqueSuffix } from './utils/broker-harness.js';
-import {
-  assertAgentExists,
-  assertNoDroppedDeliveries,
-  assertAgentSpawnedEvent,
-} from './utils/assert-helpers.js';
-import { skipIfNotRealCli, skipIfCliMissing, sleep, firstAvailableCli } from './utils/cli-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-// ── Review-Loop Pattern Tests ────────────────────────────────────────────────
-
-test('workflow: review-loop — spawn implementer and reviewers', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  // Need at least one CLI for this test
-  const cli = firstAvailableCli();
-  if (!cli) {
-    t.skip('No CLI available');
-    return;
-  }
-  if (skipIfCliMissing(t, cli)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    // Spawn review-loop agents
-    const implementerName = `implementer-${suffix}`;
-    const reviewerDiffName = `reviewer-diff-${suffix}`;
-    const reviewerArchName = `reviewer-arch-${suffix}`;
-
-    // Spawn implementer (interactive)
-    await harness.spawnAgent(implementerName, cli, ['review-loop']);
-    await sleep(10_000);
-    await assertAgentExists(harness, implementerName);
-
-    // Spawn reviewers (can be different CLIs in real scenario)
-    await harness.spawnAgent(reviewerDiffName, cli, ['review-loop']);
-    await harness.spawnAgent(reviewerArchName, cli, ['review-loop']);
-    await sleep(10_000);
-
-    // Verify all agents are alive
-    const agents = await harness.listAgents();
-    assert.ok(
-      agents.some((a) => a.name === implementerName),
-      'implementer should be alive'
-    );
-    assert.ok(
-      agents.some((a) => a.name === reviewerDiffName),
-      'reviewer-diff should be alive'
-    );
-    assert.ok(
-      agents.some((a) => a.name === reviewerArchName),
-      'reviewer-arch should be alive'
-    );
-
-    // Verify spawn events
-    const events = harness.getEvents();
-    assertAgentSpawnedEvent(events, implementerName);
-    assertAgentSpawnedEvent(events, reviewerDiffName);
-    assertAgentSpawnedEvent(events, reviewerArchName);
-
-    // Clean up
-    await harness.releaseAgent(implementerName);
-    await harness.releaseAgent(reviewerDiffName);
-    await harness.releaseAgent(reviewerArchName);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-test('workflow: review-loop — implementer to reviewer message flow', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  const cli = firstAvailableCli();
-  if (!cli) {
-    t.skip('No CLI available');
-    return;
-  }
-  if (skipIfCliMissing(t, cli)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const implementerName = `implementer-${suffix}`;
-    const reviewerName = `reviewer-${suffix}`;
-
-    // Spawn both agents
-    await harness.spawnAgent(implementerName, cli, ['review-loop']);
-    await harness.spawnAgent(reviewerName, cli, ['review-loop']);
-    await sleep(15_000);
-
-    // Send task to implementer
-    const implResult = await harness.sendMessage({
-      to: implementerName,
-      from: 'coordinator',
-      text: 'Implement a simple hello world function. Output: IMPLEMENTATION COMPLETE when done.',
-    });
-    assert.ok(implResult.event_id, 'should get event_id for implementer message');
-
-    // Wait for implementer to process
-    await sleep(20_000);
-
-    // Send review request to reviewer (simulating workflow step)
-    const reviewResult = await harness.sendMessage({
-      to: reviewerName,
-      from: 'coordinator',
-      text: 'Review the implementation for code quality. Output: REVIEW:PASS or REVIEW:ISSUES',
-    });
-    assert.ok(reviewResult.event_id, 'should get event_id for reviewer message');
-
-    // Wait for review
-    await sleep(10_000);
-
-    // Verify delivery pipeline
-    const events = harness.getEvents();
-
-    // Both agents should have received messages
-    const implAck = events.find(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        (e as BrokerEvent & { name: string }).name === implementerName
-    );
-    const reviewAck = events.find(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        (e as BrokerEvent & { name: string }).name === reviewerName
-    );
-
-    assert.ok(implAck, 'implementer should acknowledge message');
-    assert.ok(reviewAck, 'reviewer should acknowledge message');
-
-    // No dropped deliveries
-    assertNoDroppedDeliveries(events);
-
-    // Clean up
-    await harness.releaseAgent(implementerName);
-    await harness.releaseAgent(reviewerName);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-test('workflow: review-loop — reviewer to reviewer communication', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  const cli = firstAvailableCli();
-  if (!cli) {
-    t.skip('No CLI available');
-    return;
-  }
-  if (skipIfCliMissing(t, cli)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const reviewer1Name = `reviewer1-${suffix}`;
-    const reviewer2Name = `reviewer2-${suffix}`;
-
-    // Spawn two reviewers
-    await harness.spawnAgent(reviewer1Name, cli, ['review-loop']);
-    await harness.spawnAgent(reviewer2Name, cli, ['review-loop']);
-    await sleep(15_000);
-
-    // reviewer1 sends message to reviewer2 (collaborative review)
-    const r2rResult = await harness.sendMessage({
-      to: reviewer2Name,
-      from: reviewer1Name,
-      text: 'I found a potential security issue. Do you agree?',
-    });
-    assert.ok(r2rResult.event_id, 'reviewer-to-reviewer message should get event_id');
-
-    // Wait for delivery
-    await sleep(10_000);
-
-    // Verify reviewer2 received the message
-    const events = harness.getEvents();
-    const r2Ack = events.find(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        (e as BrokerEvent & { name: string }).name === reviewer2Name
-    );
-
-    assert.ok(r2Ack, 'reviewer2 should acknowledge message from reviewer1');
-    assertNoDroppedDeliveries(events);
-
-    // Clean up
-    await harness.releaseAgent(reviewer1Name);
-    await harness.releaseAgent(reviewer2Name);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Multi-CLI Workflow Tests ─────────────────────────────────────────────────
-
-test('workflow: multi-cli — claude implementer + codex reviewer', { timeout: 150_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-  if (skipIfCliMissing(t, 'claude')) return;
-  if (skipIfCliMissing(t, 'codex')) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const implementerName = `impl-claude-${suffix}`;
-    const reviewerName = `review-codex-${suffix}`;
-
-    // Spawn Claude as implementer, Codex as reviewer
-    await harness.spawnAgent(implementerName, 'claude', ['workflow']);
-    await harness.spawnAgent(reviewerName, 'codex', ['workflow']);
-    await sleep(15_000);
-
-    // Verify both are alive
-    const agents = await harness.listAgents();
-    assert.ok(
-      agents.some((a) => a.name === implementerName),
-      'claude implementer should be alive'
-    );
-    assert.ok(
-      agents.some((a) => a.name === reviewerName),
-      'codex reviewer should be alive'
-    );
-
-    // Send implementation task to Claude
-    await harness.sendMessage({
-      to: implementerName,
-      from: 'coordinator',
-      text: 'Create a function that adds two numbers. Say DONE when finished.',
-    });
-    await sleep(25_000);
-
-    // Send review task to Codex
-    await harness.sendMessage({
-      to: reviewerName,
-      from: 'coordinator',
-      text: 'Review the addition function for edge cases. Say REVIEW COMPLETE when done.',
-    });
-    await sleep(15_000);
-
-    // Verify both received messages
-    const events = harness.getEvents();
-    const implAck = events.find(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        (e as BrokerEvent & { name: string }).name === implementerName
-    );
-    const reviewAck = events.find(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        (e as BrokerEvent & { name: string }).name === reviewerName
-    );
-
-    assert.ok(implAck, 'claude should acknowledge task');
-    assert.ok(reviewAck, 'codex should acknowledge review');
-    assertNoDroppedDeliveries(events);
-
-    // Clean up
-    await harness.releaseAgent(implementerName);
-    await harness.releaseAgent(reviewerName);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Parallel Agent Spawn Tests ───────────────────────────────────────────────
-
-test('workflow: parallel spawn — 4 agents simultaneously', { timeout: 180_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  const cli = firstAvailableCli();
-  if (!cli) {
-    t.skip('No CLI available');
-    return;
-  }
-  if (skipIfCliMissing(t, cli)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const agentNames = [`agent1-${suffix}`, `agent2-${suffix}`, `agent3-${suffix}`, `agent4-${suffix}`];
-
-    // Spawn all 4 agents in parallel
-    await Promise.all(agentNames.map((name) => harness.spawnAgent(name, cli, ['parallel-test'])));
-
-    // Wait for all to initialize
-    await sleep(20_000);
-
-    // Verify all agents are alive
-    const agents = await harness.listAgents();
-    for (const name of agentNames) {
-      assert.ok(
-        agents.some((a) => a.name === name),
-        `${name} should be alive`
-      );
-    }
-
-    // Verify spawn events for all
-    const events = harness.getEvents();
-    for (const name of agentNames) {
-      assertAgentSpawnedEvent(events, name);
-    }
-
-    // Send message to each agent
-    await Promise.all(
-      agentNames.map((name) =>
-        harness.sendMessage({
-          to: name,
-          from: 'coordinator',
-          text: `Task for ${name}: acknowledge receipt`,
-        })
-      )
-    );
-
-    // Wait for deliveries
-    await sleep(15_000);
-
-    // Verify all received messages
-    const finalEvents = harness.getEvents();
-    const ackCount = finalEvents.filter(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        agentNames.includes((e as BrokerEvent & { name: string }).name)
-    ).length;
-
-    assert.ok(ackCount >= 1, `at least 1 agent should acknowledge, got ${ackCount}`);
-    assertNoDroppedDeliveries(finalEvents);
-
-    // Clean up
-    await Promise.all(agentNames.map((name) => harness.releaseAgent(name)));
-    await sleep(3_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Channel-Based Coordination Tests ─────────────────────────────────────────
-
-test('workflow: channel broadcast — message to all workflow agents', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  const cli = firstAvailableCli();
-  if (!cli) {
-    t.skip('No CLI available');
-    return;
-  }
-  if (skipIfCliMissing(t, cli)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-  const channelName = `workflow-${suffix}`;
-
-  try {
-    const agent1 = `worker1-${suffix}`;
-    const agent2 = `worker2-${suffix}`;
-
-    // Spawn agents on same channel
-    await harness.spawnAgent(agent1, cli, [channelName]);
-    await harness.spawnAgent(agent2, cli, [channelName]);
-    await sleep(15_000);
-
-    // Broadcast to channel
-    const broadcastResult = await harness.sendMessage({
-      to: `#${channelName}`,
-      from: 'coordinator',
-      text: 'All agents: report your status',
-    });
-    assert.ok(broadcastResult.event_id, 'broadcast should get event_id');
-
-    // Wait for deliveries
-    await sleep(10_000);
-
-    // Verify events
-    const events = harness.getEvents();
-    assertNoDroppedDeliveries(events);
-
-    // Clean up
-    await harness.releaseAgent(agent1);
-    await harness.releaseAgent(agent2);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Sequential Step Execution Tests ──────────────────────────────────────────
-
-test('workflow: sequential steps — implement → review → address', { timeout: 180_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  const cli = firstAvailableCli();
-  if (!cli) {
-    t.skip('No CLI available');
-    return;
-  }
-  if (skipIfCliMissing(t, cli)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    const implementerName = `impl-${suffix}`;
-    const reviewerName = `rev-${suffix}`;
-
-    // Spawn agents
-    await harness.spawnAgent(implementerName, cli, ['sequential']);
-    await harness.spawnAgent(reviewerName, cli, ['sequential']);
-    await sleep(15_000);
-
-    // Step 1: Implementation
-    const step1Result = await harness.sendMessage({
-      to: implementerName,
-      from: 'workflow-engine',
-      text: 'Step 1: Implement a factorial function. Output STEP1_COMPLETE when done.',
-    });
-    assert.ok(step1Result.event_id, 'step 1 message should get event_id');
-    await sleep(20_000);
-
-    // Step 2: Review (depends on step 1)
-    const step2Result = await harness.sendMessage({
-      to: reviewerName,
-      from: 'workflow-engine',
-      text: 'Step 2: Review the factorial implementation. Output STEP2_COMPLETE when done.',
-    });
-    assert.ok(step2Result.event_id, 'step 2 message should get event_id');
-    await sleep(15_000);
-
-    // Step 3: Address feedback (depends on step 2)
-    const step3Result = await harness.sendMessage({
-      to: implementerName,
-      from: 'workflow-engine',
-      text: 'Step 3: Address any review feedback. Output STEP3_COMPLETE when done.',
-    });
-    assert.ok(step3Result.event_id, 'step 3 message should get event_id');
-    await sleep(15_000);
-
-    // Verify all steps were acknowledged
-    const events = harness.getEvents();
-    const implAcks = events.filter(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        (e as BrokerEvent & { name: string }).name === implementerName
-    );
-    const revAcks = events.filter(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        (e as BrokerEvent & { name: string }).name === reviewerName
-    );
-
-    assert.ok(implAcks.length >= 1, 'implementer should have at least 1 ack');
-    assert.ok(revAcks.length >= 1, 'reviewer should have at least 1 ack');
-    assertNoDroppedDeliveries(events);
-
-    // Clean up
-    await harness.releaseAgent(implementerName);
-    await harness.releaseAgent(reviewerName);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Agent Recovery Tests ─────────────────────────────────────────────────────
-
-test('workflow: agent lifecycle — release and re-spawn', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  const cli = firstAvailableCli();
-  if (!cli) {
-    t.skip('No CLI available');
-    return;
-  }
-  if (skipIfCliMissing(t, cli)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-  const agentName = `lifecycle-${suffix}`;
-
-  try {
-    // First spawn
-    await harness.spawnAgent(agentName, cli, ['lifecycle']);
-    await sleep(10_000);
-    await assertAgentExists(harness, agentName);
-
-    // Release
-    await harness.releaseAgent(agentName);
-    await sleep(3_000);
-
-    // Verify agent is gone
-    const agentsAfterRelease = await harness.listAgents();
-    assert.ok(!agentsAfterRelease.some((a) => a.name === agentName), 'agent should be gone after release');
-
-    // Re-spawn with same name
-    await harness.spawnAgent(agentName, cli, ['lifecycle']);
-    await sleep(10_000);
-
-    // Verify agent is back
-    await assertAgentExists(harness, agentName);
-
-    // Verify events show two spawns
-    const events = harness.getEvents();
-    const spawnEvents = events.filter(
-      (e) =>
-        e.kind === 'agent_spawned' && 'name' in e && (e as BrokerEvent & { name: string }).name === agentName
-    );
-    assert.equal(spawnEvents.length, 2, 'should have 2 spawn events');
-
-    // Clean up
-    await harness.releaseAgent(agentName);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Stress Test: Many Agents ─────────────────────────────────────────────────
-
-test('workflow: stress — 6 agents in hub-spoke pattern', { timeout: 300_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  const cli = firstAvailableCli();
-  if (!cli) {
-    t.skip('No CLI available');
-    return;
-  }
-  if (skipIfCliMissing(t, cli)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    // Hub (lead) + 5 spokes (workers)
-    const hubName = `hub-${suffix}`;
-    const spokeNames = [
-      `spoke1-${suffix}`,
-      `spoke2-${suffix}`,
-      `spoke3-${suffix}`,
-      `spoke4-${suffix}`,
-      `spoke5-${suffix}`,
-    ];
-
-    // Spawn hub
-    await harness.spawnAgent(hubName, cli, ['stress-test']);
-    await sleep(10_000);
-
-    // Spawn spokes
-    for (const name of spokeNames) {
-      await harness.spawnAgent(name, cli, ['stress-test']);
-      await sleep(5_000); // Stagger to avoid overwhelming
-    }
-
-    // Wait for all to initialize
-    await sleep(15_000);
-
-    // Verify all agents are alive
-    const agents = await harness.listAgents();
-    assert.ok(
-      agents.some((a) => a.name === hubName),
-      'hub should be alive'
-    );
-    for (const name of spokeNames) {
-      assert.ok(
-        agents.some((a) => a.name === name),
-        `${name} should be alive`
-      );
-    }
-
-    // Hub sends message to each spoke
-    for (const spokeName of spokeNames) {
-      await harness.sendMessage({
-        to: spokeName,
-        from: hubName,
-        text: `Task for ${spokeName}: process your work item`,
-      });
-      await sleep(2_000); // Small delay between sends
-    }
-
-    // Wait for processing
-    await sleep(20_000);
-
-    // Verify deliveries
-    const events = harness.getEvents();
-    const ackCount = events.filter(
-      (e) =>
-        e.kind === 'delivery_ack' &&
-        'name' in e &&
-        spokeNames.includes((e as BrokerEvent & { name: string }).name)
-    ).length;
-
-    assert.ok(ackCount >= 1, `at least 1 spoke should acknowledge, got ${ackCount}`);
-    assertNoDroppedDeliveries(events);
-
-    // Clean up - release all
-    await harness.releaseAgent(hubName);
-    for (const name of spokeNames) {
-      await harness.releaseAgent(name);
-    }
-    await sleep(5_000);
-  } finally {
-    await harness.stop();
-  }
-});
-
-// ── Lightweight Tests (cat process, no real CLI needed) ─────────────────────
-
-test('workflow: cat — lightweight workflow simulation', { timeout: 60_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-  if (skipIfNotRealCli(t)) return;
-
-  const harness = new BrokerHarness();
-  await harness.start();
-  const suffix = uniqueSuffix();
-
-  try {
-    // Spawn "agents" using cat (lightweight, always available)
-    const implName = `cat-impl-${suffix}`;
-    const revName = `cat-rev-${suffix}`;
-
-    await harness.spawnAgent(implName, 'cat', ['cat-workflow']);
-    await harness.spawnAgent(revName, 'cat', ['cat-workflow']);
-    await sleep(5_000);
-
-    // Verify both alive
-    await assertAgentExists(harness, implName);
-    await assertAgentExists(harness, revName);
-
-    // Send workflow messages
-    await harness.sendMessage({
-      to: implName,
-      from: 'coordinator',
-      text: 'implement task',
-    });
-    await harness.sendMessage({
-      to: revName,
-      from: 'coordinator',
-      text: 'review task',
-    });
-
-    await sleep(5_000);
-
-    // Verify deliveries
-    const events = harness.getEvents();
-    const implAck = events.find(
-      (e) =>
-        e.kind === 'delivery_ack' && 'name' in e && (e as BrokerEvent & { name: string }).name === implName
-    );
-    const revAck = events.find(
-      (e) =>
-        e.kind === 'delivery_ack' && 'name' in e && (e as BrokerEvent & { name: string }).name === revName
-    );
-
-    assert.ok(implAck, 'cat-impl should acknowledge');
-    assert.ok(revAck, 'cat-rev should acknowledge');
-    assertNoDroppedDeliveries(events);
-
-    // Clean up
-    await harness.releaseAgent(implName);
-    await harness.releaseAgent(revName);
-    await sleep(2_000);
-  } finally {
-    await harness.stop();
-  }
-});
diff --git a/tests/integration/broker/workflow-verification.test.ts b/tests/integration/broker/workflow-verification.test.ts
deleted file mode 100644
index 84bb9fd78..000000000
--- a/tests/integration/broker/workflow-verification.test.ts
+++ /dev/null
@@ -1,234 +0,0 @@
-/**
- * WorkflowRunner verification check integration tests.
- */
-import fs from 'node:fs';
-import os from 'node:os';
-import path from 'node:path';
-import test, { type TestContext } from 'node:test';
-
-import type { RelayYamlConfig, VerificationCheck } from '@agent-relay/sdk/workflows';
-import { checkPrerequisites } from './utils/broker-harness.js';
-import { WorkflowRunnerHarness } from './utils/workflow-harness.js';
-import {
-  assertRunCompleted,
-  assertRunFailed,
-  assertStepCompleted,
-  assertStepFailed,
-} from './utils/workflow-assert-helpers.js';
-
-function skipIfMissing(t: TestContext): boolean {
-  const reason = checkPrerequisites();
-  if (reason) {
-    t.skip(reason);
-    return true;
-  }
-  return false;
-}
-
-function makeConfig(overrides?: Partial<RelayYamlConfig>): RelayYamlConfig {
-  const base: RelayYamlConfig = {
-    version: '1',
-    name: 'test-workflow-verification',
-    description: 'Integration test',
-    swarm: { pattern: 'dag' },
-    agents: [{ name: 'worker', cli: 'claude' }],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          {
-            name: 'step-verify-output',
-            agent: 'worker',
-            task: 'Do one thing',
-            verification: { type: 'output_contains', value: 'DONE' },
-          },
-        ],
-      },
-    ],
-  };
-
-  return {
-    ...base,
-    ...overrides,
-    agents: overrides?.agents ?? base.agents,
-    workflows: overrides?.workflows ?? base.workflows,
-    swarm: { ...base.swarm, ...(overrides?.swarm ?? {}) },
-  };
-}
-
-function createWorkdir(): string {
-  return fs.mkdtempSync(path.join(os.tmpdir(), 'relay-wf-verification-'));
-}
-
-test('workflow-verification: output_contains passes when text exists', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(makeConfig(), undefined, { cwd });
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-verify-output');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-verification: output_contains fails when text missing', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-verify-output',
-                agent: 'worker',
-                task: 'Return DONE',
-                verification: { type: 'output_contains', value: 'MISSING' },
-              },
-            ],
-          },
-        ],
-      }),
-      undefined,
-      { cwd }
-    );
-
-    assertRunFailed(result, 'does not contain');
-    assertStepFailed(result, 'step-verify-output');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test(
-  'workflow-verification: exit_code check is accepted for interactive agents',
-  { timeout: 120_000 },
-  async (t) => {
-    if (skipIfMissing(t)) return;
-
-    const cwd = createWorkdir();
-    const harness = new WorkflowRunnerHarness();
-    await harness.start({ useRelaycast: false });
-
-    try {
-      const check: VerificationCheck = { type: 'exit_code', value: '0' };
-      const result = await harness.runWorkflow(
-        makeConfig({
-          workflows: [
-            {
-              name: 'default',
-              steps: [
-                {
-                  name: 'step-verify-exit',
-                  agent: 'worker',
-                  task: 'Return DONE',
-                  verification: check,
-                },
-              ],
-            },
-          ],
-        }),
-        undefined,
-        { cwd }
-      );
-
-      assertRunCompleted(result);
-      assertStepCompleted(result, 'step-verify-exit');
-    } finally {
-      await harness.stop();
-      fs.rmSync(cwd, { force: true, recursive: true });
-    }
-  }
-);
-
-test('workflow-verification: file_exists passes when file is produced', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const marker = 'verify-marker.txt';
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      {
-        ...makeConfig(),
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-make-file',
-                type: 'deterministic',
-                command: `printf "ok" > ${marker}`,
-              },
-              {
-                name: 'step-file',
-                agent: 'worker',
-                task: 'Validate file exists',
-                dependsOn: ['step-make-file'],
-                verification: { type: 'file_exists', value: marker },
-              },
-            ],
-          },
-        ],
-      },
-      undefined,
-      { cwd }
-    );
-    assertRunCompleted(result);
-    assertStepCompleted(result, 'step-file');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
-
-test('workflow-verification: file_exists fails when file is missing', { timeout: 120_000 }, async (t) => {
-  if (skipIfMissing(t)) return;
-
-  const cwd = createWorkdir();
-  const harness = new WorkflowRunnerHarness();
-  await harness.start({ useRelaycast: false });
-
-  try {
-    const result = await harness.runWorkflow(
-      {
-        ...makeConfig(),
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              {
-                name: 'step-file',
-                agent: 'worker',
-                task: 'Expect missing file',
-                verification: { type: 'file_exists', value: 'missing-marker.txt' },
-              },
-            ],
-          },
-        ],
-      },
-      undefined,
-      { cwd }
-    );
-    assertRunFailed(result, 'does not exist');
-    assertStepFailed(result, 'step-file');
-  } finally {
-    await harness.stop();
-    fs.rmSync(cwd, { force: true, recursive: true });
-  }
-});
diff --git a/tests/workflows/README.md b/tests/workflows/README.md
deleted file mode 100644
index 4e9e7436a..000000000
--- a/tests/workflows/README.md
+++ /dev/null
@@ -1,69 +0,0 @@
-# Workflow Durability Patterns
-
-Test workflows that encode the key rules for writing workflows that don't time out or fail silently.
-
-## Workflows
-
-| File                                       | Tests                                                               |
-| ------------------------------------------ | ------------------------------------------------------------------- |
-| `test-deterministic-pipeline.yaml`         | Pure shell steps, `captureOutput`, `{{steps.X.output}}` chaining    |
-| `test-non-interactive-bounded.yaml`        | Non-interactive agents with content injected by deterministic steps |
-| `test-lead-worker-pattern.yaml`            | Interactive lead + relay-connected workers for channel coordination |
-| `test-step-sizing.yaml`                    | One step = one deliverable; chaining vs discovery                   |
-| `test-codex-simple.yaml`                   | Minimal Codex single-step agent workflow smoke test                 |
-| `test-codex-sequential.yaml`               | Codex pipeline with step output chaining                            |
-| `test-codex-parallel.yaml`                 | Codex DAG / fan-out smoke test                                      |
-| `test-codex-failure.yaml`                  | Codex verification failure should fail the workflow                 |
-| `test-gemini-simple.yaml`                  | Minimal Gemini single-step agent workflow smoke test                |
-| `test-gemini-sequential.yaml`              | Gemini pipeline with step output chaining                           |
-| `test-gemini-parallel.yaml`                | Gemini DAG / fan-out smoke test                                     |
-| `test-gemini-failure.yaml`                 | Gemini verification failure should fail the workflow                |
-| `validation-lead-worker-happy-strict.yaml` | Real happy-path lead/worker relay coordination validation           |
-| `validation-owner-retry-strict.yaml`       | Real retry-semantics validation for explicit `INCOMPLETE_RETRY`     |
-
-## Core Rules
-
-### 1. Non-interactive agents must never discover information via tools
-
-**Wrong:** Ask a `worker` agent to "read `src/foo.ts` and summarize it"  
-**Right:** Deterministic step runs `cat src/foo.ts`, captures output, injects via `{{steps.read.output}}`
-
-Non-interactive (`claude -p`) agents can use tools but it's slow, unreliable, and often times out on large files. Deterministic steps are instant.
-
-### 2. One step = one deliverable
-
-**Wrong:** "Read the codebase, design a spec, write it to disk, and validate the build"  
-**Right:** Four separate steps, each with a single clear output and `output_contains` verification
-
-### 3. Interactive leads coordinate; bounded workers stay non-interactive unless they must relay
-
-- **Lead** (`preset: lead`): reasoning, coordination, relay messaging, spawning workers
-- **Worker** (`preset: worker`): takes a small well-defined task, produces structured stdout
-- **Relay-coordinated worker**: keep it interactive and give it a channel when it must send `WORKER_DONE` or other relay messages
-
-### 4. Always set `verification.output_contains`
-
-Without verification, a step that produces empty output looks like success. Every agent step needs a sentinel value.
-
-### 5. Timeout budgets
-
-- Deterministic steps: seconds
-- Non-interactive agents with injected content: 2–5 min
-- Interactive lead agents: 10–20 min (they read channels, wait for workers)
-- Full workflow: sum of critical path + 20% buffer
-
-### 6. Never create a lead↔worker DAG deadlock
-
-**Wrong:** `work-a` and `work-b` depend on `coordinate` (lead), but `coordinate` waits for DONE signals from `work-a` and `work-b`. Neither can proceed.
-
-**Right:** Workers and lead all depend on `context` (start in parallel). A `merge` step depends on all three. Lead watches the channel for worker signals — it doesn't block the workers from starting.
-
-```
-context → work-a ─┐
-context → work-b ─┼→ merge
-context → lead  ──┘
-```
-
-### 7. Never ask an agent to read large files via tools
-
-`packages/sdk/src/workflows/runner.ts` is ~3200 lines. Asking `claude -p` to read it via the Read tool + reason about it = 20+ min timeout. Extract only the relevant lines in a deterministic step first.
diff --git a/tests/workflows/codex-exit/relay.codex-exit-v1-prompt.yaml b/tests/workflows/codex-exit/relay.codex-exit-v1-prompt.yaml
deleted file mode 100644
index 08b50f415..000000000
--- a/tests/workflows/codex-exit/relay.codex-exit-v1-prompt.yaml
+++ /dev/null
@@ -1,64 +0,0 @@
-version: '1.0'
-name: codex-exit-v1-prompt
-description: >
-  EXIT EXPERIMENT #1: Pure explicit prompt.
-  Tests whether codex reliably outputs `/exit` on its own line when the task
-  prompt gives extremely explicit, unambiguous termination instructions.
-  No lead agent — codex must self-terminate purely from prompt instructions.
-
-swarm:
-  pattern: pipeline
-  maxConcurrency: 1
-  timeoutMs: 300000 # 5 min — short test
-  channel: codex-exit-v1
-  idleNudge:
-    nudgeAfterMs: 60000 # 1 min — fast feedback on whether nudges help
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: codex-worker
-    cli: codex
-    channels: [codex-exit-v1]
-    role: 'Completes a trivial task then self-terminates by outputting /exit.'
-
-workflows:
-  - name: test-v1-explicit-prompt
-    description: >
-      Single codex agent. Task is trivial (output a string).
-      Exit mechanism: explicit multi-line prompt instruction telling codex
-      to output /exit alone on its own line immediately after finishing.
-    steps:
-      - name: do-task
-        type: agent
-        agent: codex-worker
-        task: |
-          Your task has TWO parts. Complete them in order.
-
-          PART 1 — THE TASK:
-          Output the following line to your terminal:
-            TASK_COMPLETE
-
-          PART 2 — MANDATORY TERMINATION:
-          Immediately after completing Part 1, you MUST terminate this session.
-          To terminate, output the following EXACTLY — four characters, alone on
-          their own line, with NO text before it and NO text after it:
-
-          /exit
-
-          Rules:
-          - The /exit line must be the LAST thing you output
-          - Do NOT output any explanation, summary, or closing remark after /exit
-          - Do NOT wait for further input after /exit
-          - The session MUST end with the /exit line
-
-          Example of correct output:
-          ---
-          TASK_COMPLETE
-          /exit
-          ---
-
-          Begin now. Output TASK_COMPLETE, then /exit on its own line.
-        verification:
-          type: output_contains
-          value: TASK_COMPLETE
diff --git a/tests/workflows/codex-exit/relay.codex-exit-v2-lead-relay.yaml b/tests/workflows/codex-exit/relay.codex-exit-v2-lead-relay.yaml
deleted file mode 100644
index d1be6d3ba..000000000
--- a/tests/workflows/codex-exit/relay.codex-exit-v2-lead-relay.yaml
+++ /dev/null
@@ -1,95 +0,0 @@
-version: '1.0'
-name: codex-exit-v2-lead-relay
-description: >
-  EXIT EXPERIMENT #2: Claude lead sends relay DM to trigger /exit.
-  Tests whether codex reliably outputs `/exit` when a lead agent sends a
-  direct relay message instructing it to terminate after signaling completion.
-  Both agents start simultaneously. Codex posts TASK_DONE to channel.
-  Lead sees TASK_DONE, DMs codex: "output /exit now". Codex checks inbox
-  and follows the DM instruction.
-
-swarm:
-  pattern: dag
-  maxConcurrency: 2
-  timeoutMs: 300000 # 5 min
-  channel: codex-exit-v2
-  idleNudge:
-    nudgeAfterMs: 90000 # 1.5 min — give time for relay round-trip
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: exit-lead
-    cli: claude
-    channels: [codex-exit-v2]
-    role: >
-      Monitors #codex-exit-v2. When codex-worker posts TASK_DONE, sends a relay DM
-      telling codex-worker to output /exit. Then waits for step to complete.
-    constraints:
-      model: sonnet
-
-  - name: codex-worker
-    cli: codex
-    channels: [codex-exit-v2]
-    role: >
-      Completes a trivial task, signals done on channel, then checks relay inbox
-      and follows the exit instruction from exit-lead.
-
-workflows:
-  - name: test-v2-lead-relay
-    description: >
-      Parallel: exit-lead monitors channel, codex-worker does task.
-      Codex posts completion signal → lead DMs exit instruction → codex /exits.
-    steps:
-      # Both steps start simultaneously (no dependsOn)
-
-      - name: lead-monitor
-        type: agent
-        agent: exit-lead
-        task: |
-          Your role: monitor #codex-exit-v2 and trigger codex-worker to exit
-          when it signals completion.
-
-          STEP 1 — Wait for codex-worker to post "TASK_DONE" to #codex-exit-v2.
-          Poll the channel every 5 seconds using mcp__relaycast__check_inbox or get channel messages.
-
-          STEP 2 — When you see "TASK_DONE" from codex-worker, immediately send
-          a direct message to codex-worker with this exact text:
-            "RELAY_EXIT_COMMAND: Your task is complete. Output /exit now to terminate."
-
-          STEP 3 — Wait for codex-worker's step to show as complete (it will /exit).
-
-          STEP 4 — Output: LEAD_DONE
-
-          Note: Do NOT message codex-worker until you see TASK_DONE on the channel.
-        verification:
-          type: output_contains
-          value: LEAD_DONE
-
-      - name: codex-task
-        type: agent
-        agent: codex-worker
-        task: |
-          Your task has THREE parts. Complete them in order.
-
-          PART 1 — THE TASK:
-          Output the following to your terminal:
-            TASK_RUNNING
-
-          PART 2 — SIGNAL COMPLETION:
-          Post "TASK_DONE" to #codex-exit-v2 channel using mcp__relaycast__post_message.
-          Command: mcp__relaycast__post_message(channel: "codex-exit-v2", text: "TASK_DONE")
-
-          PART 3 — WAIT FOR EXIT INSTRUCTION:
-          After posting TASK_DONE, check your relay inbox repeatedly (every 3-5 seconds).
-          Wait for a direct message containing "RELAY_EXIT_COMMAND".
-          When you receive it, immediately output the following on its own line:
-
-          /exit
-
-          The /exit must be the LAST thing you output. No text after it.
-
-          Begin now: output TASK_RUNNING, post TASK_DONE to channel, then wait for DM.
-        verification:
-          type: output_contains
-          value: TASK_RUNNING
diff --git a/tests/workflows/codex-exit/relay.codex-exit-v3-file-sentinel.yaml b/tests/workflows/codex-exit/relay.codex-exit-v3-file-sentinel.yaml
deleted file mode 100644
index 4f8b3af2b..000000000
--- a/tests/workflows/codex-exit/relay.codex-exit-v3-file-sentinel.yaml
+++ /dev/null
@@ -1,82 +0,0 @@
-version: '1.0'
-name: codex-exit-v3-file-sentinel
-description: >
-  EXIT EXPERIMENT #3: File sentinel + /exit combo.
-  Tests whether writing a completion file before /exit is more reliable than
-  /exit alone. Also confirms the file was actually written via a deterministic
-  verification step. Belt-and-suspenders: if codex writes the file but /exit
-  fails, the deterministic verify step still shows the file exists.
-
-swarm:
-  pattern: pipeline
-  maxConcurrency: 1
-  timeoutMs: 300000 # 5 min
-  channel: codex-exit-v3
-  idleNudge:
-    nudgeAfterMs: 60000
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: codex-worker
-    cli: codex
-    channels: [codex-exit-v3]
-    role: >
-      Writes a sentinel file to /tmp/codex-exit-test/sentinel.txt,
-      outputs FILE_WRITTEN, then immediately outputs /exit.
-
-workflows:
-  - name: test-v3-file-sentinel
-    description: >
-      Codex writes a file to prove it completed work, then /exits.
-      A deterministic step reads the file to confirm it was written.
-      If codex exits cleanly, both steps pass. If codex hangs after file write,
-      we learn /exit failed even with prior file evidence.
-    preflight:
-      - command: mkdir -p /tmp/codex-exit-test && rm -f /tmp/codex-exit-test/sentinel.txt
-        description: 'Clean slate — remove any prior sentinel file'
-
-    steps:
-      - name: write-and-exit
-        type: agent
-        agent: codex-worker
-        task: |
-          Your task has THREE parts. Complete them in strict order.
-
-          PART 1 — CREATE THE DIRECTORY:
-          Run this shell command (use your bash/terminal tool):
-            mkdir -p /tmp/codex-exit-test
-
-          PART 2 — WRITE THE SENTINEL FILE:
-          Write the following text to /tmp/codex-exit-test/sentinel.txt:
-            SENTINEL_WRITTEN
-
-          Use any method available to you (bash echo, file write tool, etc).
-          Then output to your terminal:
-            FILE_WRITTEN
-
-          PART 3 — TERMINATE IMMEDIATELY:
-          Output the following EXACTLY on its own line with nothing else:
-
-          /exit
-
-          The sequence of your terminal output should be:
-            FILE_WRITTEN
-            /exit
-
-          Do NOT output anything after /exit.
-          Do NOT wait for input after /exit.
-          The session ends when you output /exit.
-        verification:
-          type: output_contains
-          value: FILE_WRITTEN
-
-      - name: verify-sentinel
-        type: deterministic
-        dependsOn: [write-and-exit]
-        command: >
-          cat /tmp/codex-exit-test/sentinel.txt
-          && echo "VERIFY_PASSED"
-          || echo "VERIFY_FAILED: sentinel file not found"
-        captureOutput: true
-        failOnError: false
diff --git a/tests/workflows/codex-exit/relay.codex-exit-v4-noninteractive.yaml b/tests/workflows/codex-exit/relay.codex-exit-v4-noninteractive.yaml
deleted file mode 100644
index c8cec8143..000000000
--- a/tests/workflows/codex-exit/relay.codex-exit-v4-noninteractive.yaml
+++ /dev/null
@@ -1,53 +0,0 @@
-version: '1.0'
-name: codex-exit-v4-noninteractive
-description: >
-  EXIT EXPERIMENT #4: Non-interactive control case (interactive: false).
-  Tests codex in one-shot subprocess mode via `codex exec`.
-  No PTY, no relay messaging, no /exit dependency.
-  The process exits naturally when the command completes.
-  This should ALWAYS work and serves as the reference implementation
-  for any codex worker that does not need real-time relay communication.
-
-swarm:
-  pattern: pipeline
-  maxConcurrency: 1
-  timeoutMs: 300000 # 5 min
-  channel: codex-exit-v4
-  # No idleNudge — non-interactive agents don't need nudging
-
-agents:
-  - name: codex-worker
-    cli: codex
-    interactive: false # KEY: one-shot subprocess mode
-    channels: [codex-exit-v4]
-    role: >
-      Non-interactive codex worker. Receives task via CLI argument, runs to
-      completion, exits naturally. No /exit required. Stdout is captured output.
-
-workflows:
-  - name: test-v4-noninteractive
-    description: >
-      Control case: codex with interactive: false.
-      Uses `codex exec <task>` under the hood — one-shot, no PTY.
-      If this fails, something is wrong with the non-interactive execution path.
-      If this succeeds when V1/V2/V3 fail, it proves non-interactive is the fix.
-    steps:
-      - name: do-task
-        type: agent
-        agent: codex-worker
-        task: |
-          Output these three lines in order and nothing else:
-
-          NONINTERACTIVE_START
-          Hello from non-interactive codex
-          NONINTERACTIVE_COMPLETE
-        verification:
-          type: output_contains
-          value: NONINTERACTIVE_COMPLETE
-
-      - name: verify-output
-        type: deterministic
-        dependsOn: [do-task]
-        command: echo "Step completed successfully — codex exited naturally"
-        captureOutput: true
-        failOnError: false
diff --git a/tests/workflows/codex-exit/relay.codex-exit-v5-self-release.yaml b/tests/workflows/codex-exit/relay.codex-exit-v5-self-release.yaml
deleted file mode 100644
index 8d3647d0b..000000000
--- a/tests/workflows/codex-exit/relay.codex-exit-v5-self-release.yaml
+++ /dev/null
@@ -1,70 +0,0 @@
-version: '1.0'
-name: codex-exit-v5-self-release
-description: >
-  EXIT EXPERIMENT #5: Codex self-releases via relay MCP tools.
-  Tests whether codex can terminate itself by calling remove_agent() on its
-  own agent name, which tells the broker to release the PTY process.
-  Secondary fallback: if remove_agent fails, output /exit.
-  This tests the "agent asks the broker to release me" mechanism.
-
-swarm:
-  pattern: pipeline
-  maxConcurrency: 1
-  timeoutMs: 300000 # 5 min
-  channel: codex-exit-v5
-  idleNudge:
-    nudgeAfterMs: 90000 # give extra time for relay round-trip to broker
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: codex-worker
-    cli: codex
-    channels: [codex-exit-v5]
-    role: >
-      Completes a trivial task, finds its own relay agent name via mcp__relaycast__list_agents(),
-      then calls remove_agent() on itself to terminate the session.
-
-workflows:
-  - name: test-v5-self-release
-    description: >
-      Codex uses the relay MCP tools to self-terminate:
-        1. Do trivial task
-        2. Call mcp__relaycast__list_agents() to find own registered name
-        3. Call mcp__relaycast__remove_agent(name: "<own-name>") to ask broker to release self
-      Fallback: if remove_agent doesn't work, output /exit.
-    steps:
-      - name: do-and-self-release
-        type: agent
-        agent: codex-worker
-        task: |
-          Your task has FOUR parts. Complete them in order.
-
-          PART 1 — THE TASK:
-          Output the following to your terminal:
-            SELF_RELEASE_TEST
-
-          PART 2 — GET YOUR OWN AGENT NAME:
-          Run this shell command to get your registered agent name:
-            echo $RELAY_AGENT_NAME
-
-          Output the result:
-            FOUND_NAME: <value of $RELAY_AGENT_NAME>
-
-          PART 3 — SELF-RELEASE:
-          Call the remove_agent MCP tool using the name from Part 2.
-          This is the ONLY termination method for this task — do not output /exit.
-
-          Tool call:
-            remove_agent(name: "<value from $RELAY_AGENT_NAME>", reason: "task completed")
-
-          After calling remove_agent, output:
-            REMOVE_AGENT_CALLED
-
-          Then stop. The broker will terminate your session via the tool call.
-
-          Begin now: output SELF_RELEASE_TEST, run `echo $RELAY_AGENT_NAME`,
-          call remove_agent, output REMOVE_AGENT_CALLED.
-        verification:
-          type: output_contains
-          value: REMOVE_AGENT_CALLED
diff --git a/tests/workflows/codex-lead/relay.codex-lead-v1-basic-coord.yaml b/tests/workflows/codex-lead/relay.codex-lead-v1-basic-coord.yaml
deleted file mode 100644
index f463f91b9..000000000
--- a/tests/workflows/codex-lead/relay.codex-lead-v1-basic-coord.yaml
+++ /dev/null
@@ -1,86 +0,0 @@
-version: '1.0'
-name: codex-lead-v1-basic-coord
-description: >
-  CODEX LEAD EXPERIMENT #1: Basic channel coordination.
-  Tests whether a codex lead can post an assignment to a channel,
-  a claude worker reads it, completes the task, and signals back.
-  Verifies the fundamental lead→channel→worker→channel→lead loop works
-  when the lead is codex (not claude).
-
-swarm:
-  pattern: dag
-  maxConcurrency: 2
-  timeoutMs: 300000 # 5 min
-  channel: codex-lead-v1
-  idleNudge:
-    nudgeAfterMs: 90000
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: codex-lead
-    cli: codex
-    channels: [codex-lead-v1]
-    role: >
-      Lead agent. Posts an assignment to #codex-lead-v1, waits for the worker
-      to signal completion, then confirms and self-terminates.
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: claude-worker
-    cli: claude
-    channels: [codex-lead-v1]
-    role: >
-      Worker agent. Reads the assignment from #codex-lead-v1, completes
-      the task, posts completion signal back to the channel.
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: test-v1-basic-coord
-    description: >
-      Both agents start simultaneously. Codex lead posts task to channel.
-      Claude worker reads it, does the task, posts WORKER_DONE.
-      Codex lead sees WORKER_DONE and outputs LEAD_DONE then terminates.
-    steps:
-      - name: lead
-        type: agent
-        agent: codex-lead
-        task: |
-          You are the lead. Post an assignment to #codex-lead-v1, then wait
-          for the worker to complete it.
-
-          STEP 1 — Post this assignment to #codex-lead-v1:
-            "ASSIGNMENT: Write the string 'HELLO_FROM_WORKER' to your terminal output.
-             Then post WORKER_DONE to #codex-lead-v1."
-
-          STEP 2 — Poll #codex-lead-v1 every 5 seconds until you see "WORKER_DONE".
-
-          STEP 3 — When you see WORKER_DONE, output:
-            LEAD_DONE
-
-          Then terminate using remove_agent with $RELAY_AGENT_NAME.
-        verification:
-          type: output_contains
-          value: LEAD_DONE
-
-      - name: worker
-        type: agent
-        agent: claude-worker
-        task: |
-          You are the worker. Wait for an assignment from the lead on #codex-lead-v1.
-
-          STEP 1 — Poll #codex-lead-v1 until you see a message containing "ASSIGNMENT:".
-
-          STEP 2 — Complete the assignment: output the following to your terminal:
-            HELLO_FROM_WORKER
-
-          STEP 3 — Post "WORKER_DONE" to #codex-lead-v1.
-
-          STEP 4 — Output:
-            WORKER_COMPLETE
-
-          Then /exit.
-        verification:
-          type: output_contains
-          value: WORKER_COMPLETE
diff --git a/tests/workflows/codex-lead/relay.codex-lead-v2-step-chaining.yaml b/tests/workflows/codex-lead/relay.codex-lead-v2-step-chaining.yaml
deleted file mode 100644
index fadb95ed7..000000000
--- a/tests/workflows/codex-lead/relay.codex-lead-v2-step-chaining.yaml
+++ /dev/null
@@ -1,84 +0,0 @@
-version: '1.0'
-name: codex-lead-v2-step-chaining
-description: >
-  CODEX LEAD EXPERIMENT #2: Step output chaining.
-  Tests whether a codex lead can consume {{steps.worker.output}} from a
-  non-interactive claude worker and act on it. The lead runs after the worker,
-  reads the chained output, validates it, and produces its own output.
-  This is the pattern for: codex lead reviews claude worker deliverables.
-
-swarm:
-  pattern: pipeline
-  maxConcurrency: 1
-  timeoutMs: 300000 # 5 min
-  channel: codex-lead-v2
-  idleNudge:
-    nudgeAfterMs: 90000
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: claude-worker
-    cli: claude
-    # interactive PTY — runner captures PTY output as step output for chaining
-    channels: [codex-lead-v2]
-    role: >
-      Non-interactive worker. Produces a structured deliverable to stdout
-      that the codex lead will review via step output chaining.
-    constraints:
-      model: sonnet
-
-  - name: codex-lead
-    cli: codex
-    interactive: false # Non-interactive: receives {{steps.worker.output}} at spawn time, no relay needed
-    channels: [codex-lead-v2]
-    role: >
-      Lead that reviews the claude worker's output via {{steps.worker.output}}
-      and produces a verdict.
-    constraints:
-      model: gpt-5.3-codex
-
-workflows:
-  - name: test-v2-step-chaining
-    description: >
-      Sequential: claude worker runs first (non-interactive), produces output.
-      Codex lead runs second, receives worker output via step chaining,
-      validates it, and outputs a verdict.
-    steps:
-      - name: worker
-        type: agent
-        agent: claude-worker
-        task: |
-          Output the following structured report, then /exit:
-
-          WORKER_REPORT_START
-          item_1: alpha
-          item_2: beta
-          item_3: gamma
-          checksum: 42
-          WORKER_REPORT_END
-          /exit
-
-      - name: lead-review
-        type: agent
-        agent: codex-lead
-        dependsOn: [worker]
-        task: |
-          The claude worker produced this output:
-
-          {{steps.worker.output}}
-
-          Review the output above and verify:
-          1. It contains WORKER_REPORT_START and WORKER_REPORT_END
-          2. It has exactly 3 items (item_1, item_2, item_3)
-          3. The checksum value is 42
-
-          Output your verdict:
-            REVIEW_RESULT: PASS  (if all checks pass)
-            REVIEW_RESULT: FAIL  (if any check fails, with reason)
-
-          Then output:
-            LEAD_REVIEW_DONE
-        verification:
-          type: output_contains
-          value: LEAD_REVIEW_DONE
diff --git a/tests/workflows/codex-lead/relay.codex-lead-v3-multi-worker.yaml b/tests/workflows/codex-lead/relay.codex-lead-v3-multi-worker.yaml
deleted file mode 100644
index 461d4bd39..000000000
--- a/tests/workflows/codex-lead/relay.codex-lead-v3-multi-worker.yaml
+++ /dev/null
@@ -1,116 +0,0 @@
-version: '1.0'
-name: codex-lead-v3-multi-worker
-description: >
-  CODEX LEAD EXPERIMENT #3: Codex lead coordinates multiple claude workers.
-  Tests the full team pattern: codex lead posts separate assignments to two
-  claude workers via channel, both complete independently, lead collects both
-  DONE signals and outputs a summary. Verifies codex can manage parallelism.
-
-swarm:
-  pattern: dag
-  maxConcurrency: 3
-  timeoutMs: 300000 # 5 min
-  channel: codex-lead-v3
-  idleNudge:
-    nudgeAfterMs: 90000
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: codex-lead
-    cli: codex
-    channels: [codex-lead-v3]
-    role: >
-      Lead that coordinates two claude workers via #codex-lead-v3.
-      Posts individual assignments, collects both completion signals,
-      then outputs a summary and self-terminates.
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: claude-worker-a
-    cli: claude
-    channels: [codex-lead-v3]
-    role: 'Worker A. Completes its assigned task and signals WORKER_A_DONE.'
-    constraints:
-      model: sonnet
-
-  - name: claude-worker-b
-    cli: claude
-    channels: [codex-lead-v3]
-    role: 'Worker B. Completes its assigned task and signals WORKER_B_DONE.'
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: test-v3-multi-worker
-    description: >
-      All three start simultaneously. Codex lead posts assignments for A and B.
-      Each worker reads its assignment, completes it, posts its DONE signal.
-      Lead waits for both WORKER_A_DONE and WORKER_B_DONE, then outputs summary.
-    steps:
-      - name: lead
-        type: agent
-        agent: codex-lead
-        task: |
-          You are the lead coordinating two workers on #codex-lead-v3.
-
-          STEP 1 — Post both assignments to #codex-lead-v3:
-
-          First message:
-            "ASSIGNMENT_A: claude-worker-a, output 'RESULT_A: squares' then post WORKER_A_DONE to #codex-lead-v3."
-
-          Second message:
-            "ASSIGNMENT_B: claude-worker-b, output 'RESULT_B: circles' then post WORKER_B_DONE to #codex-lead-v3."
-
-          STEP 2 — Poll #codex-lead-v3 until you see BOTH:
-            - A message containing "WORKER_A_DONE"
-            - A message containing "WORKER_B_DONE"
-
-          STEP 3 — Once both are done, output:
-            ALL_WORKERS_DONE
-            SUMMARY: worker-a completed, worker-b completed
-
-          Then terminate using remove_agent with $RELAY_AGENT_NAME.
-        verification:
-          type: output_contains
-          value: ALL_WORKERS_DONE
-
-      - name: worker-a
-        type: agent
-        agent: claude-worker-a
-        task: |
-          You are worker-a. Watch #codex-lead-v3 for your assignment.
-
-          STEP 1 — Poll #codex-lead-v3 until you see a message containing "ASSIGNMENT_A:".
-
-          STEP 2 — Complete the assignment: output to your terminal:
-            RESULT_A: squares
-
-          STEP 3 — Post "WORKER_A_DONE" to #codex-lead-v3.
-
-          STEP 4 — Output: WORKER_A_COMPLETE
-
-          Then /exit.
-        verification:
-          type: output_contains
-          value: WORKER_A_COMPLETE
-
-      - name: worker-b
-        type: agent
-        agent: claude-worker-b
-        task: |
-          You are worker-b. Watch #codex-lead-v3 for your assignment.
-
-          STEP 1 — Poll #codex-lead-v3 until you see a message containing "ASSIGNMENT_B:".
-
-          STEP 2 — Complete the assignment: output to your terminal:
-            RESULT_B: circles
-
-          STEP 3 — Post "WORKER_B_DONE" to #codex-lead-v3.
-
-          STEP 4 — Output: WORKER_B_COMPLETE
-
-          Then /exit.
-        verification:
-          type: output_contains
-          value: WORKER_B_COMPLETE
diff --git a/tests/workflows/codex-lead/relay.codex-lead-v4-noninteractive-workers.yaml b/tests/workflows/codex-lead/relay.codex-lead-v4-noninteractive-workers.yaml
deleted file mode 100644
index 3e41a91cd..000000000
--- a/tests/workflows/codex-lead/relay.codex-lead-v4-noninteractive-workers.yaml
+++ /dev/null
@@ -1,110 +0,0 @@
-version: '1.0'
-name: codex-lead-v4-noninteractive-workers
-description: >
-  CODEX LEAD EXPERIMENT #4: Codex lead reviews two parallel claude workers via step chaining.
-  Claude workers run as interactive PTY (runner captures their PTY output as step output).
-  Codex lead runs non-interactive after both workers complete, receives their outputs
-  via {{steps.worker-1.output}} and {{steps.worker-2.output}}, and consolidates them.
-  Note: claude -p (non-interactive) hangs in piped stdio — use interactive PTY for claude workers.
-
-swarm:
-  pattern: dag
-  maxConcurrency: 3
-  timeoutMs: 300000 # 5 min
-  channel: codex-lead-v4
-  idleNudge:
-    nudgeAfterMs: 90000 # only applies to the interactive codex lead
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: claude-worker-1
-    cli: claude
-    # interactive PTY — runner captures PTY output as step output for chaining
-    channels: [codex-lead-v4]
-    role: 'Worker. Produces a structured analysis then /exits.'
-    constraints:
-      model: sonnet
-
-  - name: claude-worker-2
-    cli: claude
-    # interactive PTY — runner captures PTY output as step output for chaining
-    channels: [codex-lead-v4]
-    role: 'Worker. Produces a structured analysis then /exits.'
-    constraints:
-      model: sonnet
-
-  - name: codex-lead
-    cli: codex
-    interactive: false # Non-interactive: receives chained outputs at spawn time
-    channels: [codex-lead-v4]
-    role: >
-      Non-interactive codex lead. Receives both worker outputs via step chaining,
-      compares them, and outputs a consolidated review verdict.
-    constraints:
-      model: gpt-5.3-codex
-
-workflows:
-  - name: test-v4-noninteractive-workers
-    description: >
-      Wave 1: both claude workers run in parallel (non-interactive).
-      Wave 2: codex lead reviews both outputs via step chaining.
-      Tests that codex can reason over multiple chained inputs.
-    steps:
-      - name: worker-1
-        type: agent
-        agent: claude-worker-1
-        task: |
-          Produce this exact output, then /exit:
-
-          ANALYSIS_1_START
-          metric: latency
-          value: 42ms
-          status: ok
-          ANALYSIS_1_END
-          /exit
-
-      - name: worker-2
-        type: agent
-        agent: claude-worker-2
-        task: |
-          Produce this exact output, then /exit:
-
-          ANALYSIS_2_START
-          metric: throughput
-          value: 1200rps
-          status: ok
-          ANALYSIS_2_END
-          /exit
-
-      - name: lead-consolidate
-        type: agent
-        agent: codex-lead
-        dependsOn: [worker-1, worker-2]
-        task: |
-          You received output from two workers. Review both and consolidate.
-
-          Worker 1 output:
-          {{steps.worker-1.output}}
-
-          Worker 2 output:
-          {{steps.worker-2.output}}
-
-          Verify:
-          1. Both outputs have matching START/END tags
-          2. Both report status: ok
-          3. Extract the metric names and values
-
-          Output your consolidated report:
-            CONSOLIDATED_REPORT_START
-            worker_1_metric: <metric from worker 1>
-            worker_1_value: <value from worker 1>
-            worker_2_metric: <metric from worker 2>
-            worker_2_value: <value from worker 2>
-            overall_status: PASS
-            CONSOLIDATED_REPORT_END
-
-          Then output: CONSOLIDATION_DONE
-        verification:
-          type: output_contains
-          value: CONSOLIDATION_DONE
diff --git a/tests/workflows/codex-lead/relay.codex-lead-v5-dm-worker.yaml b/tests/workflows/codex-lead/relay.codex-lead-v5-dm-worker.yaml
deleted file mode 100644
index a166707f4..000000000
--- a/tests/workflows/codex-lead/relay.codex-lead-v5-dm-worker.yaml
+++ /dev/null
@@ -1,89 +0,0 @@
-version: '1.0'
-name: codex-lead-v5-dm-worker
-description: >
-  CODEX LEAD EXPERIMENT #5: Codex lead uses direct messaging (DM) to assign
-  work to a specific claude worker, rather than broadcasting to a channel.
-  Tests whether codex can use mcp__relaycast__send_dm with a worker name (not a channel)
-  and whether claude correctly reads its inbox for the DM assignment.
-  This is the pattern needed when the lead must send different tasks to
-  different workers without cross-contaminating their channels.
-
-swarm:
-  pattern: dag
-  maxConcurrency: 2
-  timeoutMs: 300000 # 5 min
-  channel: codex-lead-v5
-  idleNudge:
-    nudgeAfterMs: 90000
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: codex-lead
-    cli: codex
-    channels: [codex-lead-v5]
-    role: >
-      Lead that sends a DM assignment directly to claude-worker by name,
-      then waits for the completion signal on #codex-lead-v5.
-    constraints:
-      model: gpt-5.3-codex
-
-  - name: claude-worker
-    cli: claude
-    channels: [codex-lead-v5]
-    role: >
-      Worker that checks its relay inbox for a DM from codex-lead,
-      completes the assigned task, and posts completion to the channel.
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: test-v5-dm-worker
-    description: >
-      Both start simultaneously. Codex lead looks up the worker's registered
-      name, sends a DM with the task. Worker checks inbox, completes task,
-      posts WORKER_DM_DONE to channel. Lead confirms and terminates.
-    steps:
-      - name: lead
-        type: agent
-        agent: codex-lead
-        task: |
-          You are the lead. Send a task directly to claude-worker via DM.
-
-          STEP 1 — Find the claude-worker's registered name:
-          Call mcp__relaycast__list_agents() to find the agent whose name starts
-          with "worker-" (it will be registered as "worker-<id>").
-
-          STEP 2 — Send a DM to that agent:
-            mcp__relaycast__send_dm(to: "<worker-agent-name>", text: "DM_TASK: Output the string 'DM_RECEIVED_AND_DONE' to your terminal, then post WORKER_DM_DONE to #codex-lead-v5.")
-
-          STEP 3 — Poll #codex-lead-v5 until you see "WORKER_DM_DONE".
-
-          STEP 4 — Output:
-            DM_COORD_COMPLETE
-
-          Then terminate using remove_agent with $RELAY_AGENT_NAME.
-        verification:
-          type: output_contains
-          value: DM_COORD_COMPLETE
-
-      - name: worker
-        type: agent
-        agent: claude-worker
-        task: |
-          You are the worker. Wait for a DM from the lead with your task.
-
-          STEP 1 — Poll your relay inbox every 5 seconds until you receive
-          a DM containing "DM_TASK:".
-
-          STEP 2 — Complete the task from the DM: output to your terminal:
-            DM_RECEIVED_AND_DONE
-
-          STEP 3 — Post "WORKER_DM_DONE" to #codex-lead-v5.
-
-          STEP 4 — Output: WORKER_DM_COMPLETE
-
-          Then /exit.
-        verification:
-          type: output_contains
-          value: WORKER_DM_COMPLETE
diff --git a/tests/workflows/e2e-owner-review.yaml b/tests/workflows/e2e-owner-review.yaml
deleted file mode 100644
index bfc53a08c..000000000
--- a/tests/workflows/e2e-owner-review.yaml
+++ /dev/null
@@ -1,243 +0,0 @@
-version: '1.0'
-name: e2e-owner-review
-description: >
-  End-to-end test for PR #511: auto step owner resolution, per-step review
-  gating, hub-role word-boundary matching, review timeout budgeting, and
-  PTY echo handling for review decisions.
-
-  Scenarios:
-    1. Hub-role agent auto-assigned as owner (lead matches)
-    2. "github-integration" agent NOT matched as hub (word-boundary)
-    3. Review gating — approval flow
-    4. Review gating — rejection flow
-    5. Tight timeout for review budget testing
-    6. Lead + workers team with owner assignment
-
-swarm:
-  pattern: dag
-  channel: e2e-owner-review
-  maxConcurrency: 4
-  timeoutMs: 900000 # 15 min global
-
-agents:
-  # Hub-role agent — should be auto-assigned as owner for interactive steps
-  - name: team-lead
-    cli: claude
-    preset: lead
-    channels: [e2e-owner-review, team-track]
-    role: 'Lead coordinator for the workflow. Assigns and monitors tasks.'
-    constraints:
-      model: sonnet
-
-  # This agent's name contains "hub" as a substring in "github", but role
-  # says "github integration" — must NOT be matched as a hub-role agent
-  - name: github-integration
-    cli: claude
-    preset: worker
-    role: 'GitHub integration agent. Handles GitHub API calls and webhooks.'
-    constraints:
-      model: sonnet
-
-  # Standard worker — non-interactive, bounded task
-  - name: impl-worker
-    cli: claude
-    preset: worker
-    constraints:
-      model: sonnet
-
-  # Dedicated reviewer — should be picked for review gates
-  - name: quality-reviewer
-    cli: claude
-    preset: reviewer
-    role: 'Reviews step outputs for correctness and completeness.'
-    constraints:
-      model: sonnet
-
-  # A coordinator agent (lower priority than lead)
-  - name: coordinator-bot
-    cli: claude
-    channels: [e2e-owner-review]
-    role: 'Coordinator for fallback ownership tests.'
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: owner-review-e2e
-    description: >
-      DAG testing all PR #511 features: owner assignment, review gating,
-      hub-role matching, timeout budgeting, rejection flow, and team pattern.
-    onError: continue
-    steps:
-      # ── Scenario 1: Hub-role auto-ownership ──────────────────────────────
-      # team-lead (role: "Lead coordinator") should be auto-assigned as owner
-      # because "lead" has highest hub-role priority (6).
-
-      - name: context
-        type: deterministic
-        command: |
-          echo "PROJECT_ROOT: /tmp/e2e-owner-review"
-          echo "SCENARIO: Testing auto step owner and review gating"
-        captureOutput: true
-        failOnError: true
-
-      - name: hub-owner-test
-        type: agent
-        agent: impl-worker
-        dependsOn: [context]
-        task: |
-          List 3 benefits of automated code review.
-          Format each as "- <benefit>".
-          Then output: OWNER_TEST_DONE
-        verification:
-          type: output_contains
-          value: OWNER_TEST_DONE
-
-      # ── Scenario 2: github-integration NOT matched as hub ────────────────
-      # The agent named "github-integration" should NOT become an owner via
-      # hub-role matching. The word "hub" in "github" must not trigger a match.
-
-      - name: github-no-hub-match
-        type: agent
-        agent: github-integration
-        dependsOn: [context]
-        task: |
-          List 3 popular GitHub Actions for CI/CD.
-          Format each as "- <action>".
-          Then output: GITHUB_TEST_DONE
-        verification:
-          type: exit_code
-
-      # ── Scenario 3: Review gating — approval flow ───────────────────────
-      # After hub-owner-test completes, quality-reviewer should automatically
-      # review and approve the output.
-
-      - name: review-approval-gate
-        type: agent
-        agent: impl-worker
-        dependsOn: [hub-owner-test]
-        task: |
-          Previous step output: {{steps.hub-owner-test.output}}
-
-          Summarize the benefits listed above in one sentence.
-          Then output: APPROVAL_GATE_DONE
-        verification:
-          type: output_contains
-          value: APPROVAL_GATE_DONE
-
-      # ── Scenario 4: Review gating — rejection flow ──────────────────────
-      # This step intentionally produces bad output that a reviewer should reject.
-      # The workflow uses onError: continue so it won't abort.
-
-      - name: deliberate-bad-output
-        type: agent
-        agent: impl-worker
-        dependsOn: [context]
-        task: |
-          IMPORTANT: Output ONLY the following line with no other text:
-          THIS_IS_INTENTIONALLY_WRONG_OUTPUT_FOR_TESTING
-        verification:
-          type: output_contains
-          value: THIS_IS_INTENTIONALLY_WRONG_OUTPUT_FOR_TESTING
-
-      # ── Scenario 5: Tight timeout for review budget testing ─────────────
-      # With a 30s step timeout, the review budget should be:
-      # proportional = 30000/3 = 10000
-      # lowerBound = min(60000, 30000) = 30000
-      # upperBound = min(600000, 30000) = 30000
-      # result = min(max(10000, 30000), 30000) = 30000
-      # Review timeout must NOT exceed parent step timeout.
-
-      - name: tight-timeout-step
-        type: agent
-        agent: impl-worker
-        dependsOn: [context]
-        timeoutMs: 30000
-        task: |
-          Output exactly: TIMEOUT_TEST_DONE
-        verification:
-          type: output_contains
-          value: TIMEOUT_TEST_DONE
-
-      # ── Scenario 6: Lead + workers team with owner assignment ────────────
-      # team-lead coordinates on #team-track, workers execute in parallel.
-      # team-lead should be auto-assigned as owner for the coordination step.
-
-      - name: team-worker-1
-        type: agent
-        agent: impl-worker
-        dependsOn: [context]
-        task: |
-          You are worker-1 in a team test.
-          List 2 benefits of modular architecture.
-          Then output: TEAM_W1_DONE
-        verification:
-          type: output_contains
-          value: TEAM_W1_DONE
-
-      - name: team-worker-2
-        type: agent
-        agent: impl-worker
-        dependsOn: [context]
-        task: |
-          You are worker-2 in a team test.
-          List 2 benefits of automated testing.
-          Then output: TEAM_W2_DONE
-        verification:
-          type: output_contains
-          value: TEAM_W2_DONE
-
-      - name: team-lead-coord
-        type: agent
-        agent: team-lead
-        dependsOn: [context]
-        task: |
-          You are leading a team on #team-track.
-          Workers: team-worker-1 and team-worker-2 are running in parallel.
-
-          1. Check #team-track and inbox for TEAM_W1_DONE and TEAM_W2_DONE.
-          2. Wait up to 3 checks (30s apart) for both signals.
-          3. Once both are seen, output: TEAM_LEAD_COMPLETE
-        verification:
-          type: output_contains
-          value: TEAM_LEAD_COMPLETE
-
-      # ── Final merge: validates all scenarios ─────────────────────────────
-
-      - name: merge-results
-        type: deterministic
-        dependsOn:
-          - hub-owner-test
-          - github-no-hub-match
-          - review-approval-gate
-          - deliberate-bad-output
-          - tight-timeout-step
-          - team-lead-coord
-          - team-worker-1
-          - team-worker-2
-        command: |
-          echo "=== E2E Owner/Review Test Results ==="
-          echo "Scenario 1 (hub-owner): {{steps.hub-owner-test.output}}" | grep -q "OWNER_TEST_DONE" && echo "PASS: hub-owner" || echo "FAIL: hub-owner"
-          echo "Scenario 2 (github-no-hub): PASS (github-integration ran as worker, not hub)"
-          echo "Scenario 3 (review-approval): {{steps.review-approval-gate.output}}" | grep -q "APPROVAL_GATE_DONE" && echo "PASS: review-approval" || echo "FAIL: review-approval"
-          echo "Scenario 5 (tight-timeout): {{steps.tight-timeout-step.output}}" | grep -q "TIMEOUT_TEST_DONE" && echo "PASS: tight-timeout" || echo "FAIL: tight-timeout"
-          echo "Scenario 6 (team-pattern): {{steps.team-lead-coord.output}}" | grep -q "TEAM_LEAD_COMPLETE" && echo "PASS: team-pattern" || echo "FAIL: team-pattern"
-          echo "ALL_SCENARIOS_CHECKED"
-        captureOutput: true
-        failOnError: false
-
-coordination:
-  barriers:
-    - name: all-scenarios-done
-      waitFor:
-        - hub-owner-test
-        - github-no-hub-match
-        - review-approval-gate
-        - deliberate-bad-output
-        - tight-timeout-step
-        - team-lead-coord
-      timeoutMs: 600000
-
-state:
-  backend: memory
-  ttlMs: 3600000
-  namespace: e2e-owner-review
diff --git a/tests/workflows/real-multi-agent-owner-review.yaml b/tests/workflows/real-multi-agent-owner-review.yaml
deleted file mode 100644
index 5f9e546aa..000000000
--- a/tests/workflows/real-multi-agent-owner-review.yaml
+++ /dev/null
@@ -1,224 +0,0 @@
-version: '1.0'
-name: real-multi-agent-owner-review
-description: |
-  Complex real-world E2E test for PR #511. Multiple agents with DAG dependencies,
-  auto step owner assignment, review gating, and parallel execution.
-  Inspired by build-plan patterns. Uses real CLI agents.
-
-swarm:
-  pattern: dag
-  channel: multi-agent-review
-  maxConcurrency: 4
-  timeoutMs: 900000 # 15 min global
-
-agents:
-  # Lead — hub-role, should get auto-assigned as owner
-  - name: lead
-    cli: claude
-    preset: lead
-    channels: [multi-agent-review, coordination]
-    role: 'Lead coordinator. Plans architecture, delegates tasks, reviews progress.'
-    constraints:
-      model: sonnet
-      timeoutMs: 180000
-
-  # Two workers — parallel implementation
-  - name: worker-a
-    cli: claude
-    preset: worker
-    role: 'Backend worker. Implements server-side utilities.'
-    constraints:
-      model: sonnet
-      timeoutMs: 180000
-
-  - name: worker-b
-    cli: codex
-    preset: worker
-    role: 'Frontend worker. Implements client-side utilities.'
-    constraints:
-      timeoutMs: 180000
-
-  # Reviewer — dedicated review agent for gating
-  - name: reviewer
-    cli: claude
-    preset: reviewer
-    role: 'Quality reviewer. Reviews code for correctness, style, and edge cases.'
-    constraints:
-      model: sonnet
-      timeoutMs: 120000
-
-  # Agent with "hub" substring in name — must NOT be matched as hub-role
-  - name: github-bot
-    cli: claude
-    preset: worker
-    role: 'GitHub integration bot. Handles PR comments and status checks.'
-    constraints:
-      model: sonnet
-      timeoutMs: 120000
-
-workflows:
-  - name: multi-utility-build
-    description: |
-      Build two related utility functions in parallel, then integrate.
-      Tests: auto-owner, review gating, parallel execution, output chaining,
-      hub-role word-boundary matching (github-bot should NOT match as hub).
-    onError: continue
-    steps:
-      # ── Phase 1: Setup + Planning ──────────────────────────────────────
-      - name: setup
-        type: deterministic
-        command: |
-          WORKDIR=$(mktemp -d /tmp/relay-multi-e2e-XXXXXX)
-          mkdir -p "$WORKDIR/src" "$WORKDIR/tests"
-          echo "WORKDIR=$WORKDIR"
-          echo "Created project structure in $WORKDIR"
-        captureOutput: true
-        failOnError: true
-
-      # Lead creates the architecture plan
-      # Auto step owner should assign 'lead' here
-      - name: architecture
-        type: agent
-        agent: lead
-        dependsOn: [setup]
-        task: |
-          Context: {{steps.setup.output}}
-
-          Create an architecture plan for two small TypeScript utility modules:
-          1. `string-utils.ts` — functions: slugify(str), truncate(str, maxLen), capitalize(str)
-          2. `array-utils.ts` — functions: chunk(arr, size), unique(arr), flatten(arr)
-
-          For each module, specify:
-          - Function signatures with types
-          - Key implementation notes
-          - Edge cases to handle
-
-          Output a clear plan. End with: ARCHITECTURE_PLAN_DONE
-        verification:
-          type: output_contains
-          value: ARCHITECTURE_PLAN_DONE
-        timeoutMs: 180000
-
-      # ── Phase 2: Parallel Implementation ───────────────────────────────
-
-      # Worker A implements string-utils (claude)
-      - name: string-utils
-        type: agent
-        agent: worker-a
-        dependsOn: [architecture]
-        task: |
-          Context: {{steps.setup.output}}
-          Plan: {{steps.architecture.output}}
-
-          Implement `string-utils.ts` based on the architecture plan.
-          Write the file to the src/ directory in the working directory.
-          Include: slugify, truncate, capitalize functions.
-          Each function should handle edge cases (empty input, etc).
-
-          After writing the file, output: STRING_UTILS_DONE
-        verification:
-          type: output_contains
-          value: STRING_UTILS_DONE
-        timeoutMs: 180000
-
-      # Worker B implements array-utils (codex) — runs in parallel with string-utils
-      - name: array-utils
-        type: agent
-        agent: worker-b
-        dependsOn: [architecture]
-        task: |
-          Context: {{steps.setup.output}}
-          Plan: {{steps.architecture.output}}
-
-          Implement `array-utils.ts` based on the architecture plan.
-          Write the file to the src/ directory in the working directory.
-          Include: chunk, unique, flatten functions.
-          Each function should handle edge cases (empty arrays, etc).
-
-          After writing the file, output: ARRAY_UTILS_DONE
-        verification:
-          type: output_contains
-          value: ARRAY_UTILS_DONE
-        timeoutMs: 180000
-
-      # github-bot does a simple task — tests word-boundary matching
-      # This agent should NOT be auto-assigned as hub-role owner
-      - name: github-status
-        type: agent
-        agent: github-bot
-        dependsOn: [setup]
-        task: |
-          You are github-bot. List 3 common GitHub PR status check names.
-          Format as a bullet list. Then output: GITHUB_STATUS_DONE
-        verification:
-          type: output_contains
-          value: GITHUB_STATUS_DONE
-        timeoutMs: 120000
-
-      # ── Phase 3: Integration ───────────────────────────────────────────
-
-      # Lead integrates results from both workers
-      - name: integration
-        type: agent
-        agent: lead
-        dependsOn: [string-utils, array-utils]
-        task: |
-          Context: {{steps.setup.output}}
-
-          Both utility modules have been implemented:
-          - string-utils: {{steps.string-utils.output}}
-          - array-utils: {{steps.array-utils.output}}
-
-          Create an `index.ts` barrel file in the src/ directory that
-          re-exports all functions from both modules. Also create a brief
-          README.md in the working directory describing the utility library.
-
-          After creating both files, output: INTEGRATION_DONE
-        verification:
-          type: output_contains
-          value: INTEGRATION_DONE
-        timeoutMs: 180000
-
-      # ── Phase 4: Final Verification ────────────────────────────────────
-
-      - name: final-check
-        type: deterministic
-        dependsOn:
-          - architecture
-          - string-utils
-          - array-utils
-          - github-status
-          - integration
-        command: |
-          echo "=== Multi-Agent Owner/Review E2E Results ==="
-          echo ""
-          echo "Phase 1 — Architecture:"
-          echo "{{steps.architecture.output}}" | grep -q "ARCHITECTURE_PLAN_DONE" && echo "  PASS: architecture" || echo "  FAIL: architecture"
-          echo ""
-          echo "Phase 2 — Parallel Implementation:"
-          echo "{{steps.string-utils.output}}" | grep -q "STRING_UTILS_DONE" && echo "  PASS: string-utils (worker-a/claude)" || echo "  FAIL: string-utils"
-          echo "{{steps.array-utils.output}}" | grep -q "ARRAY_UTILS_DONE" && echo "  PASS: array-utils (worker-b/codex)" || echo "  FAIL: array-utils"
-          echo "{{steps.github-status.output}}" | grep -q "GITHUB_STATUS_DONE" && echo "  PASS: github-status (word-boundary test)" || echo "  FAIL: github-status"
-          echo ""
-          echo "Phase 3 — Integration:"
-          echo "{{steps.integration.output}}" | grep -q "INTEGRATION_DONE" && echo "  PASS: integration" || echo "  FAIL: integration"
-          echo ""
-          echo "MULTI_AGENT_TEST_COMPLETE"
-        captureOutput: true
-        failOnError: false
-
-coordination:
-  barriers:
-    - name: all-done
-      waitFor:
-        - architecture
-        - string-utils
-        - array-utils
-        - github-status
-        - integration
-      timeoutMs: 600000
-
-state:
-  backend: memory
-  ttlMs: 3600000
-  namespace: multi-agent-review
diff --git a/tests/workflows/real-owner-review-test.yaml b/tests/workflows/real-owner-review-test.yaml
deleted file mode 100644
index f1542c382..000000000
--- a/tests/workflows/real-owner-review-test.yaml
+++ /dev/null
@@ -1,121 +0,0 @@
-version: '1.0'
-name: real-owner-review-test
-description: |
-  Real-world E2E test for PR #511 features: auto step owner assignment,
-  review gating, and verification markers. Uses REAL CLI agents (claude, codex).
-  Small scope — 3 agent steps + 1 deterministic — finishes in ~5 minutes.
-
-swarm:
-  pattern: dag
-  channel: real-owner-review
-  maxConcurrency: 3
-  timeoutMs: 600000 # 10 min global
-
-agents:
-  # Lead agent — should be auto-assigned as step owner (hub-role priority)
-  - name: lead
-    cli: claude
-    preset: lead
-    channels: [real-owner-review]
-    role: 'Lead coordinator. Plans tasks and delegates to workers.'
-    constraints:
-      model: sonnet
-      timeoutMs: 180000
-
-  # Worker agent — implements based on lead's plan
-  - name: worker
-    cli: codex
-    preset: worker
-    role: 'Implementation worker. Writes code based on plans.'
-    constraints:
-      timeoutMs: 180000
-
-  # Reviewer agent — reviews worker output (tests review gating)
-  - name: reviewer
-    cli: claude
-    preset: reviewer
-    role: 'Code reviewer. Reviews implementations for correctness.'
-    constraints:
-      model: sonnet
-      timeoutMs: 120000
-
-workflows:
-  - name: utility-function
-    description: |
-      Lead plans a small utility function, worker implements it,
-      reviewer reviews the implementation. Tests auto step owner + review gate.
-    onError: continue
-    steps:
-      # Step 1: Deterministic setup — create a temp working directory
-      - name: setup
-        type: deterministic
-        command: |
-          WORKDIR=$(mktemp -d /tmp/relay-e2e-XXXXXX)
-          echo "WORKDIR=$WORKDIR"
-          echo "Created working directory: $WORKDIR"
-        captureOutput: true
-        failOnError: true
-
-      # Step 2: Lead creates a plan for a simple utility function
-      # Auto step owner should assign 'lead' as owner (hub-role match)
-      - name: plan
-        type: agent
-        agent: lead
-        dependsOn: [setup]
-        task: |
-          Context: {{steps.setup.output}}
-
-          Create a brief plan for a TypeScript utility function called `slugify`
-          that converts a string to a URL-friendly slug. The plan should include:
-          1. Function signature (input: string, output: string)
-          2. Key transformations: lowercase, replace spaces with hyphens, remove special chars
-          3. Edge cases: empty string, multiple spaces, leading/trailing whitespace
-
-          Output your plan as a numbered list. End with: PLAN_COMPLETE
-        verification:
-          type: output_contains
-          value: PLAN_COMPLETE
-        timeoutMs: 180000
-
-      # Step 3: Worker implements based on the plan (output chaining)
-      # Tests that codex agent can receive chained output and produce code
-      - name: implement
-        type: agent
-        agent: worker
-        dependsOn: [plan]
-        task: |
-          Context: {{steps.setup.output}}
-
-          Based on this plan:
-          {{steps.plan.output}}
-
-          Implement the `slugify` function in TypeScript. Write it to a file
-          called `slugify.ts` in the working directory from the context.
-          Include basic test cases as console.log assertions at the bottom.
-
-          After writing the file, output: IMPLEMENTATION_COMPLETE
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-        timeoutMs: 180000
-
-      # Step 4: Deterministic merge — check results
-      - name: verify-results
-        type: deterministic
-        dependsOn: [plan, implement]
-        command: |
-          echo "=== Real Owner/Review Test Results ==="
-          echo "Step: plan"
-          echo "{{steps.plan.output}}" | grep -q "PLAN_COMPLETE" && echo "PASS: plan completed" || echo "FAIL: plan"
-          echo ""
-          echo "Step: implement"
-          echo "{{steps.implement.output}}" | grep -q "IMPLEMENTATION_COMPLETE" && echo "PASS: implementation completed" || echo "FAIL: implementation"
-          echo ""
-          echo "ALL_STEPS_VERIFIED"
-        captureOutput: true
-        failOnError: false
-
-state:
-  backend: memory
-  ttlMs: 3600000
-  namespace: real-owner-review
diff --git a/tests/workflows/real-path-workdir-test.yaml b/tests/workflows/real-path-workdir-test.yaml
deleted file mode 100644
index 54cbf93d8..000000000
--- a/tests/workflows/real-path-workdir-test.yaml
+++ /dev/null
@@ -1,42 +0,0 @@
-version: '1.0'
-name: cross-repo-path-test
-description: E2E test for paths and workdir features (PR #488)
-paths:
-  - name: relaycast
-    path: /Users/khaliqgant/Projects/relaycast
-    description: Relaycast SDK repo
-  - name: relay-dashboard
-    path: /Users/khaliqgant/Projects/relay-dashboard
-    description: Dashboard UI
-swarm:
-  pattern: dag
-  maxConcurrency: 2
-  channel: path-test
-agents:
-  - name: analyzer
-    cli: claude
-    role: Code analyzer
-    preset: worker
-workflows:
-  - name: cross-repo-analysis
-    steps:
-      - name: check-relaycast
-        agent: analyzer
-        workdir: relaycast
-        task: |
-          Run `pwd` and `ls` in the current directory. Report what project this is based on the files you see.
-          At the very end of your response, output the exact string: RELAY_SDK_VERIFIED
-        verification:
-          type: output_contains
-          value: Relaycast
-      - name: check-dashboard
-        agent: analyzer
-        workdir: relay-dashboard
-        dependsOn: [check-relaycast]
-        task: |
-          Run `pwd` and `ls` in the current directory. Report what project this is.
-          Here is context from a previous step: {{steps.check-relaycast.output}}
-          At the very end of your response, output the exact string: DASH_VERIFIED
-        verification:
-          type: output_contains
-          value: dashboard
diff --git a/tests/workflows/real-supervisor-test.yaml b/tests/workflows/real-supervisor-test.yaml
deleted file mode 100644
index 35a8c751a..000000000
--- a/tests/workflows/real-supervisor-test.yaml
+++ /dev/null
@@ -1,98 +0,0 @@
-version: '1.0'
-name: supervisor-validation
-description: >
-  Tests the owner-supervisor model with real agents. Validates that the lead
-  agent is auto-assigned as supervisor for worker steps, runs concurrently
-  with the specialist, and signals STEP_COMPLETE independently.
-
-swarm:
-  pattern: dag
-  maxConcurrency: 3
-  timeoutMs: 600000
-  channel: supervisor-test
-
-agents:
-  - name: lead
-    cli: claude
-    preset: lead
-    role: Team lead and supervisor
-    channels: [supervisor-test]
-    constraints:
-      model: sonnet
-
-  - name: coder
-    cli: claude
-    role: Code implementer
-    channels: [supervisor-test]
-    constraints:
-      model: sonnet
-
-  - name: reviewer
-    cli: claude
-    role: Code reviewer
-    channels: [supervisor-test]
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: supervised-build
-    steps:
-      - name: implement
-        type: agent
-        agent: coder
-        task: |
-          Create a file at /tmp/supervisor-test/utils.ts with a simple
-          TypeScript utility: a function called `slugify` that converts
-          a string to a URL-safe slug. Include JSDoc comments and
-          handle edge cases (empty string, special chars, multiple spaces).
-
-          When done, output: IMPLEMENT_DONE
-        verification:
-          type: file_exists
-          value: /tmp/supervisor-test/utils.ts
-
-      - name: test-it
-        type: agent
-        agent: coder
-        dependsOn: [implement]
-        task: |
-          Create a test file at /tmp/supervisor-test/utils.test.ts
-          that tests the slugify function from utils.ts.
-          Write at least 5 test cases covering edge cases.
-          Context from implementation: {{steps.implement.output}}
-
-          When done, output: TESTS_DONE
-        verification:
-          type: file_exists
-          value: /tmp/supervisor-test/utils.test.ts
-
-      - name: review
-        type: agent
-        agent: reviewer
-        dependsOn: [implement, test-it]
-        task: |
-          Review the implementation and tests:
-          Implementation: {{steps.implement.output}}
-          Tests: {{steps.test-it.output}}
-
-          Check for: correctness, edge cases, code quality.
-          Output: REVIEW_COMPLETE
-        verification:
-          type: output_contains
-          value: REVIEW_COMPLETE
-
-      - name: final-check
-        type: deterministic
-        dependsOn: [review]
-        command: |
-          echo "=== Supervisor Validation Results ==="
-          test -f /tmp/supervisor-test/utils.ts && echo "PASS: utils.ts exists" || echo "FAIL: utils.ts missing"
-          test -f /tmp/supervisor-test/utils.test.ts && echo "PASS: utils.test.ts exists" || echo "FAIL: utils.test.ts missing"
-          echo "VALIDATION_COMPLETE"
-        captureOutput: true
-        failOnError: false
-
-state:
-  backend: memory
-  ttlMs: 3600000
-  namespace: supervisor-validation
diff --git a/tests/workflows/run-e2e-owner-review.ts b/tests/workflows/run-e2e-owner-review.ts
deleted file mode 100644
index 70df9ec0b..000000000
--- a/tests/workflows/run-e2e-owner-review.ts
+++ /dev/null
@@ -1,648 +0,0 @@
-/**
- * E2E test harness for PR #511: auto step owner + per-step review gating.
- *
- * This file validates the workflow runner's owner/review features by:
- * 1. Running the unit test suite (which uses mocked DB/relay)
- * 2. Parsing a real workflow YAML and validating it against the schema
- * 3. Reporting PASS/FAIL for each scenario
- *
- * Usage:
- *   npx tsx tests/workflows/run-e2e-owner-review.ts
- *
- * Or via the test runner:
- *   npx vitest run tests/workflows/run-e2e-owner-review.ts
- */
-
-import { describe, it, expect, vi, beforeEach } from 'vitest';
-import { readFileSync } from 'node:fs';
-import { resolve, dirname } from 'node:path';
-import { fileURLToPath } from 'node:url';
-// These types are imported relative to the SDK source. When running via vitest
-// from the SDK directory, use the SDK vitest config which includes src/__tests__.
-// From repo root, the aliases resolve correctly.
-import type { WorkflowDb } from '../../packages/sdk/src/workflows/runner.js';
-import type {
-  RelayYamlConfig,
-  WorkflowRunRow,
-  WorkflowStepRow,
-} from '../../packages/sdk/src/workflows/types.js';
-
-// ── Mock fetch ──────────────────────────────────────────────────────────────
-
-const mockFetch = vi.fn().mockResolvedValue({
-  ok: true,
-  json: () => Promise.resolve({ data: { api_key: 'rk_live_test', workspace_id: 'ws-test' } }),
-  text: () => Promise.resolve(''),
-});
-vi.stubGlobal('fetch', mockFetch);
-
-// ── Mock RelayCast SDK ──────────────────────────────────────────────────────
-
-const mockRelaycastAgent = {
-  send: vi.fn().mockResolvedValue(undefined),
-  heartbeat: vi.fn().mockResolvedValue(undefined),
-  channels: {
-    create: vi.fn().mockResolvedValue(undefined),
-    join: vi.fn().mockResolvedValue(undefined),
-    invite: vi.fn().mockResolvedValue(undefined),
-  },
-};
-
-const mockRelaycast = {
-  agents: { register: vi.fn().mockResolvedValue({ token: 'token-1' }) },
-  as: vi.fn().mockReturnValue(mockRelaycastAgent),
-};
-
-class MockRelayError extends Error {
-  code: string;
-  constructor(code: string, message: string, status = 400) {
-    super(message);
-    this.code = code;
-    this.name = 'RelayError';
-    (this as any).status = status;
-  }
-}
-
-vi.mock('@relaycast/sdk', () => ({
-  RelayCast: vi.fn().mockImplementation(() => mockRelaycast),
-  RelayError: MockRelayError,
-}));
-
-// ── Mock AgentRelay ─────────────────────────────────────────────────────────
-
-let waitForExitFn: (ms?: number) => Promise<'exited' | 'timeout' | 'released'>;
-let waitForIdleFn: (ms?: number) => Promise<'idle' | 'timeout' | 'exited'>;
-let mockSpawnOutputs: string[] = [];
-
-const mockAgent = {
-  name: 'test-agent-abc',
-  get waitForExit() {
-    return waitForExitFn;
-  },
-  get waitForIdle() {
-    return waitForIdleFn;
-  },
-  release: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockHuman = {
-  name: 'WorkflowRunner',
-  sendMessage: vi.fn().mockResolvedValue(undefined),
-};
-
-const mockListeners = new Map<string, Set<(...args: any[]) => void>>();
-function emitMockEvent(event: string, ...args: any[]): void {
-  const set = mockListeners.get(event);
-  if (set) for (const cb of set) cb(...args);
-}
-
-const mockRelayInstance = {
-  spawnPty: vi.fn().mockImplementation(async ({ name, task }: { name: string; task?: string }) => {
-    const queued = mockSpawnOutputs.shift();
-    const stepComplete = task?.match(/STEP_COMPLETE:([^\n]+)/)?.[1]?.trim();
-    const isReview = task?.includes('REVIEW_DECISION: APPROVE or REJECT');
-    const output =
-      queued ??
-      (isReview
-        ? 'REVIEW_DECISION: APPROVE\nREVIEW_REASON: looks good\n'
-        : stepComplete
-          ? `STEP_COMPLETE:${stepComplete}\n`
-          : 'STEP_COMPLETE:unknown\n');
-
-    queueMicrotask(() => {
-      emitMockEvent('workerOutput', { name, chunk: output });
-    });
-
-    return { ...mockAgent, name };
-  }),
-  human: vi.fn().mockReturnValue(mockHuman),
-  shutdown: vi.fn().mockResolvedValue(undefined),
-  onBrokerStderr: vi.fn().mockReturnValue(() => {}),
-  addListener: vi.fn((event: string, cb: (...args: any[]) => void) => {
-    let set = mockListeners.get(event);
-    if (!set) {
-      set = new Set();
-      mockListeners.set(event, set);
-    }
-    set.add(cb);
-    return () => set!.delete(cb);
-  }),
-  listAgentsRaw: vi.fn().mockResolvedValue([]),
-};
-
-vi.mock('../../packages/sdk/src/relay.js', () => ({
-  AgentRelay: vi.fn().mockImplementation(() => mockRelayInstance),
-}));
-
-// Import after mocking
-const { WorkflowRunner } = await import('../../packages/sdk/src/workflows/runner.js');
-
-// ── Helpers ─────────────────────────────────────────────────────────────────
-
-function makeDb(): WorkflowDb {
-  const runs = new Map<string, WorkflowRunRow>();
-  const steps = new Map<string, WorkflowStepRow>();
-  return {
-    insertRun: vi.fn(async (run: WorkflowRunRow) => {
-      runs.set(run.id, { ...run });
-    }),
-    updateRun: vi.fn(async (id: string, patch: Partial<WorkflowRunRow>) => {
-      const existing = runs.get(id);
-      if (existing) runs.set(id, { ...existing, ...patch });
-    }),
-    getRun: vi.fn(async (id: string) => {
-      const run = runs.get(id);
-      return run ? { ...run } : null;
-    }),
-    insertStep: vi.fn(async (step: WorkflowStepRow) => {
-      steps.set(step.id, { ...step });
-    }),
-    updateStep: vi.fn(async (id: string, patch: Partial<WorkflowStepRow>) => {
-      const existing = steps.get(id);
-      if (existing) steps.set(id, { ...existing, ...patch });
-    }),
-    getStepsByRunId: vi.fn(async (runId: string) => {
-      return [...steps.values()].filter((s) => s.runId === runId);
-    }),
-  };
-}
-
-function makeConfig(overrides: Partial<RelayYamlConfig> = {}): RelayYamlConfig {
-  return {
-    version: '1',
-    name: 'e2e-owner-review-test',
-    swarm: { pattern: 'dag' },
-    agents: [
-      { name: 'agent-a', cli: 'claude' },
-      { name: 'agent-b', cli: 'claude' },
-    ],
-    workflows: [
-      {
-        name: 'default',
-        steps: [
-          { name: 'step-1', agent: 'agent-a', task: 'Do step 1' },
-          { name: 'step-2', agent: 'agent-b', task: 'Do step 2', dependsOn: ['step-1'] },
-        ],
-      },
-    ],
-    trajectories: false,
-    ...overrides,
-  };
-}
-
-function never<T>(): Promise<T> {
-  return new Promise(() => {});
-}
-
-// ── E2E Scenarios ───────────────────────────────────────────────────────────
-
-describe('PR #511 E2E: Auto Step Owner + Review Gating', () => {
-  let db: WorkflowDb;
-  let runner: InstanceType<typeof WorkflowRunner>;
-
-  beforeEach(() => {
-    vi.clearAllMocks();
-    waitForExitFn = vi.fn().mockResolvedValue('exited');
-    waitForIdleFn = vi.fn().mockImplementation(() => never());
-    mockSpawnOutputs = [];
-    mockListeners.clear();
-    db = makeDb();
-    runner = new WorkflowRunner({ db, workspaceId: 'ws-test' });
-  });
-
-  // ── Scenario 1: Hub-role agent auto-assigned as owner ───────────────────
-
-  describe('Scenario 1: Hub-role auto-ownership', () => {
-    it('should auto-assign lead agent as owner for specialist steps', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      const config = makeConfig({
-        agents: [
-          { name: 'impl-worker', cli: 'claude', role: 'implementer' },
-          { name: 'team-lead', cli: 'claude', role: 'Lead coordinator for the workflow' },
-          { name: 'quality-reviewer', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'hub-owner-test', agent: 'impl-worker', task: 'List 3 benefits' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments).toHaveLength(1);
-      expect(ownerAssignments[0].owner).toBe('team-lead');
-      expect(ownerAssignments[0].specialist).toBe('impl-worker');
-    }, 15000);
-
-    it('should prioritize lead over coordinator in owner resolution', async () => {
-      const ownerAssignments: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') ownerAssignments.push(event.ownerName);
-      });
-
-      const config = makeConfig({
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'coord-bot', cli: 'claude', role: 'coordinator' },
-          { name: 'lead-bot', cli: 'claude', role: 'lead' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'specialist', task: 'Do work' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments[0]).toBe('lead-bot');
-    }, 15000);
-  });
-
-  // ── Scenario 2: github-integration NOT matched as hub ───────────────────
-
-  describe('Scenario 2: Hub word-boundary matching', () => {
-    it('should NOT match "github-integration" as hub-role agent', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      const config = makeConfig({
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'github-integration', cli: 'claude', role: 'GitHub integration agent' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'github-no-hub', agent: 'specialist', task: 'Test word boundary' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      // github-integration should NOT be owner — specialist owns itself
-      expect(ownerAssignments[0].owner).not.toBe('github-integration');
-      expect(ownerAssignments[0].owner).toBe('specialist');
-    }, 15000);
-
-    it('should NOT match "github-bot" with role "github integration" as hub', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({ owner: event.ownerName, specialist: event.specialistName });
-        }
-      });
-
-      const config = makeConfig({
-        agents: [
-          { name: 'specialist', cli: 'claude', role: 'engineer' },
-          { name: 'github-bot', cli: 'claude', role: 'github integration' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'specialist', task: 'Do work' }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerAssignments[0].owner).not.toBe('github-bot');
-      expect(ownerAssignments[0].owner).toBe('specialist');
-    }, 15000);
-  });
-
-  // ── Scenario 3: Review gating — approval flow ──────────────────────────
-
-  describe('Scenario 3: Review gating approval', () => {
-    it('should emit step:review-completed with approved decision', async () => {
-      const reviewEvents: Array<{ decision: string; reviewerName: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          reviewEvents.push({ decision: event.decision, reviewerName: event.reviewerName });
-        }
-      });
-
-      // Default mock outputs APPROVE, so no need to queue special output
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-      expect(reviewEvents.length).toBeGreaterThanOrEqual(1);
-      expect(reviewEvents[0].decision).toBe('approved');
-    }, 15000);
-
-    it('should gate step completion on review approval', async () => {
-      const stepEvents: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:completed' || event.type === 'step:review-completed') {
-          stepEvents.push(event.type);
-        }
-      });
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-      // Review must complete before step is marked completed
-      const reviewIdx = stepEvents.indexOf('step:review-completed');
-      const completedIdx = stepEvents.indexOf('step:completed');
-      expect(reviewIdx).toBeLessThan(completedIdx);
-    }, 15000);
-  });
-
-  // ── Scenario 4: Review gating — rejection flow ─────────────────────────
-
-  describe('Scenario 4: Review gating rejection', () => {
-    it('should fail the step when reviewer rejects', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      mockSpawnOutputs = [
-        'STEP_COMPLETE:step-1\n',
-        'REVIEW_DECISION: REJECT\nREVIEW_REASON: output is incomplete\n',
-      ];
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review rejected');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    }, 15000);
-
-    it('should fail closed when review output is malformed (no REVIEW_DECISION)', async () => {
-      mockSpawnOutputs = ['STEP_COMPLETE:step-1\n', 'REVIEW_REASON: this is missing the decision line\n'];
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('review response malformed');
-    }, 15000);
-
-    it('should use last REVIEW_DECISION match when PTY echoes prompt (reject)', async () => {
-      const events: Array<{ type: string; decision?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:review-completed') {
-          events.push({ type: event.type, decision: event.decision });
-        }
-      });
-
-      // PTY echoes the prompt (which contains "APPROVE or REJECT"), then actual REJECT
-      const echoedPrompt =
-        'Return exactly:\nREVIEW_DECISION: APPROVE or REJECT\nREVIEW_REASON: <one sentence>\n';
-      const actualResponse = 'REVIEW_DECISION: REJECT\nREVIEW_REASON: code has critical bugs\n';
-      mockSpawnOutputs = ['STEP_COMPLETE:step-1\n', echoedPrompt + actualResponse];
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(events).toContainEqual({ type: 'step:review-completed', decision: 'rejected' });
-    }, 15000);
-  });
-
-  // ── Scenario 5: Review timeout budgeting ───────────────────────────────
-
-  describe('Scenario 5: Review timeout budgeting', () => {
-    it('should not allocate review timeout longer than parent step timeout', async () => {
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'agent-a', task: 'Do step 1', timeoutMs: 30_000 }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-
-      // Check that the waitForExit calls respect the timeout budget
-      const waitCalls = (waitForExitFn as any).mock?.calls ?? [];
-      expect(waitCalls.length).toBeGreaterThanOrEqual(2);
-      // Second call is the review timeout — must not exceed parent step timeout
-      const reviewTimeout = waitCalls[1][0];
-      expect(reviewTimeout).toBeLessThanOrEqual(30_000);
-    }, 15000);
-
-    it('should use proportional timeout (1/3) for longer step timeouts', async () => {
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'agent-a', task: 'Do step 1', timeoutMs: 900_000 }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-
-      const waitCalls = (waitForExitFn as any).mock?.calls ?? [];
-      expect(waitCalls.length).toBeGreaterThanOrEqual(2);
-      const reviewTimeout = waitCalls[1][0];
-      // proportional = 300_000, lowerBound = 60_000, upperBound = 600_000
-      // result = min(max(300_000, 60_000), 600_000) = 300_000
-      expect(reviewTimeout).toBe(300_000);
-    }, 15000);
-
-    it('should cap review timeout at 600s upper bound', async () => {
-      const config = makeConfig({
-        workflows: [
-          {
-            name: 'default',
-            steps: [{ name: 'step-1', agent: 'agent-a', task: 'Do step 1', timeoutMs: 3_600_000 }],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-
-      const waitCalls = (waitForExitFn as any).mock?.calls ?? [];
-      expect(waitCalls.length).toBeGreaterThanOrEqual(2);
-      const reviewTimeout = waitCalls[1][0];
-      // proportional = 1_200_000, lowerBound = 60_000, upperBound = 600_000
-      // result = min(max(1_200_000, 60_000), 600_000) = 600_000
-      expect(reviewTimeout).toBe(600_000);
-    }, 15000);
-  });
-
-  // ── Scenario 6: Owner timeout emission ─────────────────────────────────
-
-  describe('Scenario 6: Owner timeout events', () => {
-    it('should emit step:owner-timeout when owner exceeds time limit', async () => {
-      const events: Array<{ type: string; stepName?: string; ownerName?: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-timeout') {
-          events.push({ type: event.type, stepName: event.stepName, ownerName: event.ownerName });
-        }
-      });
-
-      waitForExitFn = vi.fn().mockResolvedValue('timeout');
-      waitForIdleFn = vi.fn().mockResolvedValue('timeout');
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('timed out');
-      expect(events.length).toBeGreaterThanOrEqual(1);
-      expect(events[0].type).toBe('step:owner-timeout');
-      expect(events[0].stepName).toBe('step-1');
-    }, 15000);
-
-    it('should NOT emit step:owner-timeout for review timeouts', async () => {
-      const ownerTimeouts: string[] = [];
-      const reviewEvents: string[] = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-timeout') ownerTimeouts.push(event.stepName);
-        if (event.type === 'step:review-completed') reviewEvents.push(event.decision);
-      });
-
-      // Owner succeeds, review approves — no timeouts
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-      expect(ownerTimeouts).toHaveLength(0);
-    }, 15000);
-  });
-
-  // ── Scenario 7: Multi-agent team with owner assignment ─────────────────
-
-  describe('Scenario 7: Lead + workers team pattern', () => {
-    it('should assign lead as owner for all team steps', async () => {
-      const ownerAssignments: Array<{ owner: string; specialist: string; step: string }> = [];
-      runner.on((event) => {
-        if (event.type === 'step:owner-assigned') {
-          ownerAssignments.push({
-            owner: event.ownerName,
-            specialist: event.specialistName,
-            step: event.stepName,
-          });
-        }
-      });
-
-      const config = makeConfig({
-        agents: [
-          { name: 'team-lead', cli: 'claude', role: 'Lead coordinator' },
-          { name: 'worker-1', cli: 'claude', role: 'implementer' },
-          { name: 'worker-2', cli: 'claude', role: 'implementer' },
-          { name: 'reviewer-1', cli: 'claude', role: 'reviewer' },
-        ],
-        workflows: [
-          {
-            name: 'default',
-            steps: [
-              { name: 'work-1', agent: 'worker-1', task: 'Do task A' },
-              { name: 'work-2', agent: 'worker-2', task: 'Do task B' },
-              {
-                name: 'lead-coord',
-                agent: 'team-lead',
-                task: 'Coordinate workers',
-                dependsOn: ['work-1', 'work-2'],
-              },
-            ],
-          },
-        ],
-      });
-
-      const run = await runner.execute(config, 'default');
-      expect(run.status).toBe('completed');
-      // All steps should have owner assignments
-      expect(ownerAssignments.length).toBeGreaterThanOrEqual(3);
-      // Worker steps should be owned by the lead (hub-role agent)
-      const worker1Owner = ownerAssignments.find((a) => a.step === 'work-1');
-      const worker2Owner = ownerAssignments.find((a) => a.step === 'work-2');
-      expect(worker1Owner?.owner).toBe('team-lead');
-      expect(worker2Owner?.owner).toBe('team-lead');
-      // Lead step should own itself
-      const leadOwner = ownerAssignments.find((a) => a.step === 'lead-coord');
-      expect(leadOwner?.owner).toBe('team-lead');
-    }, 30000);
-  });
-
-  // ── Scenario 8: YAML workflow parsing ──────────────────────────────────
-
-  describe('Scenario 8: E2E workflow YAML validation', () => {
-    it('should parse the e2e-owner-review.yaml without errors', () => {
-      const __dirname = dirname(fileURLToPath(import.meta.url));
-      const yamlPath = resolve(__dirname, 'e2e-owner-review.yaml');
-      const yamlContent = readFileSync(yamlPath, 'utf-8');
-
-      // Validate it can be parsed
-      const config = runner.parseYamlString(yamlContent);
-      expect(config.name).toBe('e2e-owner-review');
-      expect(config.agents).toHaveLength(5);
-      expect(config.workflows).toHaveLength(1);
-
-      // Verify agent definitions
-      const agentNames = config.agents!.map((a: any) => a.name);
-      expect(agentNames).toContain('team-lead');
-      expect(agentNames).toContain('github-integration');
-      expect(agentNames).toContain('impl-worker');
-      expect(agentNames).toContain('quality-reviewer');
-      expect(agentNames).toContain('coordinator-bot');
-
-      // Verify workflow steps
-      const steps = config.workflows![0].steps;
-      const stepNames = steps.map((s: any) => s.name);
-      expect(stepNames).toContain('hub-owner-test');
-      expect(stepNames).toContain('github-no-hub-match');
-      expect(stepNames).toContain('review-approval-gate');
-      expect(stepNames).toContain('deliberate-bad-output');
-      expect(stepNames).toContain('tight-timeout-step');
-      expect(stepNames).toContain('team-lead-coord');
-      expect(stepNames).toContain('merge-results');
-    });
-
-    it('should detect all hub-role agents correctly from YAML', () => {
-      const __dirname = dirname(fileURLToPath(import.meta.url));
-      const yamlPath = resolve(__dirname, 'e2e-owner-review.yaml');
-      const yamlContent = readFileSync(yamlPath, 'utf-8');
-      const config = runner.parseYamlString(yamlContent);
-
-      // team-lead has role "Lead coordinator" — word "Lead" should match hub role
-      const teamLead = config.agents!.find((a: any) => a.name === 'team-lead');
-      expect(teamLead?.role).toMatch(/\blead\b/i);
-
-      // github-integration should NOT match — "hub" is substring of "github"
-      const githubAgent = config.agents!.find((a: any) => a.name === 'github-integration');
-      expect(githubAgent?.role).not.toMatch(/\bhub\b/i);
-      expect(githubAgent?.name).not.toMatch(/\bhub\b/i);
-
-      // coordinator-bot has role "Coordinator" — should match hub role
-      const coordBot = config.agents!.find((a: any) => a.name === 'coordinator-bot');
-      expect(coordBot?.role).toMatch(/\bcoordinator\b/i);
-    });
-  });
-
-  // ── Scenario 9: Owner completion marker validation ─────────────────────
-
-  describe('Scenario 9: Owner completion marker', () => {
-    it('should fail when owner does not produce STEP_COMPLETE marker', async () => {
-      mockSpawnOutputs = ['The work is done but I forgot the sentinel.\n'];
-
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('failed');
-      expect(run.error).toContain('owner completion marker');
-    }, 15000);
-
-    it('should succeed when owner produces correct STEP_COMPLETE:step-name', async () => {
-      // Default mock auto-generates correct markers, so this should succeed
-      const run = await runner.execute(makeConfig(), 'default');
-      expect(run.status).toBe('completed');
-    }, 15000);
-  });
-});
diff --git a/tests/workflows/test-codex-failure.yaml b/tests/workflows/test-codex-failure.yaml
deleted file mode 100644
index e6e2e8561..000000000
--- a/tests/workflows/test-codex-failure.yaml
+++ /dev/null
@@ -1,26 +0,0 @@
-version: '1.0'
-name: test-codex-failure
-
-description: Intentional failure case to verify workflow failure handling.
-
-swarm:
-  pattern: pipeline
-  channel: test-codex-failure
-  timeoutMs: 180000
-
-agents:
-  - name: codex-fail
-    cli: codex
-    preset: worker
-
-workflows:
-  - name: codex-failure
-    steps:
-      - name: fail-step
-        type: agent
-        agent: codex-fail
-        task: |
-          Output exactly THIS_WILL_NOT_MATCH
-        verification:
-          type: output_contains
-          value: EXPECTED_SENTINEL
diff --git a/tests/workflows/test-codex-lead-worker.yaml b/tests/workflows/test-codex-lead-worker.yaml
deleted file mode 100644
index 0cd066439..000000000
--- a/tests/workflows/test-codex-lead-worker.yaml
+++ /dev/null
@@ -1,63 +0,0 @@
-version: '1.0'
-name: test-codex-lead-worker
-
-description: Real Codex lead/worker coordination workflow.
-
-swarm:
-  pattern: dag
-  channel: test-codex-lead-worker
-  maxConcurrency: 2
-  timeoutMs: 300000
-  idleNudge:
-    nudgeAfterMs: 90000
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: codex-lead
-    cli: codex
-    preset: lead
-    channels: [test-codex-lead-worker]
-  - name: codex-worker
-    cli: codex
-    preset: worker
-    channels: [test-codex-lead-worker]
-
-workflows:
-  - name: codex-lead-worker
-    steps:
-      - name: lead
-        type: agent
-        agent: codex-lead
-        task: |
-          You are the lead on #test-codex-lead-worker.
-
-          1. Post this exact assignment to the channel:
-             ASSIGNMENT: Output WORK_RESULT: apples and then post WORKER_DONE
-
-          2. Poll the channel until you see WORKER_DONE.
-
-          3. Then output exactly:
-             LEAD_DONE
-
-          4. Exit by outputting:
-             /exit
-        verification:
-          type: output_contains
-          value: LEAD_DONE
-
-      - name: worker
-        type: agent
-        agent: codex-worker
-        task: |
-          You are the worker on #test-codex-lead-worker.
-
-          1. Poll the channel until you see ASSIGNMENT:.
-          2. Output exactly:
-             WORK_RESULT: apples
-             WORKER_COMPLETE
-          3. Post exactly WORKER_DONE to the channel.
-          4. Exit.
-        verification:
-          type: output_contains
-          value: WORKER_COMPLETE
diff --git a/tests/workflows/test-codex-map-reduce.yaml b/tests/workflows/test-codex-map-reduce.yaml
deleted file mode 100644
index f7c2c339f..000000000
--- a/tests/workflows/test-codex-map-reduce.yaml
+++ /dev/null
@@ -1,66 +0,0 @@
-version: '1.0'
-name: test-codex-map-reduce
-
-description: Real Codex map-reduce/scatter-gather workflow.
-
-swarm:
-  pattern: dag
-  channel: test-codex-map-reduce
-  maxConcurrency: 3
-  timeoutMs: 360000
-
-agents:
-  - name: codex-map-a
-    cli: codex
-    preset: worker
-  - name: codex-map-b
-    cli: codex
-    preset: worker
-  - name: codex-reducer
-    cli: codex
-    preset: worker
-
-workflows:
-  - name: codex-map-reduce
-    steps:
-      - name: map-a
-        type: agent
-        agent: codex-map-a
-        task: |
-          Output exactly:
-          FRUIT=apple
-          MAP_A_DONE
-        verification:
-          type: output_contains
-          value: MAP_A_DONE
-
-      - name: map-b
-        type: agent
-        agent: codex-map-b
-        task: |
-          Output exactly:
-          FRUIT=banana
-          MAP_B_DONE
-        verification:
-          type: output_contains
-          value: MAP_B_DONE
-
-      - name: reduce
-        type: agent
-        agent: codex-reducer
-        dependsOn: [map-a, map-b]
-        task: |
-          Combine these two outputs into a single result.
-
-          A:
-          {{steps.map-a.output}}
-
-          B:
-          {{steps.map-b.output}}
-
-          Output exactly:
-          REDUCE_RESULT=apple,banana
-          REDUCE_DONE
-        verification:
-          type: output_contains
-          value: REDUCE_DONE
diff --git a/tests/workflows/test-codex-parallel.yaml b/tests/workflows/test-codex-parallel.yaml
deleted file mode 100644
index 5caa1a478..000000000
--- a/tests/workflows/test-codex-parallel.yaml
+++ /dev/null
@@ -1,39 +0,0 @@
-version: '1.0'
-name: test-codex-parallel
-
-description: Minimal Codex parallel fan-out workflow.
-
-swarm:
-  pattern: dag
-  channel: test-codex-parallel
-  timeoutMs: 240000
-  maxConcurrency: 2
-
-agents:
-  - name: codex-left
-    cli: codex
-    preset: worker
-  - name: codex-right
-    cli: codex
-    preset: worker
-
-workflows:
-  - name: codex-parallel
-    steps:
-      - name: left
-        type: agent
-        agent: codex-left
-        task: |
-          Output exactly LEFT_OK
-        verification:
-          type: output_contains
-          value: LEFT_OK
-
-      - name: right
-        type: agent
-        agent: codex-right
-        task: |
-          Output exactly RIGHT_OK
-        verification:
-          type: output_contains
-          value: RIGHT_OK
diff --git a/tests/workflows/test-codex-sequential.yaml b/tests/workflows/test-codex-sequential.yaml
deleted file mode 100644
index e15c5c07f..000000000
--- a/tests/workflows/test-codex-sequential.yaml
+++ /dev/null
@@ -1,43 +0,0 @@
-version: '1.0'
-name: test-codex-sequential
-
-description: Minimal sequential Codex workflow with step output chaining.
-
-swarm:
-  pattern: pipeline
-  channel: test-codex-seq
-  timeoutMs: 240000
-
-agents:
-  - name: codex-a
-    cli: codex
-    preset: worker
-  - name: codex-b
-    cli: codex
-    preset: worker
-
-workflows:
-  - name: codex-sequential
-    steps:
-      - name: first
-        type: agent
-        agent: codex-a
-        task: |
-          Output exactly:
-          FIRST_OK
-          VALUE=alpha
-        verification:
-          type: output_contains
-          value: VALUE=alpha
-
-      - name: second
-        type: agent
-        agent: codex-b
-        dependsOn: [first]
-        task: |
-          Read this injected prior output and respond exactly:
-          SEEN_PREVIOUS={{steps.first.output}}
-          SECOND_OK
-        verification:
-          type: output_contains
-          value: SECOND_OK
diff --git a/tests/workflows/test-codex-simple.yaml b/tests/workflows/test-codex-simple.yaml
deleted file mode 100644
index 63ff2c801..000000000
--- a/tests/workflows/test-codex-simple.yaml
+++ /dev/null
@@ -1,29 +0,0 @@
-version: '1.0'
-name: test-codex-simple
-description: >
-  Minimal Codex-backed workflow sanity check. Validates that a single
-  non-interactive agent step can run and satisfy output verification.
-
-swarm:
-  pattern: pipeline
-  channel: test-codex-simple
-  timeoutMs: 180000
-
-agents:
-  - name: codex-worker
-    cli: codex
-    preset: worker
-
-workflows:
-  - name: codex-simple
-    steps:
-      - name: codex-step
-        type: agent
-        agent: codex-worker
-        task: |
-          Output exactly these two lines and nothing else:
-          CODEX_WORKFLOW_OK
-          DONE
-        verification:
-          type: output_contains
-          value: DONE
diff --git a/tests/workflows/test-codex-supervisor.yaml b/tests/workflows/test-codex-supervisor.yaml
deleted file mode 100644
index fd43541e4..000000000
--- a/tests/workflows/test-codex-supervisor.yaml
+++ /dev/null
@@ -1,74 +0,0 @@
-version: '1.0'
-name: test-codex-supervisor
-
-description: Real Codex supervisor workflow with two workers and a merge.
-
-swarm:
-  pattern: dag
-  channel: test-codex-supervisor
-  maxConcurrency: 3
-  timeoutMs: 360000
-
-agents:
-  - name: codex-worker-a
-    cli: codex
-    preset: worker
-  - name: codex-worker-b
-    cli: codex
-    preset: worker
-  - name: codex-reviewer
-    cli: codex
-    preset: reviewer
-
-workflows:
-  - name: codex-supervisor
-    steps:
-      - name: worker-a
-        type: agent
-        agent: codex-worker-a
-        task: |
-          Output exactly:
-          ITEM_A=red
-          WORKER_A_DONE
-        verification:
-          type: output_contains
-          value: WORKER_A_DONE
-
-      - name: worker-b
-        type: agent
-        agent: codex-worker-b
-        task: |
-          Output exactly:
-          ITEM_B=blue
-          WORKER_B_DONE
-        verification:
-          type: output_contains
-          value: WORKER_B_DONE
-
-      - name: supervisor
-        type: agent
-        agent: codex-reviewer
-        dependsOn: [worker-a, worker-b]
-        task: |
-          Review these worker outputs:
-
-          A:
-          {{steps.worker-a.output}}
-
-          B:
-          {{steps.worker-b.output}}
-
-          If both outputs are present, output exactly:
-          SUPERVISOR_OK
-          ITEMS=2
-        verification:
-          type: output_contains
-          value: SUPERVISOR_OK
-
-      - name: merge
-        type: deterministic
-        dependsOn: [supervisor]
-        command: |
-          echo "{{steps.supervisor.output}}" | grep -q "SUPERVISOR_OK" && echo "MERGE_OK" || (echo "MERGE_FAIL" >&2; exit 1)
-        captureOutput: true
-        failOnError: true
diff --git a/tests/workflows/test-deterministic-pipeline.yaml b/tests/workflows/test-deterministic-pipeline.yaml
deleted file mode 100644
index fe5b851e3..000000000
--- a/tests/workflows/test-deterministic-pipeline.yaml
+++ /dev/null
@@ -1,43 +0,0 @@
-version: '1.0'
-name: test-deterministic-pipeline
-description: >
-  Tests a pure deterministic pipeline with shell steps and output chaining.
-  No agents involved. Validates: step sequencing, captureOutput, {{steps.X.output}}
-  interpolation, failOnError, and the overall pipeline pattern.
-
-swarm:
-  pattern: pipeline
-  channel: test-det-pipeline
-  timeoutMs: 60000
-
-workflows:
-  - name: deterministic-only
-    steps:
-      - name: generate
-        type: deterministic
-        command: printf 'hello from step one\nvalue=42\n'
-        captureOutput: true
-        failOnError: true
-
-      - name: transform
-        type: deterministic
-        dependsOn: [generate]
-        command: >
-          echo "{{steps.generate.output}}" |
-          tr '[:lower:]' '[:upper:]'
-        captureOutput: true
-        failOnError: true
-
-      - name: verify
-        type: deterministic
-        dependsOn: [transform]
-        command: |
-          output="{{steps.transform.output}}"
-          if echo "$output" | grep -q "HELLO FROM STEP ONE"; then
-            echo "PIPELINE_OK"
-          else
-            echo "PIPELINE_FAIL: unexpected output: $output" >&2
-            exit 1
-          fi
-        captureOutput: true
-        failOnError: true
diff --git a/tests/workflows/test-gemini-failure.yaml b/tests/workflows/test-gemini-failure.yaml
deleted file mode 100644
index d8929150c..000000000
--- a/tests/workflows/test-gemini-failure.yaml
+++ /dev/null
@@ -1,26 +0,0 @@
-version: '1.0'
-name: test-gemini-failure
-
-description: Intentional failure case to verify Gemini workflow failure handling.
-
-swarm:
-  pattern: pipeline
-  channel: test-gemini-failure
-  timeoutMs: 180000
-
-agents:
-  - name: gemini-fail
-    cli: gemini
-    preset: worker
-
-workflows:
-  - name: gemini-failure
-    steps:
-      - name: fail-step
-        type: agent
-        agent: gemini-fail
-        task: |
-          Output exactly THIS_WILL_NOT_MATCH
-        verification:
-          type: output_contains
-          value: EXPECTED_SENTINEL
diff --git a/tests/workflows/test-gemini-lead-worker.yaml b/tests/workflows/test-gemini-lead-worker.yaml
deleted file mode 100644
index b98d8a054..000000000
--- a/tests/workflows/test-gemini-lead-worker.yaml
+++ /dev/null
@@ -1,62 +0,0 @@
-version: '1.0'
-name: test-gemini-lead-worker
-
-description: Real Gemini lead/worker coordination workflow.
-
-swarm:
-  pattern: dag
-  channel: test-gemini-lead-worker
-  maxConcurrency: 2
-  timeoutMs: 420000
-  idleNudge:
-    nudgeAfterMs: 120000
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: gemini-lead
-    cli: gemini
-    preset: lead
-    channels: [test-gemini-lead-worker]
-  - name: gemini-worker
-    cli: gemini
-    preset: worker
-    channels: [test-gemini-lead-worker]
-
-workflows:
-  - name: gemini-lead-worker
-    steps:
-      - name: lead
-        type: agent
-        agent: gemini-lead
-        task: |
-          You are the lead on #test-gemini-lead-worker.
-
-          1. Post this exact assignment to the channel:
-             ASSIGNMENT: Output WORK_RESULT: pears and then post WORKER_DONE
-
-          2. Poll the channel until you see WORKER_DONE.
-
-          3. Then output exactly:
-             LEAD_DONE
-
-          4. Exit.
-        verification:
-          type: output_contains
-          value: LEAD_DONE
-
-      - name: worker
-        type: agent
-        agent: gemini-worker
-        task: |
-          You are the worker on #test-gemini-lead-worker.
-
-          1. Poll the channel until you see ASSIGNMENT:.
-          2. Output exactly:
-             WORK_RESULT: pears
-             WORKER_COMPLETE
-          3. Post exactly WORKER_DONE to the channel.
-          4. Exit.
-        verification:
-          type: output_contains
-          value: WORKER_COMPLETE
diff --git a/tests/workflows/test-gemini-map-reduce.yaml b/tests/workflows/test-gemini-map-reduce.yaml
deleted file mode 100644
index 443f02033..000000000
--- a/tests/workflows/test-gemini-map-reduce.yaml
+++ /dev/null
@@ -1,66 +0,0 @@
-version: '1.0'
-name: test-gemini-map-reduce
-
-description: Real Gemini map-reduce/scatter-gather workflow.
-
-swarm:
-  pattern: dag
-  channel: test-gemini-map-reduce
-  maxConcurrency: 3
-  timeoutMs: 420000
-
-agents:
-  - name: gemini-map-a
-    cli: gemini
-    preset: worker
-  - name: gemini-map-b
-    cli: gemini
-    preset: worker
-  - name: gemini-reducer
-    cli: gemini
-    preset: worker
-
-workflows:
-  - name: gemini-map-reduce
-    steps:
-      - name: map-a
-        type: agent
-        agent: gemini-map-a
-        task: |
-          Output exactly:
-          FRUIT=kiwi
-          MAP_A_DONE
-        verification:
-          type: output_contains
-          value: MAP_A_DONE
-
-      - name: map-b
-        type: agent
-        agent: gemini-map-b
-        task: |
-          Output exactly:
-          FRUIT=mango
-          MAP_B_DONE
-        verification:
-          type: output_contains
-          value: MAP_B_DONE
-
-      - name: reduce
-        type: agent
-        agent: gemini-reducer
-        dependsOn: [map-a, map-b]
-        task: |
-          Combine these two outputs into a single result.
-
-          A:
-          {{steps.map-a.output}}
-
-          B:
-          {{steps.map-b.output}}
-
-          Output exactly:
-          REDUCE_RESULT=kiwi,mango
-          REDUCE_DONE
-        verification:
-          type: output_contains
-          value: REDUCE_DONE
diff --git a/tests/workflows/test-gemini-parallel.yaml b/tests/workflows/test-gemini-parallel.yaml
deleted file mode 100644
index 37522f198..000000000
--- a/tests/workflows/test-gemini-parallel.yaml
+++ /dev/null
@@ -1,39 +0,0 @@
-version: '1.0'
-name: test-gemini-parallel
-
-description: Minimal Gemini parallel fan-out workflow.
-
-swarm:
-  pattern: dag
-  channel: test-gemini-parallel
-  timeoutMs: 240000
-  maxConcurrency: 2
-
-agents:
-  - name: gemini-left
-    cli: gemini
-    preset: worker
-  - name: gemini-right
-    cli: gemini
-    preset: worker
-
-workflows:
-  - name: gemini-parallel
-    steps:
-      - name: left
-        type: agent
-        agent: gemini-left
-        task: |
-          Output exactly LEFT_OK
-        verification:
-          type: output_contains
-          value: LEFT_OK
-
-      - name: right
-        type: agent
-        agent: gemini-right
-        task: |
-          Output exactly RIGHT_OK
-        verification:
-          type: output_contains
-          value: RIGHT_OK
diff --git a/tests/workflows/test-gemini-sequential.yaml b/tests/workflows/test-gemini-sequential.yaml
deleted file mode 100644
index 730ad273a..000000000
--- a/tests/workflows/test-gemini-sequential.yaml
+++ /dev/null
@@ -1,43 +0,0 @@
-version: '1.0'
-name: test-gemini-sequential
-
-description: Minimal sequential Gemini workflow with step output chaining.
-
-swarm:
-  pattern: pipeline
-  channel: test-gemini-seq
-  timeoutMs: 240000
-
-agents:
-  - name: gemini-a
-    cli: gemini
-    preset: worker
-  - name: gemini-b
-    cli: gemini
-    preset: worker
-
-workflows:
-  - name: gemini-sequential
-    steps:
-      - name: first
-        type: agent
-        agent: gemini-a
-        task: |
-          Output exactly:
-          FIRST_OK
-          VALUE=beta
-        verification:
-          type: output_contains
-          value: VALUE=beta
-
-      - name: second
-        type: agent
-        agent: gemini-b
-        dependsOn: [first]
-        task: |
-          Read this injected prior output and respond exactly:
-          SEEN_PREVIOUS={{steps.first.output}}
-          SECOND_OK
-        verification:
-          type: output_contains
-          value: SECOND_OK
diff --git a/tests/workflows/test-gemini-simple.yaml b/tests/workflows/test-gemini-simple.yaml
deleted file mode 100644
index f495d4659..000000000
--- a/tests/workflows/test-gemini-simple.yaml
+++ /dev/null
@@ -1,28 +0,0 @@
-version: '1.0'
-name: test-gemini-simple
-
-description: Minimal Gemini-backed workflow sanity check.
-
-swarm:
-  pattern: pipeline
-  channel: test-gemini-simple
-  timeoutMs: 180000
-
-agents:
-  - name: gemini-worker
-    cli: gemini
-    preset: worker
-
-workflows:
-  - name: gemini-simple
-    steps:
-      - name: gemini-step
-        type: agent
-        agent: gemini-worker
-        task: |
-          Output exactly these two lines and nothing else:
-          GEMINI_WORKFLOW_OK
-          DONE
-        verification:
-          type: output_contains
-          value: DONE
diff --git a/tests/workflows/test-gemini-supervisor.yaml b/tests/workflows/test-gemini-supervisor.yaml
deleted file mode 100644
index ee44edde7..000000000
--- a/tests/workflows/test-gemini-supervisor.yaml
+++ /dev/null
@@ -1,74 +0,0 @@
-version: '1.0'
-name: test-gemini-supervisor
-
-description: Real Gemini supervisor workflow with two workers and a merge.
-
-swarm:
-  pattern: dag
-  channel: test-gemini-supervisor
-  maxConcurrency: 3
-  timeoutMs: 420000
-
-agents:
-  - name: gemini-worker-a
-    cli: gemini
-    preset: worker
-  - name: gemini-worker-b
-    cli: gemini
-    preset: worker
-  - name: gemini-reviewer
-    cli: gemini
-    preset: reviewer
-
-workflows:
-  - name: gemini-supervisor
-    steps:
-      - name: worker-a
-        type: agent
-        agent: gemini-worker-a
-        task: |
-          Output exactly:
-          ITEM_A=green
-          WORKER_A_DONE
-        verification:
-          type: output_contains
-          value: WORKER_A_DONE
-
-      - name: worker-b
-        type: agent
-        agent: gemini-worker-b
-        task: |
-          Output exactly:
-          ITEM_B=yellow
-          WORKER_B_DONE
-        verification:
-          type: output_contains
-          value: WORKER_B_DONE
-
-      - name: supervisor
-        type: agent
-        agent: gemini-reviewer
-        dependsOn: [worker-a, worker-b]
-        task: |
-          Review these worker outputs.
-
-          A:
-          {{steps.worker-a.output}}
-
-          B:
-          {{steps.worker-b.output}}
-
-          If both outputs are present, output exactly:
-          SUPERVISOR_OK
-          ITEMS=2
-        verification:
-          type: output_contains
-          value: SUPERVISOR_OK
-
-      - name: merge
-        type: deterministic
-        dependsOn: [supervisor]
-        command: |
-          echo "{{steps.supervisor.output}}" | grep -q "SUPERVISOR_OK" && echo "MERGE_OK" || (echo "MERGE_FAIL" >&2; exit 1)
-        captureOutput: true
-        failOnError: true
diff --git a/tests/workflows/test-lead-worker-pattern.yaml b/tests/workflows/test-lead-worker-pattern.yaml
deleted file mode 100644
index e4fb4e072..000000000
--- a/tests/workflows/test-lead-worker-pattern.yaml
+++ /dev/null
@@ -1,120 +0,0 @@
-version: '1.0'
-name: test-lead-worker-pattern
-description: >
-  Tests the canonical relay-coordinated lead + worker(s) pattern.
-  Lead is interactive (PTY, relay-aware). Workers that must post channel signals
-  are also interactive and relay-connected.
-
-  DAG structure: context → [work-a, work-b, coordinate] → merge
-  Workers and lead all start after context. Lead watches the channel for
-  worker DONE signals. Workers post signals when complete. Lead posts
-  LEAD_COMPLETE once both are seen. Merge step validates all outputs.
-
-  This is the correct pattern — workers are NOT downstream of the lead step.
-  The lead runs in parallel with workers and monitors their progress.
-
-swarm:
-  pattern: dag
-  channel: test-lw-pattern
-  timeoutMs: 600000 # 10 min
-  idleNudge:
-    nudgeAfterMs: 180000 # 3 min — give lead time to observe worker signals
-    escalateAfterMs: 60000
-    maxNudges: 2
-
-agents:
-  - name: lead
-    cli: claude
-    preset: lead
-    channels: [test-lw-pattern]
-    constraints:
-      model: sonnet
-
-  - name: worker-a
-    cli: claude
-    role: worker
-    channels: [test-lw-pattern]
-    constraints:
-      model: sonnet
-
-  - name: worker-b
-    cli: claude
-    role: worker
-    channels: [test-lw-pattern]
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: lead-worker
-    steps:
-      - name: context
-        type: deterministic
-        command: >
-          echo "TASK_A: List 3 benefits of TypeScript type safety." &&
-          echo "TASK_B: List 3 benefits of pure functions."
-        captureOutput: true
-        failOnError: true
-
-      # Steps 2, 3, 4 all start in parallel after context.
-      # Relay-coordinated workers stay interactive so they can send channel signals.
-      - name: work-a
-        type: agent
-        agent: worker-a
-        dependsOn: [context]
-        task: |
-          List exactly 3 benefits of TypeScript type safety.
-          Format each as a single sentence starting with "- ".
-          Then post exactly WORKER_A_DONE to #test-lw-pattern.
-          Then output exactly:
-          WORKER_A_DONE
-          /exit
-        verification:
-          type: output_contains
-          value: WORKER_A_DONE
-
-      - name: work-b
-        type: agent
-        agent: worker-b
-        dependsOn: [context]
-        task: |
-          List exactly 3 benefits of pure functions.
-          Format each as a single sentence starting with "- ".
-          Then post exactly WORKER_B_DONE to #test-lw-pattern.
-          Then output exactly:
-          WORKER_B_DONE
-          /exit
-        verification:
-          type: output_contains
-          value: WORKER_B_DONE
-
-      - name: coordinate
-        type: agent
-        agent: lead
-        dependsOn: [context]
-        task: |
-          You are monitoring two parallel workers on channel #test-lw-pattern.
-          The workers are already running and will post their results there.
-
-          Context for reference:
-          {{steps.context.output}}
-
-          Instructions:
-          1. Check your inbox and the channel for worker-authored WORKER_A_DONE and WORKER_B_DONE signals.
-          2. If you don't see them yet, wait 30 seconds and check again (up to 5 times).
-          3. Once you see both signals, post to #test-lw-pattern: LEAD_COMPLETE
-          4. Then output exactly:
-             LEAD_COMPLETE
-             /exit
-        verification:
-          type: output_contains
-          value: LEAD_COMPLETE
-
-      - name: merge
-        type: deterministic
-        dependsOn: [work-a, work-b, coordinate]
-        command: |
-          echo "work-a: {{steps.work-a.output}}" | grep -q "WORKER_A_DONE" && \
-          echo "work-b: {{steps.work-b.output}}" | grep -q "WORKER_B_DONE" && \
-          echo "ALL_COMPLETE" || (echo "MERGE_FAIL" >&2; exit 1)
-        captureOutput: true
-        failOnError: true
diff --git a/tests/workflows/test-non-interactive-bounded.yaml b/tests/workflows/test-non-interactive-bounded.yaml
deleted file mode 100644
index 0b258a7a3..000000000
--- a/tests/workflows/test-non-interactive-bounded.yaml
+++ /dev/null
@@ -1,74 +0,0 @@
-version: '1.0'
-name: test-non-interactive-bounded
-description: >
-  Validates that non-interactive (preset: worker/analyst/reviewer) agents
-  complete reliably when the task is small and self-contained.
-  Key rule: non-interactive agents must NEVER discover information via tools —
-  all file content is injected by a prior deterministic step.
-
-swarm:
-  pattern: pipeline
-  channel: test-ni-bounded
-  timeoutMs: 300000 # 5 min total — any step taking longer is a bug
-
-agents:
-  - name: summarizer
-    cli: claude
-    preset: worker
-    constraints:
-      model: sonnet
-
-  - name: validator
-    cli: claude
-    preset: reviewer
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: bounded-non-interactive
-    steps:
-      # Step 1: deterministic — read a small file and inject its content
-      - name: read-file
-        type: deterministic
-        command: >
-          echo "FILE_CONTENT_START" &&
-          head -30 packages/sdk/src/workflows/types.ts &&
-          echo "FILE_CONTENT_END"
-        captureOutput: true
-        failOnError: true
-
-      # Step 2: non-interactive agent receives the content directly — no tool use needed
-      - name: summarize
-        type: agent
-        agent: summarizer
-        dependsOn: [read-file]
-        task: |
-          Summarize the following TypeScript type definitions in 3 bullet points.
-          Do not read any files — all content is provided below.
-
-          {{steps.read-file.output}}
-
-          Output exactly:
-          SUMMARY_START
-          - <bullet 1>
-          - <bullet 2>
-          - <bullet 3>
-          SUMMARY_DONE
-        verification:
-          type: output_contains
-          value: SUMMARY_DONE
-
-      # Step 3: reviewer validates the summary — also gets content injected
-      - name: review
-        type: agent
-        agent: validator
-        dependsOn: [summarize]
-        task: |
-          Check that the following summary contains exactly 3 bullet points
-          and each bullet is non-empty. Reply REVIEW_PASS if correct,
-          REVIEW_FAIL with a reason if not.
-
-          {{steps.summarize.output}}
-        verification:
-          type: output_contains
-          value: REVIEW_PASS
diff --git a/tests/workflows/test-step-sizing.yaml b/tests/workflows/test-step-sizing.yaml
deleted file mode 100644
index 0d8b7c5b3..000000000
--- a/tests/workflows/test-step-sizing.yaml
+++ /dev/null
@@ -1,66 +0,0 @@
-version: '1.0'
-name: test-step-sizing
-description: >
-  Demonstrates the correct step-sizing principle: one agent step = one clear,
-  bounded deliverable. Compares a correctly-sized step (succeeds fast) against
-  a deliberately oversized step (too many concerns in one prompt) to show why
-  splitting matters. Use this as a reference for authoring durable workflows.
-
-swarm:
-  pattern: dag
-  channel: test-step-sizing
-  timeoutMs: 300000 # 5 min
-
-agents:
-  - name: worker
-    cli: claude
-    preset: worker
-    constraints:
-      model: sonnet
-
-workflows:
-  - name: step-sizing
-    steps:
-      # GOOD: one step, one deliverable, small input injected directly
-      - name: good-small-task
-        type: agent
-        agent: worker
-        task: |
-          Count the number of vowels in this string: "the quick brown fox"
-
-          Output only: VOWEL_COUNT=<number>
-          Then: TASK_DONE
-        verification:
-          type: output_contains
-          value: TASK_DONE
-
-      # GOOD: chained — second step gets the output of the first injected, not discovered
-      - name: good-chained-task
-        type: agent
-        agent: worker
-        dependsOn: [good-small-task]
-        task: |
-          The previous step produced this output:
-
-          {{steps.good-small-task.output}}
-
-          Extract the number from VOWEL_COUNT=<number> and output:
-          DOUBLED=<that number times 2>
-          Then: CHAIN_DONE
-        verification:
-          type: output_contains
-          value: CHAIN_DONE
-
-      # GOOD: deterministic validation requires no agent
-      - name: validate
-        type: deterministic
-        dependsOn: [good-chained-task]
-        command: |
-          output='{{steps.good-chained-task.output}}'
-          if echo "$output" | grep -q 'DOUBLED='; then
-            echo "VALIDATION_PASS"
-          else
-            echo "VALIDATION_FAIL" >&2; exit 1
-          fi
-        captureOutput: true
-        failOnError: true
diff --git a/tests/workflows/test-trajectory-quality.yaml b/tests/workflows/test-trajectory-quality.yaml
deleted file mode 100644
index 90c6b39ac..000000000
--- a/tests/workflows/test-trajectory-quality.yaml
+++ /dev/null
@@ -1,58 +0,0 @@
-version: '1.0'
-name: test-trajectory-quality
-description: >
-  Verifies that trajectory files capture reasoning (purpose, step intent,
-  completion sentinel) not just mechanical event logs.
-  Verification_mismatch classification is covered by trajectory-quality.test.ts.
-
-swarm:
-  pattern: pipeline
-  channel: test-traj-quality
-  timeoutMs: 300000
-
-agents:
-  - name: worker
-    cli: claude
-    preset: worker
-    constraints:
-      model: haiku
-
-workflows:
-  - name: trajectory-quality
-    steps:
-      - name: work
-        type: agent
-        agent: worker
-        task: 'Output exactly: WORK_DONE'
-        verification:
-          type: output_contains
-          value: WORK_DONE
-
-      - name: check-trajectory
-        type: deterministic
-        dependsOn: [work]
-        # Search across all trajectory files for any that belong to THIS workflow
-        # (identified by the workflow name in the task title). Old runs in the
-        # directory don't interfere — we find the one that matches this run.
-        command: >-
-          node -e "
-          const fs=require('fs');
-          const dirs=['.trajectories/active','.trajectories/completed'];
-          const files=dirs.flatMap(d=>fs.existsSync(d)?fs.readdirSync(d).filter(f=>f.endsWith('.json')).map(f=>d+'/'+f):[]);
-          if(!files.length){console.error('No trajectory files found');process.exit(1);}
-          const parsed=files.map(f=>{try{return JSON.parse(fs.readFileSync(f,'utf8'));}catch{return null;}}).filter(Boolean);
-          const t=parsed.find(x=>x.task&&x.task.title&&x.task.title.includes('trajectory-quality'));
-          if(!t){console.error('No trajectory for this run. Titles:',parsed.map(x=>x.task&&x.task.title));process.exit(1);}
-          const events=t.chapters.flatMap(c=>c.events);
-          const has=s=>events.some(e=>e.content.includes(s));
-          if(!has('Verifies that trajectory')){console.error('FAIL: no purpose event. Events:',events.slice(0,5).map(e=>e.content));process.exit(1);}
-          console.log('PASS purpose');
-          if(!has('Output exactly')){console.error('FAIL: no step intent event');process.exit(1);}
-          console.log('PASS step intent');
-          if(!has('WORK_DONE')){console.error('FAIL: completion sentinel missing');process.exit(1);}
-          console.log('PASS sentinel');
-          console.log('TRAJECTORY_QUALITY_PASS');
-          console.log('(retrospective/approach checked by integration tests after run completes)');
-          "
-        captureOutput: true
-        failOnError: true
diff --git a/tests/workflows/validation-interactive-codex-lead-worker.yaml b/tests/workflows/validation-interactive-codex-lead-worker.yaml
deleted file mode 100644
index e4215f2bd..000000000
--- a/tests/workflows/validation-interactive-codex-lead-worker.yaml
+++ /dev/null
@@ -1,65 +0,0 @@
-version: '1.0'
-name: validation-interactive-codex-lead-worker
-swarm:
-  pattern: dag
-  channel: validation-interactive-codex-lead-worker
-  timeoutMs: 180000
-  idleNudge:
-    nudgeAfterMs: 60000
-    escalateAfterMs: 45000
-    maxNudges: 2
-agents:
-  - name: lead
-    cli: codex
-    channels: [validation-interactive-codex-lead-worker]
-    constraints:
-      model: gpt-5.3-codex
-  - name: worker
-    cli: codex
-    preset: worker
-    interactive: true
-    channels: [validation-interactive-codex-lead-worker]
-    constraints:
-      model: gpt-5.3-codex
-workflows:
-  - name: happy-path
-    steps:
-      - name: lead-step
-        type: agent
-        agent: lead
-        task: |
-          You are the lead coordinating a single worker on #validation-interactive-codex-lead-worker.
-
-          STEP 1 — Post exactly this channel message:
-          ASSIGNMENT: Output WORKER_SIGNAL locally, then post WORKER_DONE to #validation-interactive-codex-lead-worker.
-
-          STEP 2 — Poll the channel until you see a message containing WORKER_DONE.
-
-          STEP 3 — Output exactly:
-          LEAD_DONE
-
-          Then self-terminate immediately.
-        verification:
-          type: output_contains
-          value: LEAD_DONE
-
-      - name: worker-step
-        type: agent
-        agent: worker
-        task: |
-          You are the worker on #validation-interactive-codex-lead-worker.
-
-          STEP 1 — Wait until the channel contains a message with ASSIGNMENT:.
-
-          STEP 2 — Output exactly:
-          WORKER_SIGNAL
-
-          STEP 3 — Post exactly WORKER_DONE to #validation-interactive-codex-lead-worker.
-
-          STEP 4 — Output exactly:
-          WORKER_DONE_LOCAL
-
-          Then self-terminate immediately.
-        verification:
-          type: output_contains
-          value: WORKER_DONE_LOCAL
diff --git a/tests/workflows/validation-lead-worker-happy-strict.yaml b/tests/workflows/validation-lead-worker-happy-strict.yaml
deleted file mode 100644
index ebb0526ce..000000000
--- a/tests/workflows/validation-lead-worker-happy-strict.yaml
+++ /dev/null
@@ -1,29 +0,0 @@
-version: '1.0'
-name: validation-lead-worker-happy-strict
-swarm:
-  pattern: dag
-  channel: validation-lead-worker-happy-strict
-  timeoutMs: 180000
-agents:
-  - name: lead
-    cli: claude
-    preset: lead
-    channels: [validation-lead-worker-happy-strict]
-  - name: worker
-    cli: claude
-    preset: worker
-    interactive: true
-    channels: [validation-lead-worker-happy-strict]
-workflows:
-  - name: happy-strict
-    steps:
-      - name: worker-step
-        type: agent
-        agent: worker
-        task: |
-          Output exactly:
-          WORKER_DONE_LOCALLY
-          /exit
-        verification:
-          type: output_contains
-          value: WORKER_DONE_LOCALLY
diff --git a/tests/workflows/validation-legacy-marker.yaml b/tests/workflows/validation-legacy-marker.yaml
deleted file mode 100644
index c0dba3698..000000000
--- a/tests/workflows/validation-legacy-marker.yaml
+++ /dev/null
@@ -1,23 +0,0 @@
-version: '1.0'
-name: validation-legacy-marker
-swarm:
-  pattern: pipeline
-  channel: validation-legacy-marker
-  timeoutMs: 180000
-agents:
-  - name: legacy-worker
-    cli: codex
-    preset: worker
-workflows:
-  - name: legacy-marker
-    steps:
-      - name: legacy-step
-        type: agent
-        agent: legacy-worker
-        task: |
-          Output exactly:
-          STEP_COMPLETE:legacy-step
-          LEGACY_OK
-        verification:
-          type: output_contains
-          value: LEGACY_OK
diff --git a/tests/workflows/validation-map-reduce.yaml b/tests/workflows/validation-map-reduce.yaml
deleted file mode 100644
index f1d9a624c..000000000
--- a/tests/workflows/validation-map-reduce.yaml
+++ /dev/null
@@ -1,54 +0,0 @@
-version: '1.0'
-name: validation-map-reduce
-swarm:
-  pattern: dag
-  channel: validation-map-reduce
-  timeoutMs: 360000
-  maxConcurrency: 3
-agents:
-  - name: map-a
-    cli: codex
-    preset: worker
-  - name: map-b
-    cli: codex
-    preset: worker
-  - name: reducer
-    cli: codex
-    preset: worker
-workflows:
-  - name: map-reduce
-    steps:
-      - name: map-a-step
-        type: agent
-        agent: map-a
-        task: |
-          Output exactly:
-          FRUIT=apple
-          MAP_A_DONE
-        verification:
-          type: output_contains
-          value: MAP_A_DONE
-      - name: map-b-step
-        type: agent
-        agent: map-b
-        task: |
-          Output exactly:
-          FRUIT=banana
-          MAP_B_DONE
-        verification:
-          type: output_contains
-          value: MAP_B_DONE
-      - name: reduce-step
-        type: agent
-        agent: reducer
-        dependsOn: [map-a-step, map-b-step]
-        task: |
-          Combine these outputs:
-          A: {{steps.map-a-step.output}}
-          B: {{steps.map-b-step.output}}
-          Output exactly:
-          REDUCE_RESULT=apple,banana
-          REDUCE_DONE
-        verification:
-          type: output_contains
-          value: REDUCE_DONE
diff --git a/tests/workflows/validation-owner-retry-strict.yaml b/tests/workflows/validation-owner-retry-strict.yaml
deleted file mode 100644
index 0a759b6a0..000000000
--- a/tests/workflows/validation-owner-retry-strict.yaml
+++ /dev/null
@@ -1,38 +0,0 @@
-version: '1.0'
-name: validation-owner-retry-strict
-swarm:
-  pattern: pipeline
-  channel: validation-owner-retry-strict
-  timeoutMs: 300000
-agents:
-  - name: worker
-    cli: codex
-    preset: worker
-  - name: reviewer
-    cli: codex
-    preset: reviewer
-workflows:
-  - name: owner-retry-strict
-    steps:
-      - name: worker-step
-        type: agent
-        agent: worker
-        task: |
-          Output exactly:
-          PARTIAL_OUTPUT
-        verification:
-          type: output_contains
-          value: PARTIAL_OUTPUT
-      - name: review-step
-        type: agent
-        agent: reviewer
-        dependsOn: [worker-step]
-        task: |
-          Review this output:
-          {{steps.worker-step.output}}
-          Output exactly:
-          OWNER_DECISION: INCOMPLETE_RETRY
-          REASON: explicit retry requested
-        verification:
-          type: output_contains
-          value: 'OWNER_DECISION: INCOMPLETE_RETRY'
diff --git a/tests/workflows/validation-supervisor.yaml b/tests/workflows/validation-supervisor.yaml
deleted file mode 100644
index 77836495f..000000000
--- a/tests/workflows/validation-supervisor.yaml
+++ /dev/null
@@ -1,54 +0,0 @@
-version: '1.0'
-name: validation-supervisor
-swarm:
-  pattern: dag
-  channel: validation-supervisor
-  timeoutMs: 360000
-  maxConcurrency: 3
-agents:
-  - name: worker-a
-    cli: codex
-    preset: worker
-  - name: worker-b
-    cli: codex
-    preset: worker
-  - name: reviewer
-    cli: codex
-    preset: reviewer
-workflows:
-  - name: supervisor
-    steps:
-      - name: worker-a-step
-        type: agent
-        agent: worker-a
-        task: |
-          Output exactly:
-          ITEM_A=red
-          WORKER_A_DONE
-        verification:
-          type: output_contains
-          value: WORKER_A_DONE
-      - name: worker-b-step
-        type: agent
-        agent: worker-b
-        task: |
-          Output exactly:
-          ITEM_B=blue
-          WORKER_B_DONE
-        verification:
-          type: output_contains
-          value: WORKER_B_DONE
-      - name: review-step
-        type: agent
-        agent: reviewer
-        dependsOn: [worker-a-step, worker-b-step]
-        task: |
-          Review these outputs:
-          A: {{steps.worker-a-step.output}}
-          B: {{steps.worker-b-step.output}}
-          Output exactly:
-          OWNER_DECISION: COMPLETE
-          REASON: both worker outputs present
-        verification:
-          type: output_contains
-          value: 'OWNER_DECISION: COMPLETE'
diff --git a/tests/workflows/validation-wrong-sender-lead-posts-worker-done.yaml b/tests/workflows/validation-wrong-sender-lead-posts-worker-done.yaml
deleted file mode 100644
index ec745c7c0..000000000
--- a/tests/workflows/validation-wrong-sender-lead-posts-worker-done.yaml
+++ /dev/null
@@ -1,49 +0,0 @@
-version: '1.0'
-name: validation-wrong-sender-lead-posts-worker-done
-swarm:
-  pattern: dag
-  channel: validation-wrong-sender-lead-posts-worker-done
-  timeoutMs: 420000
-  maxConcurrency: 2
-  idleNudge:
-    nudgeAfterMs: 90000
-    escalateAfterMs: 60000
-    maxNudges: 1
-agents:
-  - name: lead
-    cli: codex
-    preset: lead
-    channels: [validation-wrong-sender-lead-posts-worker-done]
-  - name: worker
-    cli: codex
-    preset: worker
-    channels: [validation-wrong-sender-lead-posts-worker-done]
-workflows:
-  - name: wrong-sender-strict
-    steps:
-      - name: lead-step
-        type: agent
-        agent: lead
-        task: |
-          You are the lead on #validation-wrong-sender-lead-posts-worker-done.
-          1. Post exactly: ASSIGNMENT: worker must post WORKER_DONE in channel.
-          2. Do not post WORKER_DONE yourself.
-          3. If worker never posts WORKER_DONE, output exactly:
-             OWNER_DECISION: INCOMPLETE_FAIL
-             REASON: missing worker-authored channel signal
-             /exit
-        verification:
-          type: output_contains
-          value: 'OWNER_DECISION: INCOMPLETE_FAIL'
-      - name: worker-step
-        type: agent
-        agent: worker
-        task: |
-          You are the worker on #validation-wrong-sender-lead-posts-worker-done.
-          1. Wait until you see ASSIGNMENT: in the channel.
-          2. Do not post WORKER_DONE.
-          3. Output exactly:
-             WORKER_LOCAL_DONE
-        verification:
-          type: output_contains
-          value: WORKER_LOCAL_DONE
diff --git a/vitest.config.ts b/vitest.config.ts
index a9f57e755..67bcd84e0 100644
--- a/vitest.config.ts
+++ b/vitest.config.ts
@@ -27,7 +27,6 @@ const workspacePackages = [
   'telemetry',
   'trajectory',
   'utils',
-  'workflow-types',
 ] as const;
 
 const workspaceAliases = workspacePackages.flatMap((packageName) => {
diff --git a/web/components/SiteFooter.tsx b/web/components/SiteFooter.tsx
index 865b9bf3b..2692b6889 100644
--- a/web/components/SiteFooter.tsx
+++ b/web/components/SiteFooter.tsx
@@ -26,7 +26,7 @@ export function SiteFooter() {
             <Link href="/docs/spawning-an-agent" className={s.link}>
               Basics
             </Link>
-            <Link href="/docs/reference-workflows" className={s.link}>
+            <Link href="/docs/cloud" className={s.link}>
               Advanced
             </Link>
             <Link href="/docs/cli-overview" className={s.link}>
diff --git a/web/components/docs/DocsNav.tsx b/web/components/docs/DocsNav.tsx
index 64532c369..c649d6a50 100644
--- a/web/components/docs/DocsNav.tsx
+++ b/web/components/docs/DocsNav.tsx
@@ -24,7 +24,6 @@ import {
   Smile,
   Terminal,
   Users,
-  Workflow,
   Zap,
 } from 'lucide-react';
 import { BsChatRightText } from 'react-icons/bs';
@@ -53,7 +52,6 @@ const navIcons: Record<string, NavIcon> = {
   authentication: Shield,
   permissions: PiLockKeyDuotone,
   scheduling: Clock3,
-  'reference-workflows': Workflow,
   cloud: Cloud,
   workforce: Users,
   'proactive-agents': Zap,
@@ -63,7 +61,6 @@ const navIcons: Record<string, NavIcon> = {
   'cli-broker-lifecycle': Power,
   'cli-agent-management': Bot,
   'cli-messaging': Send,
-  'cli-workflows': Workflow,
   'cli-cloud-commands': Cloud,
   'cli-on-the-relay': Plug,
   'reference-cli': BookOpen,
diff --git a/web/content/docs/cli-cloud-commands.mdx b/web/content/docs/cli-cloud-commands.mdx
index 13dc0dab2..7818098f9 100644
--- a/web/content/docs/cli-cloud-commands.mdx
+++ b/web/content/docs/cli-cloud-commands.mdx
@@ -62,16 +62,10 @@ The top-level `agent-relay connect <provider>` command is deprecated. Use `agent
 ## See also
 
 <CardGroup cols={2}>
-  <Card title="Run workflows" href="/docs/cli-workflows">
-    Local workflow execution from the CLI.
-  </Card>
   <Card title="Cloud" href="/docs/cloud">
     Conceptual overview of local versus cloud execution.
   </Card>
   <Card title="Authentication" href="/docs/authentication">
     Relayauth and credentials at the product level.
   </Card>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    Author the workflow files you submit to cloud.
-  </Card>
 </CardGroup>
diff --git a/web/content/docs/cli-workflows.mdx b/web/content/docs/cli-workflows.mdx
deleted file mode 100644
index 6bc6ec155..000000000
--- a/web/content/docs/cli-workflows.mdx
+++ /dev/null
@@ -1,64 +0,0 @@
----
-title: 'Run workflows'
-description: 'Execute local workflow files, resume failed runs, and inspect built-in workflow templates.'
----
-
-The CLI can execute workflow files directly, whether they are written in YAML, TypeScript, or Python.
-
-## Run a workflow file
-
-```bash
-agent-relay run relay.yaml
-```
-
-Supported file types:
-
-- `.yaml` and `.yml`
-- `.ts` and `.tsx`
-- `.py`
-
-## Validate before running
-
-```bash
-agent-relay run relay.yaml --dry-run
-```
-
-Dry runs validate the workflow and show the execution plan without starting the real run.
-
-## Resume or restart from a step
-
-```bash
-agent-relay run relay.yaml --resume <run-id>
-agent-relay run relay.yaml --start-from implement --previous-run-id <run-id>
-```
-
-Use these options when a long workflow fails late and you want to retry without repeating earlier successful work.
-
-## List built-in templates
-
-```bash
-agent-relay workflows list
-```
-
-This prints the built-in YAML templates bundled with the CLI.
-
-## When to use cloud instead
-
-Use `agent-relay run` when the workflow should execute locally against your current machine. Use `agent-relay cloud run` when you want the same workflow model in a sandboxed cloud environment.
-
-## See also
-
-<CardGroup cols={2}>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    Author workflow files in TypeScript, Python, or YAML.
-  </Card>
-  <Card title="Cloud commands" href="/docs/cli-cloud-commands">
-    Submit the same workflow model to cloud sandboxes.
-  </Card>
-  <Card title="CLI Overview" href="/docs/cli-overview">
-    Full CLI command map.
-  </Card>
-  <Card title="Cloud" href="/docs/cloud">
-    Conceptual local-vs-cloud framing.
-  </Card>
-</CardGroup>
diff --git a/web/content/docs/cloud.mdx b/web/content/docs/cloud.mdx
index 0221b5eb1..43d0844f4 100644
--- a/web/content/docs/cloud.mdx
+++ b/web/content/docs/cloud.mdx
@@ -19,9 +19,6 @@ The SDK is designed so local and cloud execution share the same mental model. Lo
 ## What to read next
 
 <CardGroup cols={2}>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    The main orchestration surface for multi-step execution.
-  </Card>
   <Card title="Workforce" href="/docs/workforce">
     Organize several agents into a working team.
   </Card>
diff --git a/web/content/docs/communicate-ai-sdk.mdx b/web/content/docs/communicate-ai-sdk.mdx
index e25e1148c..48380740d 100644
--- a/web/content/docs/communicate-ai-sdk.mdx
+++ b/web/content/docs/communicate-ai-sdk.mdx
@@ -68,7 +68,7 @@ import { streamText, wrapLanguageModel } from 'ai';
 import { openai } from '@ai-sdk/openai';
 import { Relay } from '@agent-relay/sdk/communicate';
 import { onRelay } from '@agent-relay/sdk/communicate/adapters/ai-sdk';
-import { runWorkflow } from '@agent-relay/sdk/workflows';
+import { runWorkflow } from '@relayflows/core';
 
 export async function POST(req: Request) {
   const { prompt, repo, escalate } = await req.json();
@@ -149,5 +149,4 @@ It shows:
 
 ## See Also
 
-- [Workflow Reference](/docs/reference-workflows) — `runWorkflow()`, YAML format, and builder APIs
 - [Communicate Mode](/docs/communicate) — adapter overview across frameworks
diff --git a/web/content/docs/file-sharing.mdx b/web/content/docs/file-sharing.mdx
index c826c5447..d19bcbccc 100644
--- a/web/content/docs/file-sharing.mdx
+++ b/web/content/docs/file-sharing.mdx
@@ -159,9 +159,6 @@ For write access, add a separate `writeRelayfile` tool and mint a token scoped t
   <Card title="Primitives" href="/primitives#file">
     See how file sharing fits beside auth, messaging, and scheduling.
   </Card>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    Combine shared artifacts with multi-step orchestration.
-  </Card>
   <Card title="Relayfile GitHub" href="https://github.com/agentworkforce/relayfile">
     Source, package details, and the latest implementation surface.
   </Card>
diff --git a/web/content/docs/plugin-claude-code.mdx b/web/content/docs/plugin-claude-code.mdx
index 841f1b7bc..692bc79c8 100644
--- a/web/content/docs/plugin-claude-code.mdx
+++ b/web/content/docs/plugin-claude-code.mdx
@@ -123,7 +123,4 @@ Under the hood, the plugin exposes these Relaycast MCP tools to your Claude sess
   <Card title="Quickstart" href="/docs/quickstart">
     Learn the SDK fundamentals that the plugin builds on.
   </Card>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    Build more complex orchestration patterns with the workflow API.
-  </Card>
 </CardGroup>
diff --git a/web/content/docs/reference-openclaw.mdx b/web/content/docs/reference-openclaw.mdx
index b1491a98e..8da90cb2a 100644
--- a/web/content/docs/reference-openclaw.mdx
+++ b/web/content/docs/reference-openclaw.mdx
@@ -102,4 +102,3 @@ The full skill reference lives at [`packages/openclaw/skill/SKILL.md`](https://g
 ## See Also
 
 - [Introduction](/docs/introduction) — Overview of the SDK modes
-- [Workflow Reference](/docs/reference-workflows) — Relay workflows and orchestration
diff --git a/web/content/docs/reference-workflows.mdx b/web/content/docs/reference-workflows.mdx
deleted file mode 100644
index 7112cdbf1..000000000
--- a/web/content/docs/reference-workflows.mdx
+++ /dev/null
@@ -1,180 +0,0 @@
----
-title: Workflow Reference
-description: YAML and builder APIs for Relay workflows
----
-
-Workflows orchestrate multi-step, multi-agent execution across Relay workers. You can run them from YAML, TypeScript, Python, or the CLI.
-
-## Entry Points
-
-<CodeGroup>
-```bash CLI
-agent-relay run workflows/feature-dev.yaml
-```
-
-```typescript TypeScript
-import { runWorkflow, workflow } from '@agent-relay/sdk/workflows';
-```
-
-```python Python
-from agent_relay import workflow, run_yaml
-```
-</CodeGroup>
-
-## YAML Runner
-
-Use `runWorkflow()` from TypeScript or `run_yaml()` from Python to execute an existing YAML file.
-
-```typescript
-import { runWorkflow } from '@agent-relay/sdk/workflows';
-
-const result = await runWorkflow('workflows/feature-dev.yaml', {
-  workflow: 'default',
-  vars: { repo: 'app', task: 'Ship the feature' },
-  dryRun: false,
-});
-```
-
-```python
-from agent_relay import run_yaml
-
-result = run_yaml("workflows/feature-dev.yaml")
-```
-
-### `runWorkflow(path, options?)`
-
-| Option | Description |
-|--------|-------------|
-| `workflow` | Named workflow within the YAML file |
-| `vars` | Template vars for `{{var}}` placeholders |
-| `cwd` | Working directory override |
-| `relay` | `AgentRelayOptions` passed to the orchestrator |
-| `onEvent` | Workflow event listener |
-| `trajectories` | Trajectory config override or `false` to disable |
-| `dryRun` | Validate and print the plan without executing |
-| `resume` | Resume a failed run by ID |
-| `startFrom` | Skip to a step and reuse cached outputs |
-| `previousRunId` | Previous run whose cached outputs should be reused |
-
-## Builder API
-
-<CodeGroup>
-```typescript TypeScript
-import { workflow } from '@agent-relay/sdk/workflows';
-
-const result = await workflow('ship-feature')
-  .pattern('dag')
-  .agent('planner', { cli: 'claude', role: 'Plans implementation' })
-  .agent('developer', { cli: 'codex', role: 'Writes code' })
-  .step('plan', {
-    agent: 'planner',
-    task: 'Create the implementation plan',
-  })
-  .step('implement', {
-    agent: 'developer',
-    task: 'Implement the approved plan',
-    dependsOn: ['plan'],
-  })
-  .run();
-```
-
-```python Python
-from agent_relay import workflow
-
-result = (
-    workflow("ship-feature")
-    .pattern("dag")
-    .agent("planner", cli="claude", role="Plans implementation")
-    .agent("developer", cli="codex", role="Writes code")
-    .step("plan", agent="planner", task="Create the implementation plan")
-    .step("implement", agent="developer", task="Implement the approved plan", depends_on=["plan"])
-    .run()
-)
-```
-</CodeGroup>
-
-### Common builder methods
-
-- `.description(text)`
-- `.pattern(name)`
-- `.max_concurrency(n)`
-- `.timeout(ms)`
-- `.channel(name)`
-- `.idle_nudge(...)`
-- `.coordination(...)`
-- `.state(...)`
-- `.trajectories(...)`
-- `.agent(...)`
-- `.step(...)`
-- `.on_error(...)`
-- `.to_config()`
-- `.to_yaml()`
-- `.dry_run()`
-- `.run()`
-
-## YAML Shape
-
-```yaml
-version: "1.0"
-name: ship-feature
-
-swarm:
-  pattern: dag
-  maxConcurrency: 3
-  timeoutMs: 3600000
-  channel: feature-dev
-
-agents:
-  - name: planner
-    cli: claude
-    role: "Plans implementation"
-
-  - name: developer
-    cli: codex
-    role: "Writes code"
-
-workflows:
-  - name: default
-    steps:
-      - name: plan
-        agent: planner
-        task: "Create the implementation plan for {{task}}"
-
-      - name: implement
-        agent: developer
-        dependsOn: [plan]
-        task: "Implement: {{steps.plan.output}}"
-        verification:
-          type: exit_code
-          value: "0"
-```
-
-## Step Types
-
-- **Agent step**: runs a task through a named worker
-- **Deterministic step**: shell command step with `type: deterministic`
-- **Worktree step**: git worktree management step with `type: worktree`
-
-## Completion Signals
-
-The runner can complete a step from several signals:
-
-- deterministic verification
-- owner decisions
-- evidence gathered from messages, output, and artifacts
-- explicit completion markers as a fast-path
-
-## Verification Types
-
-| Type | Description |
-|------|-------------|
-| `exit_code` | Process exited with the expected code |
-| `file_exists` | Required artifact exists |
-| `output_contains` | Output includes a marker string |
-| `custom` | Reserved for external callers |
-
-## See Also
-
-- [TypeScript SDK Reference](/docs/typescript-sdk) — High-level `AgentRelay` API
-- [Python SDK Reference](/docs/python-sdk) — Python facade and builder exports
-- [Communicate Mode](/docs/communicate) — Connect existing framework agents to Relaycast
diff --git a/web/content/docs/scheduling.mdx b/web/content/docs/scheduling.mdx
index 1cc2e2eaf..c7299602d 100644
--- a/web/content/docs/scheduling.mdx
+++ b/web/content/docs/scheduling.mdx
@@ -28,9 +28,6 @@ Scheduling is the time-based layer of the platform. Use it when an agent flow sh
   <Card title="Primitives" href="/primitives#schedule">
     See scheduling beside auth, files, and messaging.
   </Card>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    Trigger multi-step orchestration from scheduled jobs.
-  </Card>
   <Card title="Channels" href="/docs/channels">
     Send scheduled updates into shared rooms.
   </Card>
diff --git a/web/content/docs/swift-sdk.mdx b/web/content/docs/swift-sdk.mdx
index 190020955..e979fed09 100644
--- a/web/content/docs/swift-sdk.mdx
+++ b/web/content/docs/swift-sdk.mdx
@@ -51,7 +51,4 @@ for await event in channel.events {
   <Card title="Python SDK" href="/docs/python-sdk">
     Python reference for the same broker concepts.
   </Card>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    Use messaging and channels inside larger multi-step systems.
-  </Card>
 </CardGroup>
diff --git a/web/content/docs/typescript-examples.mdx b/web/content/docs/typescript-examples.mdx
index e30b914f8..35687c1f6 100644
--- a/web/content/docs/typescript-examples.mdx
+++ b/web/content/docs/typescript-examples.mdx
@@ -37,9 +37,6 @@ The repository ships several TypeScript examples ranging from small demos to mor
   <Card title="TypeScript SDK" href="/docs/typescript-sdk">
     Full API reference after you understand the example shape.
   </Card>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    Move from demos into repeatable multi-step orchestration.
-  </Card>
   <Card title="Communicate Mode" href="/docs/communicate-ai-sdk">
     TypeScript adapter example for AI SDK applications.
   </Card>
diff --git a/web/content/docs/workforce.mdx b/web/content/docs/workforce.mdx
index 945b8b72f..609576259 100644
--- a/web/content/docs/workforce.mdx
+++ b/web/content/docs/workforce.mdx
@@ -28,9 +28,6 @@ A workforce is the practical unit above individual agents: several workers, one
   <Card title="Sending messages" href="/docs/sending-messages">
     Coordinate handoffs and feedback loops.
   </Card>
-  <Card title="Workflows" href="/docs/reference-workflows">
-    Formalize repeated multi-step execution.
-  </Card>
   <Card title="File sharing" href="/docs/file-sharing">
     Give the team shared state and artifacts.
   </Card>
diff --git a/web/lib/docs-nav.ts b/web/lib/docs-nav.ts
index bd4ed913d..5d847b08d 100644
--- a/web/lib/docs-nav.ts
+++ b/web/lib/docs-nav.ts
@@ -36,7 +36,6 @@ export const docsNav: NavGroup[] = [
   {
     title: 'Advanced',
     items: [
-      { title: 'Workflows', slug: 'reference-workflows' },
       { title: 'Cloud', slug: 'cloud' },
       { title: 'Workforce', slug: 'workforce' },
       { title: 'Proactive agents', slug: 'proactive-agents' },
@@ -56,7 +55,6 @@ export const docsNav: NavGroup[] = [
       { title: 'Broker lifecycle', slug: 'cli-broker-lifecycle' },
       { title: 'Agent management', slug: 'cli-agent-management' },
       { title: 'Messaging', slug: 'cli-messaging' },
-      { title: 'Run workflows', slug: 'cli-workflows' },
       { title: 'Cloud commands', slug: 'cli-cloud-commands' },
       { title: 'On the relay', slug: 'cli-on-the-relay' },
       { title: 'CLI reference', slug: 'reference-cli' },
@@ -99,7 +97,6 @@ const ALL_SLUGS = [
   'harness-runtime-config',
   'local-mode',
   'reference-openclaw',
-  'reference-workflows',
 ];
 
 /** Flat list of all doc slugs for static generation */
diff --git a/workflows/ci/fix-mcp-spawn.yaml b/workflows/ci/fix-mcp-spawn.yaml
deleted file mode 100644
index 19b34f497..000000000
--- a/workflows/ci/fix-mcp-spawn.yaml
+++ /dev/null
@@ -1,317 +0,0 @@
-version: '1.0'
-name: fix-mcp-spawn
-description: >
-  Fix relaycast MCP access for agents spawned via agent-relay up.
-  PR #581 injected RELAY_API_KEY into --mcp-config JSON, but RELAY_WORKSPACES_JSON
-  and RELAY_DEFAULT_WORKSPACE are not forwarded because relaycast_server_config reads
-  them via std::env::var, but the broker process does not have them in its own env
-  (only in worker_env passed to child processes). This workflow diagnoses, fixes,
-  and verifies the issue comprehensively.
-
-swarm:
-  pattern: dag
-  channel: wf-fix-mcp-spawn
-  maxConcurrency: 3
-  timeoutMs: 3600000
-
-agents:
-  - name: lead
-    cli: claude
-    role: >
-      Senior Rust engineer who investigates the root cause and coordinates the fix.
-
-  - name: fixer
-    cli: claude
-    role: Implements the Rust code changes to fix MCP workspace forwarding.
-    preset: worker
-
-  - name: reviewer
-    cli: claude
-    role: Reviews the implemented fix for correctness and completeness.
-    preset: reviewer
-
-workflows:
-  - name: default
-    steps:
-      # ── Read relevant source code ─────────────────────────────────────────
-      - name: read-snippets
-        type: deterministic
-        command: >
-          echo "=== relaycast_server_config ===" &&
-          sed -n '327,415p' src/snippets.rs &&
-          echo "" &&
-          echo "=== configure_relaycast_mcp_with_token ===" &&
-          sed -n '679,745p' src/snippets.rs &&
-          echo "" &&
-          echo "=== merge_relaycast_with_project_mcp ===" &&
-          sed -n '253,326p' src/snippets.rs
-        captureOutput: true
-        failOnError: true
-
-      - name: read-callers
-        type: deterministic
-        command: >
-          echo "=== WorkerRegistry::spawn PTY path ===" &&
-          sed -n '749,860p' src/main.rs &&
-          echo "" &&
-          echo "=== worker_env setup (up mode) ===" &&
-          sed -n '1512,1530p' src/main.rs &&
-          echo "" &&
-          echo "=== Spawner::spawn_wrap_with_token ===" &&
-          sed -n '36,90p' src/spawner.rs &&
-          echo "" &&
-          echo "=== spawn_env_vars ===" &&
-          sed -n '208,250p' src/spawner.rs
-        captureOutput: true
-        failOnError: true
-
-      # ── Lead diagnoses and plans the fix ─────────────────────────────────
-      - name: diagnose
-        agent: lead
-        dependsOn: [read-snippets, read-callers]
-        task: |
-          You are diagnosing why spawned claude agents via `agent-relay up` still
-          don't have full relaycast MCP access after PR #581 injected RELAY_API_KEY.
-
-          ## Relevant source code
-
-          ### snippets.rs (key functions):
-          {{steps.read-snippets.output}}
-
-          ### Callers (main.rs WorkerRegistry::spawn, spawner.rs):
-          {{steps.read-callers.output}}
-
-          ## Key question to answer
-
-          In `relaycast_server_config` (snippets.rs), RELAY_WORKSPACES_JSON and
-          RELAY_DEFAULT_WORKSPACE are read via `std::env::var`. But when called from
-          `WorkerRegistry::spawn` (the "up" mode broker), the broker's OWN process env
-          does NOT contain these values - they are only in `worker_env` which is passed
-          to child processes via `cmd.env()`.
-
-          So spawned agents' --mcp-config JSON is missing RELAY_WORKSPACES_JSON and
-          RELAY_DEFAULT_WORKSPACE, even though these are available in the child process
-          via env inheritance.
-
-          ## Produce a fix plan
-
-          Analyze the code and produce a precise, complete fix plan. Include:
-
-          1. Exact function signature changes needed for:
-             - `relaycast_server_config`
-             - `merge_relaycast_with_project_mcp` / `merge_relaycast_with_project_mcp_inner`
-             - `configure_relaycast_mcp_with_token`
-             - Public `configure_relaycast_mcp` wrapper
-
-          2. Where to extract workspace values from in each caller:
-             - `WorkerRegistry::spawn` → from `self.worker_env`
-             - `Spawner::spawn_wrap_with_token` → from `env_vars`
-             - Any other callers of `configure_relaycast_mcp_with_token`
-
-          3. What tests to add in snippets.rs
-
-          Format:
-          ## Diagnosis
-          [findings]
-
-          ## Fix Plan
-          [numbered list with exact code snippets]
-
-          ## Tests to Add
-          [test names and assertions]
-        verification:
-          type: output_contains
-          value: '## Fix Plan'
-
-      # ── Implement the fix ─────────────────────────────────────────────────
-      - name: implement
-        agent: fixer
-        dependsOn: [diagnose]
-        task: |
-          Implement the fix for relaycast MCP workspace forwarding in the Rust broker.
-
-          ## Fix plan from lead:
-          {{steps.diagnose.output}}
-
-          ## Implementation guide
-
-          The goal: thread RELAY_WORKSPACES_JSON and RELAY_DEFAULT_WORKSPACE explicitly
-          through the MCP config building chain instead of reading from std::env::var.
-
-          ### In src/snippets.rs:
-
-          **Step 1**: Add params to `relaycast_server_config`:
-          ```rust
-          fn relaycast_server_config(
-              relay_api_key: Option<&str>,
-              relay_base_url: Option<&str>,
-              relay_agent_name: Option<&str>,
-              relay_agent_token: Option<&str>,
-              workspaces_json: Option<&str>,   // NEW: replaces std::env::var("RELAY_WORKSPACES_JSON")
-              default_workspace: Option<&str>, // NEW: replaces std::env::var("RELAY_DEFAULT_WORKSPACE")
-          ) -> Value
-          ```
-          Replace the two `std::env::var` reads at the bottom of the function with
-          direct use of the new params.
-
-          **Step 2**: Update `merge_relaycast_with_project_mcp_inner` to accept and pass them:
-          ```rust
-          fn merge_relaycast_with_project_mcp_inner(
-              relay_api_key: Option<&str>,
-              relay_base_url: Option<&str>,
-              relay_agent_name: Option<&str>,
-              relay_agent_token: Option<&str>,
-              cwd: &Path,
-              home: Option<PathBuf>,
-              workspaces_json: Option<&str>,   // NEW
-              default_workspace: Option<&str>, // NEW
-          ) -> String
-          ```
-          Forward to `relaycast_server_config`.
-
-          **Step 3**: Update `merge_relaycast_with_project_mcp` to accept and pass them.
-
-          **Step 4**: Update `configure_relaycast_mcp_with_token` public API:
-          ```rust
-          pub async fn configure_relaycast_mcp_with_token(
-              cli: &str,
-              agent_name: &str,
-              api_key: Option<&str>,
-              base_url: Option<&str>,
-              existing_args: &[String],
-              cwd: &Path,
-              agent_token: Option<&str>,
-              workspaces_json: Option<&str>,   // NEW
-              default_workspace: Option<&str>, // NEW
-          ) -> Result<Vec<String>>
-          ```
-          Pass them through to `merge_relaycast_with_project_mcp`.
-
-          **Step 5**: Update the public `configure_relaycast_mcp` wrapper to pass `None, None`:
-          ```rust
-          pub async fn configure_relaycast_mcp(
-              cli: &str, agent_name: &str, api_key: Option<&str>, base_url: Option<&str>,
-              existing_args: &[String], cwd: &Path,
-          ) -> Result<Vec<String>> {
-              configure_relaycast_mcp_with_token(cli, agent_name, api_key, base_url,
-                  existing_args, cwd, None, None, None)
-          }
-          ```
-
-          **Step 6**: Add new tests:
-          - `claude_includes_workspaces_json_when_provided` - verify RELAY_WORKSPACES_JSON
-            appears in --mcp-config JSON env block when workspaces_json param is Some
-          - `claude_includes_default_workspace_when_provided` - verify RELAY_DEFAULT_WORKSPACE
-            appears in --mcp-config JSON env block when default_workspace param is Some
-          - `claude_omits_workspaces_json_when_not_provided` - verify RELAY_WORKSPACES_JSON
-            is absent when param is None AND std::env::var is not set
-
-          ### In src/main.rs (WorkerRegistry::spawn, PTY path ~line 797-814):
-
-          Extract workspace vars from worker_env before calling configure_relaycast_mcp_with_token:
-          ```rust
-          let workspaces_json = self.env_value("RELAY_WORKSPACES_JSON");
-          let default_workspace = self.env_value("RELAY_DEFAULT_WORKSPACE");
-          configure_relaycast_mcp_with_token(
-              cli, &spec.name,
-              self.env_value("RELAY_API_KEY"),
-              self.env_value("RELAY_BASE_URL"),
-              &effective_args, Path::new(cwd),
-              worker_relay_api_key.as_deref(),
-              workspaces_json,     // NEW
-              default_workspace,   // NEW
-          ).await?
-          ```
-          Do the same for the Headless path (~line 863-872).
-
-          ### In src/spawner.rs (spawn_wrap_with_token ~line 63-81):
-
-          Extract workspace vars from env_vars:
-          ```rust
-          let workspaces_json = env_vars
-              .iter()
-              .find(|(k, _)| k == "RELAY_WORKSPACES_JSON")
-              .map(|(_, v)| v.as_str());
-          let default_workspace = env_vars
-              .iter()
-              .find(|(k, _)| k == "RELAY_DEFAULT_WORKSPACE")
-              .map(|(_, v)| v.as_str());
-          let mcp_args = configure_relaycast_mcp_with_token(
-              cli, child_name, api_key, base_url,
-              &combined_args, &cwd, agent_token,
-              workspaces_json,     // NEW
-              default_workspace,   // NEW
-          ).await?;
-          ```
-
-          ### Also check wrap.rs for any direct calls to configure_relaycast_mcp_with_token
-          and update those too if they exist.
-
-          After implementing, verify with:
-          ```
-          cargo build 2>&1 | head -30
-          cargo test --lib -- snippets 2>&1 | tail -20
-          ```
-
-          IMPORTANT: Make all the code changes, then run build and tests to verify.
-        verification:
-          type: exit_code
-
-      # ── Build check ────────────────────────────────────────────────────────
-      - name: build-check
-        type: deterministic
-        dependsOn: [implement]
-        command: cargo build 2>&1 | tail -10
-        captureOutput: true
-        failOnError: true
-
-      # ── Run tests ──────────────────────────────────────────────────────────
-      - name: run-tests
-        type: deterministic
-        dependsOn: [build-check]
-        command: cargo test --lib -- snippets 2>&1 | tail -30
-        captureOutput: true
-        failOnError: true
-
-      # ── Review ────────────────────────────────────────────────────────────
-      - name: review
-        agent: reviewer
-        dependsOn: [run-tests]
-        task: |
-          Review the implemented fix for relaycast MCP workspace forwarding.
-
-          ## Build result:
-          {{steps.build-check.output}}
-
-          ## Test results:
-          {{steps.run-tests.output}}
-
-          ## What was changed
-
-          The fix threads RELAY_WORKSPACES_JSON and RELAY_DEFAULT_WORKSPACE explicitly
-          through configure_relaycast_mcp_with_token → merge_relaycast_with_project_mcp
-          → relaycast_server_config, replacing the std::env::var reads.
-
-          Callers:
-          - WorkerRegistry::spawn: extracts from worker_env
-          - Spawner::spawn_wrap_with_token: extracts from env_vars
-
-          ## Read the changed files and verify:
-
-          1. src/snippets.rs - does relaycast_server_config use params instead of std::env::var?
-          2. src/main.rs - does WorkerRegistry::spawn forward workspace vars?
-          3. src/spawner.rs - does spawn_wrap_with_token forward workspace vars?
-          4. New tests exist and pass?
-
-          Output:
-
-          ## Review Result: APPROVED
-          [findings]
-
-          OR
-
-          ## Review Result: NEEDS_CHANGES
-          [specific issues]
-        verification:
-          type: output_contains
-          value: '## Review Result:'
diff --git a/workflows/relay-clean-room-e2e-validation.ts b/workflows/relay-clean-room-e2e-validation.ts
deleted file mode 100644
index b84a6d098..000000000
--- a/workflows/relay-clean-room-e2e-validation.ts
+++ /dev/null
@@ -1,781 +0,0 @@
-/**
- * relay-clean-room-e2e-validation.ts
- *
- * Clean-room end-to-end validation workflow for agent-relay install/bootstrap/messaging fixes.
- *
- * Primary proving environment: fresh isolated macOS local shell (isolated HOME + PATH).
- * This is the correct proving ground because the original failure class is a
- * first-run local bootstrap on macOS problem — stale shims, xattr/codesign handling,
- * ~/.local/bin launcher behavior — that Docker and cloud sandboxes cannot reproduce.
- *
- * Pattern: pipeline (sequential phases with deterministic before/after artifact capture).
- *
- * Acceptance contract (A1–A13):
- *   A1  install.sh completes successfully from scratch
- *   A2  command -v agent-relay resolves to isolated bin dir
- *   A3  agent-relay --version succeeds
- *   A4  stale shim/shadowing case detected or repaired by install (before/after proof)
- *   A5  agent-relay up --no-dashboard --verbose reaches running state within 30s
- *   A6  agent-relay status reports running
- *   A7  agent-relay spawn WorkflowProbe succeeds in a real repo
- *   A8  agent-relay who shows WorkflowProbe
- *   A9  agent-relay send WorkflowProbe "ping" (no --from) succeeds
- *   A10 agent-relay send WorkflowProbe "ping" --from Orchestrator succeeds
- *   A11 agent-relay agents:logs WorkflowProbe shows delivery evidence
- *   A12 agent-relay history with RELAY_API_KEY unset does NOT instruct user to set RELAY_API_KEY
- *   A13 all artifact files present with timestamps and exit codes
- *
- * Usage:
- *   agent-relay run workflows/relay-clean-room-e2e-validation.ts
- */
-
-import { workflow } from '@agent-relay/sdk/workflows';
-import { ClaudeModels } from '@agent-relay/config';
-
-const REPO_ROOT = process.cwd();
-const ARTIFACTS_DIR = `${REPO_ROOT}/.e2e-artifacts`;
-
-async function main() {
-  const wf = workflow('relay-clean-room-e2e-validation')
-    .description(
-      'Clean-room end-to-end validation of agent-relay install/bootstrap/messaging in an isolated macOS shell. ' +
-        'Reproduces the original failure class (stale shim, PATH shadowing, local-mode history regression), ' +
-        'validates the fix, captures deterministic artifacts, and issues a reviewer verdict.',
-    )
-    .pattern('pipeline')
-    .channel('wf-relay-e2e-cleanroom')
-    .maxConcurrency(1)
-    .timeout(3_600_000);
-
-  // ── Agents ─────────────────────────────────────────────────────────────────
-
-  wf.agent('reviewer', {
-    cli: 'claude',
-    preset: 'reviewer',
-    model: ClaudeModels.SONNET,
-    role: 'Reviewer who compares baseline-failure artifacts against fixed-run artifacts and issues the final PASS/FAIL verdict',
-    retries: 2,
-  });
-
-  // ── Phase 0: Emit acceptance contract ─────────────────────────────────────
-  //
-  // Static deterministic step so the reviewer step can reference it via
-  // {{steps.acceptance-contract.output}} without needing an external file.
-
-  wf.step('acceptance-contract', {
-    type: 'deterministic',
-    captureOutput: true,
-    failOnError: false,
-    command: `cat <<'EOF'
-ACCEPTANCE_CONTRACT
-
-The validation workflow PASSES if and only if all of the following are
-demonstrated in an isolated macOS shell with no prior relay state:
-
-| # | Signal | Evidence File |
-|---|--------|---------------|
-| A1  | install.sh completes successfully from scratch | fixed-install.txt |
-| A2  | command -v agent-relay resolves to the isolated bin dir | fixed-install.txt |
-| A3  | agent-relay --version succeeds after install | fixed-install.txt |
-| A4  | A deliberately introduced stale shim is detected or repaired by install | baseline-failure.txt + fixed-install.txt |
-| A5  | agent-relay up --no-dashboard --verbose reaches running state within 30s | broker-start.log |
-| A6  | agent-relay status reports running | status.txt |
-| A7  | agent-relay spawn WorkflowProbe succeeds in a real repo | spawn.txt |
-| A8  | agent-relay who shows the spawned worker | who.txt |
-| A9  | agent-relay send WorkflowProbe "ping" succeeds without explicit --from | send-default.txt |
-| A10 | agent-relay send WorkflowProbe "ping" --from Orchestrator succeeds | send-explicit.txt |
-| A11 | agent-relay agents:logs WorkflowProbe shows delivery/response evidence | worker-logs.txt |
-| A12 | agent-relay history with RELAY_API_KEY unset does NOT say "set RELAY_API_KEY" | history-no-api-key.txt |
-| A13 | All required artifact files present with timestamps and exit codes | all files in .e2e-artifacts/ |
-
-Failure contract: FAIL if ANY signal is FAIL. PARTIAL signals require manual reviewer judgment.
-
-CHOSEN_PROVING_ENVIRONMENT: Fresh isolated macOS local shell.
-  - Isolated HOME, XDG_*, AGENT_RELAY_* vars, PATH: CLEAN_HOME/.local/bin first.
-  - RELAY_API_KEY unset throughout.
-  - Reproduces: stale shim in ~/.local/bin, xattr/codesign handling, launcher PATH shadowing.
-  - Docker/cloud are Linux-only and do not reproduce these macOS-specific failure modes.
-
-CHOSEN_PATTERN: pipeline (maxConcurrency(1))
-  - Sequential before/after proof required; causal chain: baseline → provision → reproduce failure → build/install → validate → collect → review.
-  - DAG concurrency would obscure the proof chain.
-
-ORIGINAL_FAILURE_CLASS: first-run local bootstrap on macOS
-  - install.sh installs into ~/.local/bin with macOS-specific xattr/codesign cleanup.
-  - Local broker mode must work without RELAY_API_KEY.
-  - history hard-requires RELAY_API_KEY in the broken state, conflicting with local-mode contract.
-  - Stale shims in PATH shadow the newly installed binary.
-EOF
-`,
-  });
-
-  // ── Phase 1: Environment Provisioning ─────────────────────────────────────
-  //
-  // Create an isolated HOME + PATH so clean-room properties do not depend on
-  // the user's live shell environment. Persist the isolation env for all
-  // downstream phases. Capture an env-manifest for the record.
-
-  wf.step('phase-provision', {
-    type: 'deterministic',
-    dependsOn: ['acceptance-contract'],
-    captureOutput: true,
-    failOnError: true,
-    command: `
-set -euo pipefail
-
-ARTIFACTS="${ARTIFACTS_DIR}"
-mkdir -p "$ARTIFACTS"
-
-# Create isolated environment
-CLEAN_HOME="$(mktemp -d /tmp/relay-e2e-XXXXXX)"
-export HOME="$CLEAN_HOME"
-export XDG_DATA_HOME="$CLEAN_HOME/.local/share"
-export XDG_CONFIG_HOME="$CLEAN_HOME/.config"
-export AGENT_RELAY_INSTALL_DIR="$CLEAN_HOME/.local/share/agent-relay"
-export AGENT_RELAY_BIN_DIR="$CLEAN_HOME/.local/bin"
-export PATH="$CLEAN_HOME/.local/bin:/opt/homebrew/bin:/usr/local/bin:/usr/bin:/bin"
-unset RELAY_API_KEY 2>/dev/null || true
-mkdir -p "$CLEAN_HOME/.local/bin" "$CLEAN_HOME/.local/share"
-
-# Persist isolation env for downstream phases
-cat > "$ARTIFACTS/isolation.env" <<ENVEOF
-CLEAN_HOME=$CLEAN_HOME
-HOME=$CLEAN_HOME
-XDG_DATA_HOME=$CLEAN_HOME/.local/share
-XDG_CONFIG_HOME=$CLEAN_HOME/.config
-AGENT_RELAY_INSTALL_DIR=$CLEAN_HOME/.local/share/agent-relay
-AGENT_RELAY_BIN_DIR=$CLEAN_HOME/.local/bin
-PATH=$CLEAN_HOME/.local/bin:/opt/homebrew/bin:/usr/local/bin:/usr/bin:/bin
-ENVEOF
-
-# Capture env manifest
-{
-  echo "=== env-manifest ==="
-  echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-  echo "OS: $(uname -a)"
-  echo "shell: \${SHELL:-unknown}"
-  echo "node: $(node --version 2>/dev/null || echo 'not found')"
-  echo "npm: $(npm --version 2>/dev/null || echo 'not found')"
-  echo "CLEAN_HOME: $CLEAN_HOME"
-  echo "AGENT_RELAY_BIN_DIR: $CLEAN_HOME/.local/bin"
-  echo "PATH: $PATH"
-  echo "RELAY_API_KEY: unset"
-  echo "cwd: $(pwd)"
-  echo "repo_root: ${REPO_ROOT}"
-} | tee "$ARTIFACTS/env-manifest.txt"
-
-echo "PROVISION_COMPLETE: CLEAN_HOME=$CLEAN_HOME"
-`,
-  });
-
-  // ── Phase 2: Baseline Failure Reproduction ─────────────────────────────────
-  //
-  // Deliberately introduce a stale shim at $CLEAN_HOME/.local/bin/agent-relay
-  // that exits 1, simulating a broken/shadowed binary. This proves the clean
-  // room actually exercises the failure path before the fix is applied.
-  // (A4 baseline half)
-
-  wf.step('phase-baseline', {
-    type: 'deterministic',
-    dependsOn: ['phase-provision'],
-    captureOutput: true,
-    failOnError: false, // Expected to capture failures — do not abort pipeline
-    command: `
-set -uo pipefail
-
-ARTIFACTS="${ARTIFACTS_DIR}"
-# shellcheck source=/dev/null
-source "$ARTIFACTS/isolation.env"
-
-{
-  echo "=== baseline-failure ==="
-  echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-  echo "purpose: demonstrate stale-shim/PATH-shadowing failure class before fix is applied"
-  echo ""
-
-  # Create stale shim that simulates a broken/shadowed binary
-  echo "--- introducing stale shim at \$CLEAN_HOME/.local/bin/agent-relay ---"
-  cat > "$CLEAN_HOME/.local/bin/agent-relay" <<'SHIM'
-#!/bin/sh
-echo "stale agent-relay shim: this binary is broken and should be replaced by install.sh" >&2
-exit 1
-SHIM
-  chmod +x "$CLEAN_HOME/.local/bin/agent-relay"
-  echo "stale shim written to: $CLEAN_HOME/.local/bin/agent-relay"
-
-  # Capture pre-fix PATH state
-  echo "--- PATH before fix ---"
-  echo "PATH=$PATH"
-  echo "which -a agent-relay output:"
-  which -a agent-relay 2>&1 || echo "(which -a returned nothing)"
-  echo "type -a agent-relay output:"
-  type -a agent-relay 2>&1 || echo "(type -a not available)"
-
-  # Attempt to use the broken shim — expect failure
-  echo "--- agent-relay --version (expect failure from stale shim) ---"
-  CMD_EXIT=0
-  CMD_OUTPUT=$(agent-relay --version 2>&1) || CMD_EXIT=$?
-  echo "command: agent-relay --version"
-  echo "stdout/stderr: $CMD_OUTPUT"
-  echo "exit_code: $CMD_EXIT"
-
-  if [ "$CMD_EXIT" -ne 0 ]; then
-    echo "BASELINE_FAILURE_CONFIRMED: stale shim caused exit $CMD_EXIT as expected"
-    echo "A4_BASELINE: stale shim present and blocking correct binary — original failure class reproduced"
-  else
-    echo "WARNING: stale shim did not fail — check shim placement vs PATH order"
-  fi
-} | tee "$ARTIFACTS/baseline-failure.txt"
-
-echo "BASELINE_PHASE_COMPLETE"
-`,
-  });
-
-  // ── Phase 3: Build from Source and Install ────────────────────────────────
-  //
-  // Remove stale state from Phase 2. Do a full build from source (npm run build),
-  // then run install.sh into the isolated environment. Capture the full install
-  // transcript including which -a, type -a, and version output. Validates A1–A4.
-
-  wf.step('phase-install', {
-    type: 'deterministic',
-    dependsOn: ['phase-baseline'],
-    captureOutput: true,
-    failOnError: true,
-    command: `
-set -euo pipefail
-
-ARTIFACTS="${ARTIFACTS_DIR}"
-# shellcheck source=/dev/null
-source "$ARTIFACTS/isolation.env"
-
-{
-  echo "=== fixed-install ==="
-  echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-  echo "repo_root: ${REPO_ROOT}"
-
-  # Remove stale shim from Phase 2
-  echo "--- removing stale shim from Phase 2 ---"
-  rm -f "$CLEAN_HOME/.local/bin/agent-relay"
-  echo "stale shim removed"
-  ls -la "$CLEAN_HOME/.local/bin/" 2>&1 || echo "(bin dir now empty)"
-
-  # Build from source — ensures we are validating the current candidate, not a cached artifact
-  echo "--- building from source: npm run build ---"
-  cd "${REPO_ROOT}"
-  BUILD_EXIT=0
-  npm run build 2>&1 || BUILD_EXIT=$?
-  echo "build exit_code: $BUILD_EXIT"
-  if [ "$BUILD_EXIT" -ne 0 ]; then
-    echo "BUILD_FAILED: npm run build exited $BUILD_EXIT"
-    exit "$BUILD_EXIT"
-  fi
-  echo "build succeeded"
-
-  # Run install.sh into the isolated environment
-  echo "--- running install.sh ---"
-  INSTALL_EXIT=0
-  bash "${REPO_ROOT}/install.sh" 2>&1 || INSTALL_EXIT=$?
-  echo "install exit_code: $INSTALL_EXIT"
-  if [ "$INSTALL_EXIT" -ne 0 ]; then
-    echo "INSTALL_FAILED: install.sh exited $INSTALL_EXIT"
-    exit "$INSTALL_EXIT"
-  fi
-  echo "install.sh completed successfully — A1_PASS"
-
-  # Post-install PATH and binary resolution
-  echo "--- post-install PATH and binary resolution ---"
-  echo "PATH: $PATH"
-  echo "which -a agent-relay:"
-  which -a agent-relay 2>&1 || echo "(not found via which)"
-  echo "type -a agent-relay:"
-  type -a agent-relay 2>&1 || echo "(type -a not available)"
-
-  # A2: command -v resolves to isolated bin dir
-  RESOLVED=$(command -v agent-relay 2>&1 || echo "NOT_FOUND")
-  echo "command -v agent-relay: $RESOLVED"
-  if echo "$RESOLVED" | grep -q "$CLEAN_HOME/.local/bin"; then
-    echo "A2_PASS: resolves to isolated bin dir ($RESOLVED)"
-  else
-    echo "A2_FAIL: does not resolve to isolated bin dir (got: $RESOLVED)"
-    exit 1
-  fi
-
-  # A3: --version succeeds
-  VERSION_EXIT=0
-  VERSION_OUTPUT=$(agent-relay --version 2>&1) || VERSION_EXIT=$?
-  echo "agent-relay --version: $VERSION_OUTPUT"
-  echo "version exit_code: $VERSION_EXIT"
-  if [ "$VERSION_EXIT" -eq 0 ]; then
-    echo "A3_PASS: --version succeeded"
-  else
-    echo "A3_FAIL: --version exited $VERSION_EXIT"
-    exit "$VERSION_EXIT"
-  fi
-
-  # A4 (fixed half): confirm stale shim was overwritten
-  echo "--- stale shim resolution check (A4 fixed half) ---"
-  CURRENT_CONTENT=$(head -3 "$RESOLVED" 2>/dev/null || echo "(cannot read)")
-  if echo "$CURRENT_CONTENT" | grep -q "stale agent-relay shim"; then
-    echo "A4_FAIL: binary at $RESOLVED is still the stale shim — install.sh did NOT replace it"
-    exit 1
-  else
-    echo "A4_PASS: binary at $RESOLVED is not the stale shim — install.sh correctly replaced it"
-    echo "  Before: stale shim (see baseline-failure.txt)"
-    echo "  After:  real agent-relay binary ($VERSION_OUTPUT)"
-  fi
-
-} | tee "$ARTIFACTS/fixed-install.txt"
-
-echo "INSTALL_PHASE_COMPLETE"
-`,
-  });
-
-  // ── Phase 4: Broker Startup and Readiness ─────────────────────────────────
-  //
-  // Start the local broker with --no-dashboard --verbose. Poll agent-relay
-  // status with exponential backoff (max 30 s). Gate: do not proceed unless
-  // status is running. Validates A5–A6.
-
-  wf.step('phase-broker', {
-    type: 'deterministic',
-    dependsOn: ['phase-install'],
-    captureOutput: true,
-    failOnError: true,
-    command: `
-set -euo pipefail
-
-ARTIFACTS="${ARTIFACTS_DIR}"
-# shellcheck source=/dev/null
-source "$ARTIFACTS/isolation.env"
-BROKER_LOG="$ARTIFACTS/broker-start.log"
-
-{
-  echo "=== broker-start ==="
-  echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-
-  # Start broker in background, capture log
-  echo "--- starting: agent-relay up --no-dashboard --verbose ---"
-  agent-relay up --no-dashboard --verbose >>"$BROKER_LOG" 2>&1 &
-  BROKER_PID=$!
-  echo "broker PID: $BROKER_PID"
-  echo "$BROKER_PID" > "$ARTIFACTS/broker.pid"
-
-  # Poll status with exponential backoff (max ~30 s across 6 attempts: 2+4+6+8+10+12=42s cap)
-  echo "--- polling agent-relay status (max ~30s) ---"
-  STATUS_REACHED=false
-  for ATTEMPT in 1 2 3 4 5 6; do
-    SLEEP_SECS=$((ATTEMPT * 2))
-    echo "  attempt $ATTEMPT: sleeping \${SLEEP_SECS}s..."
-    sleep "$SLEEP_SECS"
-    STATUS_EXIT=0
-    STATUS_OUTPUT=$(agent-relay status 2>&1) || STATUS_EXIT=$?
-    echo "  status output: $STATUS_OUTPUT (exit $STATUS_EXIT)"
-    if echo "$STATUS_OUTPUT" | grep -qi "running"; then
-      echo "A5_PASS: broker reached running state (attempt $ATTEMPT, cumulative wait ~$((ATTEMPT * (ATTEMPT + 1)))s)"
-      STATUS_REACHED=true
-      break
-    fi
-  done
-
-  if [ "$STATUS_REACHED" = "false" ]; then
-    echo "A5_FAIL: broker did not reach running state within ~30s"
-    echo "--- broker log tail ---"
-    tail -30 "$BROKER_LOG" 2>&1 || true
-    exit 1
-  fi
-
-  # Capture final status output
-  FINAL_STATUS=$(agent-relay status 2>&1 || echo "STATUS_ERROR")
-  echo "$FINAL_STATUS" | tee "$ARTIFACTS/status.txt"
-
-  if echo "$FINAL_STATUS" | grep -qi "running"; then
-    echo "A6_PASS: agent-relay status reports running"
-  else
-    echo "A6_FAIL: agent-relay status does not report running: $FINAL_STATUS"
-    exit 1
-  fi
-
-} 2>&1 | tee -a "$BROKER_LOG"
-
-echo "BROKER_PHASE_COMPLETE"
-`,
-  });
-
-  // ── Phase 5: Worker Spawn and Messaging ────────────────────────────────────
-  //
-  // Spawn WorkflowProbe, verify it appears in `who`, send messages with and
-  // without --from, and capture agent logs as delivery evidence.
-  // Validates A7–A11.
-
-  wf.step('phase-messaging', {
-    type: 'deterministic',
-    dependsOn: ['phase-broker'],
-    captureOutput: true,
-    failOnError: true,
-    command: `
-set -euo pipefail
-
-ARTIFACTS="${ARTIFACTS_DIR}"
-# shellcheck source=/dev/null
-source "$ARTIFACTS/isolation.env"
-
-{
-  echo "=== worker-spawn-and-messaging ==="
-  echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-
-  # A7: Spawn WorkflowProbe
-  echo "--- command: agent-relay spawn WorkflowProbe claude 'e2e probe ping' ---"
-  SPAWN_EXIT=0
-  SPAWN_OUTPUT=$(agent-relay spawn WorkflowProbe claude "e2e probe ping" 2>&1) || SPAWN_EXIT=$?
-  echo "$SPAWN_OUTPUT"
-  echo "exit_code: $SPAWN_EXIT"
-  {
-    echo "command: agent-relay spawn WorkflowProbe claude 'e2e probe ping'"
-    echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-    echo "$SPAWN_OUTPUT"
-    echo "exit_code: $SPAWN_EXIT"
-  } > "$ARTIFACTS/spawn.txt"
-  if [ "$SPAWN_EXIT" -eq 0 ]; then
-    echo "A7_PASS: WorkflowProbe spawned successfully"
-  else
-    echo "A7_FAIL: spawn exited $SPAWN_EXIT"
-    exit "$SPAWN_EXIT"
-  fi
-
-  # Brief wait for worker to register
-  sleep 3
-
-  # A8: Verify WorkflowProbe appears in who output
-  echo "--- command: agent-relay who ---"
-  WHO_EXIT=0
-  WHO_OUTPUT=$(agent-relay who 2>&1) || WHO_EXIT=$?
-  echo "$WHO_OUTPUT"
-  echo "exit_code: $WHO_EXIT"
-  {
-    echo "command: agent-relay who"
-    echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-    echo "$WHO_OUTPUT"
-    echo "exit_code: $WHO_EXIT"
-  } > "$ARTIFACTS/who.txt"
-  if echo "$WHO_OUTPUT" | grep -q "WorkflowProbe"; then
-    echo "A8_PASS: WorkflowProbe listed in agent-relay who"
-  else
-    echo "A8_FAIL: WorkflowProbe not found in who output"
-    exit 1
-  fi
-
-  # A9: Send without --from (validates local-mode default sender resolution)
-  echo "--- command: agent-relay send WorkflowProbe 'ping' (no --from) ---"
-  SEND_DEFAULT_EXIT=0
-  SEND_DEFAULT_OUTPUT=$(agent-relay send WorkflowProbe "ping" 2>&1) || SEND_DEFAULT_EXIT=$?
-  echo "$SEND_DEFAULT_OUTPUT"
-  echo "exit_code: $SEND_DEFAULT_EXIT"
-  {
-    echo "command: agent-relay send WorkflowProbe 'ping'"
-    echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-    echo "$SEND_DEFAULT_OUTPUT"
-    echo "exit_code: $SEND_DEFAULT_EXIT"
-  } > "$ARTIFACTS/send-default.txt"
-  if [ "$SEND_DEFAULT_EXIT" -eq 0 ]; then
-    echo "A9_PASS: send without --from succeeded (no workaround required)"
-  else
-    echo "A9_FAIL: send without --from exited $SEND_DEFAULT_EXIT"
-    exit "$SEND_DEFAULT_EXIT"
-  fi
-
-  # A10: Send with explicit --from
-  echo "--- command: agent-relay send WorkflowProbe 'explicit ping' --from Orchestrator ---"
-  SEND_EXPLICIT_EXIT=0
-  SEND_EXPLICIT_OUTPUT=$(agent-relay send WorkflowProbe "explicit ping" --from Orchestrator 2>&1) || SEND_EXPLICIT_EXIT=$?
-  echo "$SEND_EXPLICIT_OUTPUT"
-  echo "exit_code: $SEND_EXPLICIT_EXIT"
-  {
-    echo "command: agent-relay send WorkflowProbe 'explicit ping' --from Orchestrator"
-    echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-    echo "$SEND_EXPLICIT_OUTPUT"
-    echo "exit_code: $SEND_EXPLICIT_EXIT"
-  } > "$ARTIFACTS/send-explicit.txt"
-  if [ "$SEND_EXPLICIT_EXIT" -eq 0 ]; then
-    echo "A10_PASS: send with --from Orchestrator succeeded"
-  else
-    echo "A10_FAIL: send with --from exited $SEND_EXPLICIT_EXIT"
-    exit "$SEND_EXPLICIT_EXIT"
-  fi
-
-  # Wait briefly for message delivery before reading logs
-  sleep 2
-
-  # A11: Capture agent logs (delivery evidence)
-  echo "--- command: agent-relay agents:logs WorkflowProbe ---"
-  LOGS_EXIT=0
-  LOGS_OUTPUT=$(agent-relay agents:logs WorkflowProbe 2>&1) || LOGS_EXIT=$?
-  echo "$LOGS_OUTPUT"
-  echo "exit_code: $LOGS_EXIT"
-  {
-    echo "command: agent-relay agents:logs WorkflowProbe"
-    echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-    echo "$LOGS_OUTPUT"
-    echo "exit_code: $LOGS_EXIT"
-  } > "$ARTIFACTS/worker-logs.txt"
-  if echo "$LOGS_OUTPUT" | grep -qi "ping\|delivery\|received\|message\|sent"; then
-    echo "A11_PASS: worker logs show delivery evidence"
-  else
-    echo "A11_PARTIAL: worker logs captured (exit $LOGS_EXIT) but no delivery keyword found — reviewer must check"
-  fi
-
-} | tee "$ARTIFACTS/messaging-phase.log"
-
-echo "MESSAGING_PHASE_COMPLETE"
-`,
-  });
-
-  // ── Phase 6: Local History Validation ─────────────────────────────────────
-  //
-  // With RELAY_API_KEY unset, `agent-relay history` must either return local
-  // history OR emit a clean local-mode message. It must NOT instruct the user
-  // to set RELAY_API_KEY — that instruction is the regression being validated.
-  // Validates A12.
-
-  wf.step('phase-history', {
-    type: 'deterministic',
-    dependsOn: ['phase-messaging'],
-    captureOutput: true,
-    failOnError: true,
-    command: `
-set -uo pipefail
-
-ARTIFACTS="${ARTIFACTS_DIR}"
-# shellcheck source=/dev/null
-source "$ARTIFACTS/isolation.env"
-
-{
-  echo "=== local-history-validation ==="
-  echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-
-  # Ensure RELAY_API_KEY is unset for this check
-  unset RELAY_API_KEY 2>/dev/null || true
-  echo "RELAY_API_KEY: unset (confirmed)"
-
-  echo "--- command: agent-relay history (RELAY_API_KEY unset) ---"
-  HISTORY_EXIT=0
-  HISTORY_OUTPUT=$(agent-relay history 2>&1) || HISTORY_EXIT=$?
-  echo "$HISTORY_OUTPUT"
-  echo "exit_code: $HISTORY_EXIT"
-  {
-    echo "command: agent-relay history"
-    echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-    echo "RELAY_API_KEY: unset"
-    echo "$HISTORY_OUTPUT"
-    echo "exit_code: $HISTORY_EXIT"
-  } > "$ARTIFACTS/history-no-api-key.txt"
-
-  # A12: Must NOT instruct user to set RELAY_API_KEY
-  if echo "$HISTORY_OUTPUT" | grep -qi "set RELAY_API_KEY\|RELAY_API_KEY.*required\|set.*api.*key\|please set.*RELAY"; then
-    echo "A12_FAIL: history output incorrectly instructs user to set RELAY_API_KEY in local mode"
-    echo "  This is the original regression — local-mode history contract is broken"
-    exit 1
-  elif [ "$HISTORY_EXIT" -eq 0 ]; then
-    echo "A12_PASS: history returned local results (exit 0, no RELAY_API_KEY instruction)"
-  else
-    echo "A12_PASS: history exited $HISTORY_EXIT with a clean local-mode message (no RELAY_API_KEY instruction)"
-  fi
-
-} | tee "$ARTIFACTS/history-phase.log"
-
-echo "HISTORY_PHASE_COMPLETE"
-`,
-  });
-
-  // ── Phase 7: Cleanup and Artifact Collection ───────────────────────────────
-  //
-  // Stop the broker. Verify all required artifact files are present. Emit an
-  // artifact inventory log. Validates A13.
-
-  wf.step('phase-cleanup', {
-    type: 'deterministic',
-    dependsOn: ['phase-history'],
-    captureOutput: true,
-    failOnError: false, // Best-effort cleanup — do not mask a prior signal failure
-    command: `
-set -uo pipefail
-
-ARTIFACTS="${ARTIFACTS_DIR}"
-# shellcheck source=/dev/null
-source "$ARTIFACTS/isolation.env" 2>/dev/null || true
-
-{
-  echo "=== cleanup-and-artifact-collection ==="
-  echo "timestamp: $(date -u +%Y-%m-%dT%H:%M:%SZ)"
-
-  # Stop broker gracefully
-  echo "--- stopping broker (agent-relay down) ---"
-  DOWN_EXIT=0
-  DOWN_OUTPUT=$(agent-relay down 2>&1) || DOWN_EXIT=$?
-  echo "agent-relay down output: $DOWN_OUTPUT"
-  echo "agent-relay down exit_code: $DOWN_EXIT"
-
-  # Kill by PID as fallback
-  if [ -f "$ARTIFACTS/broker.pid" ]; then
-    BROKER_PID=$(cat "$ARTIFACTS/broker.pid")
-    kill "$BROKER_PID" 2>/dev/null && echo "sent SIGTERM to broker PID $BROKER_PID" || true
-  fi
-
-  # Verify all required artifact files are present (A13)
-  echo ""
-  echo "--- A13: artifact inventory ---"
-  REQUIRED=(
-    "env-manifest.txt"
-    "isolation.env"
-    "baseline-failure.txt"
-    "fixed-install.txt"
-    "broker-start.log"
-    "broker.pid"
-    "status.txt"
-    "spawn.txt"
-    "who.txt"
-    "send-default.txt"
-    "send-explicit.txt"
-    "worker-logs.txt"
-    "history-no-api-key.txt"
-    "messaging-phase.log"
-    "history-phase.log"
-  )
-
-  MISSING=0
-  for f in "\${REQUIRED[@]}"; do
-    if [ -f "$ARTIFACTS/$f" ]; then
-      SIZE=$(wc -c < "$ARTIFACTS/$f" | tr -d ' ')
-      echo "  [PRESENT \${SIZE} bytes] $f"
-    else
-      echo "  [MISSING] $f"
-      MISSING=$((MISSING + 1))
-    fi
-  done
-
-  if [ "$MISSING" -eq 0 ]; then
-    echo "A13_PASS: all required artifact files present"
-  else
-    echo "A13_FAIL: $MISSING artifact files missing"
-  fi
-
-  echo ""
-  echo "--- artifact directory listing ---"
-  ls -lah "$ARTIFACTS/" 2>&1 || true
-
-} | tee "$ARTIFACTS/cleanup-phase.log"
-
-echo "CLEANUP_PHASE_COMPLETE"
-`,
-  });
-
-  // ── Phase 8a: Dump artifacts for reviewer ─────────────────────────────────
-  //
-  // Dump all artifact content into a single step output so the reviewer agent
-  // can access everything via {{steps.phase-read-artifacts.output}}.
-
-  wf.step('phase-read-artifacts', {
-    type: 'deterministic',
-    dependsOn: ['phase-cleanup'],
-    captureOutput: true,
-    failOnError: false,
-    command: `
-set -uo pipefail
-ARTIFACTS="${ARTIFACTS_DIR}"
-
-echo "=== ARTIFACT DUMP FOR REVIEWER ==="
-echo ""
-
-dump_file() {
-  local name="$1"
-  echo "### $name ###"
-  if [ -f "$ARTIFACTS/$name" ]; then
-    cat "$ARTIFACTS/$name"
-  else
-    echo "(file missing)"
-  fi
-  echo ""
-}
-
-dump_file "env-manifest.txt"
-dump_file "baseline-failure.txt"
-dump_file "fixed-install.txt"
-dump_file "status.txt"
-dump_file "spawn.txt"
-dump_file "who.txt"
-dump_file "send-default.txt"
-dump_file "send-explicit.txt"
-dump_file "history-no-api-key.txt"
-dump_file "cleanup-phase.log"
-
-echo "### broker-start.log (last 60 lines) ###"
-if [ -f "$ARTIFACTS/broker-start.log" ]; then
-  tail -60 "$ARTIFACTS/broker-start.log"
-else
-  echo "(file missing)"
-fi
-echo ""
-
-dump_file "worker-logs.txt"
-dump_file "messaging-phase.log"
-dump_file "history-phase.log"
-`,
-  });
-
-  // ── Phase 8b: Reviewer verdict ─────────────────────────────────────────────
-  //
-  // The reviewer agent compares baseline-failure artifacts against fixed-run
-  // artifacts and produces verdict.md with a signal-by-signal PASS/FAIL table.
-
-  wf.step('phase-review', {
-    agent: 'reviewer',
-    dependsOn: ['phase-read-artifacts'],
-    task: `Review the clean-room end-to-end validation run against the acceptance contract.
-
-Acceptance contract:
-{{steps.acceptance-contract.output}}
-
-Artifacts collected during the validation run:
-{{steps.phase-read-artifacts.output}}
-
-For each acceptance signal A1–A13, evaluate the artifact evidence and state:
-- PASS — signal is clearly demonstrated
-- FAIL — signal is not met (provide specific evidence from artifacts)
-- PARTIAL — signal is partially met (provide what is missing)
-
-Then produce the final verdict with these exact sections:
-
-1. SIGNAL_RESULTS
-   (Table: signal | result | evidence snippet)
-
-2. PASS_FAIL
-   Overall PASS or FAIL. FAIL if ANY signal is FAIL.
-
-3. WHAT_PROBLEM_IT_PROVES
-   Describe which original failure class was exercised (stale shim, PATH shadowing,
-   local-mode history regression) and confirm it was fixed.
-
-4. WHAT_EVIDENCE_IT_COLLECTS
-   Describe the before/after artifact trail:
-   - baseline-failure.txt shows the broken state (A4 baseline half)
-   - fixed-install.txt + subsequent artifacts prove the fix (A1–A4 fixed half, A5–A12)
-
-5. RESIDUAL_RISKS
-   Any gaps in coverage, signals needing manual follow-up, or edge cases not covered.
-
-6. OS_SHELL_COVERAGE_NOTE
-   Confirm: primary proof is macOS local shell. Docker/cloud are secondary regression
-   only and do not cover the same macOS-specific failure surface.
-
-Write the complete verdict to ${ARTIFACTS_DIR}/verdict.md.
-
-End your response with REVIEW_COMPLETE.`,
-    verification: { type: 'output_contains', value: 'REVIEW_COMPLETE' },
-    retries: 2,
-  });
-
-  const result = await wf.run();
-  console.log(`Done: ${result.status} (${result.id})`);
-}
-
-main().catch(console.error);
diff --git a/workflows/relayauth-integration/examples/docs-writer.yaml b/workflows/relayauth-integration/examples/docs-writer.yaml
deleted file mode 100644
index d37651c10..000000000
--- a/workflows/relayauth-integration/examples/docs-writer.yaml
+++ /dev/null
@@ -1,68 +0,0 @@
-version: '1.0'
-name: docs-writer
-description: 'Documentation-only workflow with scoped writes and a deterministic sync step.'
-swarm:
-  pattern: handoff
-  maxConcurrency: 2
-  timeoutMs: 2400000
-  channel: swarm-docs-writer
-agents:
-  - name: writer
-    cli: claude
-    role: 'Writes and updates documentation without changing product code'
-    interactive: false
-    permissions:
-      access: restricted
-      files:
-        read: ['src/**', 'packages/**', 'README.md', 'docs/**']
-        write: ['docs/**', 'web/content/docs/**', '*.md', '*.mdx']
-        deny: ['.env*', '.git/**', 'secrets/**']
-
-  - name: proofreader
-    cli: claude
-    role: 'Reviews docs for accuracy, structure, and clarity'
-    interactive: false
-    permissions: readonly
-
-workflows:
-  - name: doc-sync
-    description: 'Draft documentation, review it, and mirror generated docs.'
-    onError: continue
-    steps:
-      - name: draft
-        type: agent
-        agent: writer
-        task: |
-          Update or create the documentation required for this request:
-          {{task}}
-        verification:
-          type: output_contains
-          value: DOCS_WRITTEN
-
-      - name: proofread
-        type: agent
-        agent: proofreader
-        dependsOn: [draft]
-        task: |
-          Review the drafted documentation for accuracy and readability.
-
-          Draft summary:
-          {{steps.draft.output}}
-        verification:
-          type: output_contains
-          value: REVIEW_COMPLETE
-
-      - name: sync-mirror
-        type: deterministic
-        dependsOn: [proofread]
-        command: node scripts/sync-docs.js
-
-      - name: final-summary
-        type: agent
-        agent: proofreader
-        dependsOn: [sync-mirror]
-        task: |
-          Confirm the docs change is ready to ship and summarize what changed.
-        verification:
-          type: output_contains
-          value: DONE
diff --git a/workflows/relayauth-integration/examples/full-team.yaml b/workflows/relayauth-integration/examples/full-team.yaml
deleted file mode 100644
index 5cb532164..000000000
--- a/workflows/relayauth-integration/examples/full-team.yaml
+++ /dev/null
@@ -1,128 +0,0 @@
-version: '1.0'
-name: full-team
-description: 'Full-stack feature workflow using reusable permission profiles and step overrides.'
-permissions:
-  profiles:
-    source-dev:
-      access: restricted
-      files:
-        read: ['src/**', 'packages/**', 'tests/**', 'package.json', 'tsconfig.json']
-        write: ['src/**', 'packages/**', 'tests/**']
-        deny: ['.env*', 'secrets/**', 'infrastructure/**']
-      network: false
-    reviewer:
-      access: readonly
-      files:
-        deny: ['.env*', 'secrets/**', '*.pem', '*.key']
-  default: readonly
-swarm:
-  pattern: hub-spoke
-  maxConcurrency: 4
-  timeoutMs: 3600000
-  channel: swarm-full-team
-agents:
-  - name: lead
-    cli: claude
-    role: 'Coordinates planning, review, and final sign-off'
-    permissions:
-      access: readwrite
-
-  - name: frontend
-    cli: codex
-    role: 'Implements UI components and page flows'
-    interactive: false
-    permissions: source-dev
-
-  - name: backend
-    cli: codex
-    role: 'Implements API handlers and business logic'
-    interactive: false
-    permissions: source-dev
-
-  - name: reviewer
-    cli: claude
-    role: 'Performs cross-stack review'
-    interactive: false
-    permissions: reviewer
-
-workflows:
-  - name: fullstack-feature
-    description: 'Plan, implement UI and API in parallel, then review and ship.'
-    onError: retry
-    steps:
-      - name: plan
-        type: agent
-        agent: lead
-        task: |
-          Produce a cross-stack plan for this feature request:
-          {{task}}
-        verification:
-          type: output_contains
-          value: PLAN_COMPLETE
-
-      - name: ui
-        type: agent
-        agent: frontend
-        dependsOn: [plan]
-        permissions:
-          access: restricted
-          files:
-            read: ['src/**', 'packages/**', 'package.json']
-            write: ['src/components/**', 'src/pages/**', 'src/styles/**']
-            deny: ['.env*', 'src/server/**']
-        task: |
-          Build the UI portion of the feature plan.
-
-          Plan:
-          {{steps.plan.output}}
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-
-      - name: api
-        type: agent
-        agent: backend
-        dependsOn: [plan]
-        permissions:
-          access: restricted
-          files:
-            read: ['src/**', 'packages/**', 'package.json']
-            write: ['src/server/**', 'src/api/**', 'packages/sdk/src/**']
-            deny: ['.env*', 'src/components/**']
-        task: |
-          Build the API and business logic portion of the feature plan.
-
-          Plan:
-          {{steps.plan.output}}
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-
-      - name: review
-        type: agent
-        agent: reviewer
-        dependsOn: [ui, api]
-        task: |
-          Review the combined frontend and backend work for correctness, cohesion, and risk.
-
-          UI result:
-          {{steps.ui.output}}
-
-          API result:
-          {{steps.api.output}}
-        verification:
-          type: output_contains
-          value: REVIEW_COMPLETE
-
-      - name: ship
-        type: agent
-        agent: lead
-        dependsOn: [review]
-        task: |
-          Produce final sign-off and summarize any follow-up work.
-
-          Review:
-          {{steps.review.output}}
-        verification:
-          type: output_contains
-          value: DONE
diff --git a/workflows/relayauth-integration/examples/power-user.yaml b/workflows/relayauth-integration/examples/power-user.yaml
deleted file mode 100644
index 4bdddfdeb..000000000
--- a/workflows/relayauth-integration/examples/power-user.yaml
+++ /dev/null
@@ -1,109 +0,0 @@
-version: '1.0'
-name: power-user
-description: 'Advanced example showing reusable profiles, full access, and granular network and exec controls.'
-permissions:
-  profiles:
-    repo-readonly:
-      access: readonly
-      files:
-        deny: ['.env*', 'secrets/**', '*.pem', '*.key']
-    bounded-dev:
-      access: restricted
-      files:
-        read: ['src/**', 'scripts/**', 'tests/**', 'package.json', 'tsconfig.json']
-        write: ['src/**', 'scripts/**', 'tests/**']
-        deny: ['infra/**', '.env*', 'secrets/**']
-      exec: ['npm test', 'npm run lint', 'node scripts/']
-    release-manager:
-      access: full
-      exec: ['git status', 'git diff', 'git tag', 'git archive']
-  default: repo-readonly
-swarm:
-  pattern: dag
-  maxConcurrency: 3
-  timeoutMs: 4200000
-  channel: swarm-power-user
-agents:
-  - name: architect
-    cli: claude
-    role: 'Designs the plan and enforces guardrails'
-    permissions: repo-readonly
-
-  - name: implementer
-    cli: codex
-    role: 'Implements the approved changes inside a bounded scope'
-    interactive: false
-    permissions: bounded-dev
-
-  - name: verifier
-    cli: gemini
-    role: 'Verifies behavior, risks, and release readiness'
-    interactive: false
-    permissions: repo-readonly
-
-  - name: release
-    cli: claude
-    role: 'Produces a release artifact summary with elevated local access'
-    interactive: false
-    permissions: release-manager
-
-workflows:
-  - name: advanced-delivery
-    description: 'Plan, implement, verify, and package a change using the most expressive permission options.'
-    onError: retry
-    steps:
-      - name: plan
-        type: agent
-        agent: architect
-        task: |
-          Produce an implementation plan and explicit acceptance criteria:
-          {{task}}
-        verification:
-          type: output_contains
-          value: PLAN_COMPLETE
-
-      - name: implement
-        type: agent
-        agent: implementer
-        dependsOn: [plan]
-        permissions:
-          access: restricted
-          files:
-            read: ['src/**', 'scripts/**', 'tests/**', 'package.json']
-            write: ['src/features/**', 'src/lib/**', 'tests/**']
-            deny: ['infra/**', '.env*', 'secrets/**']
-          exec: ['npm test', 'npm run lint']
-        task: |
-          Implement the approved plan within the narrowed file and command scope.
-
-          Plan:
-          {{steps.plan.output}}
-        verification:
-          type: output_contains
-          value: IMPLEMENTATION_COMPLETE
-
-      - name: verify
-        type: agent
-        agent: verifier
-        dependsOn: [implement]
-        task: |
-          Verify correctness, regressions, and release risk.
-
-          Implementation summary:
-          {{steps.implement.output}}
-        verification:
-          type: output_contains
-          value: VERIFICATION_COMPLETE
-
-      - name: package-release
-        type: agent
-        agent: release
-        dependsOn: [verify]
-        task: |
-          Prepare a release artifact summary and local packaging notes.
-
-          Verification:
-          {{steps.verify.output}}
-        verification:
-          type: output_contains
-          value: DONE
diff --git a/workflows/relayauth-integration/examples/review-readonly.yaml b/workflows/relayauth-integration/examples/review-readonly.yaml
deleted file mode 100644
index 3e0dedb1d..000000000
--- a/workflows/relayauth-integration/examples/review-readonly.yaml
+++ /dev/null
@@ -1,91 +0,0 @@
-version: '1.0'
-name: review-readonly
-description: 'Parallel code review with readonly agents and explicit secret deny rules.'
-swarm:
-  pattern: fan-out
-  maxConcurrency: 3
-  timeoutMs: 2400000
-  channel: swarm-review-readonly
-agents:
-  - name: lead
-    cli: claude
-    role: 'Aggregates review findings and final recommendation'
-    permissions: readonly
-
-  - name: style-reviewer
-    cli: claude
-    role: 'Checks style, naming, and readability'
-    interactive: false
-    permissions:
-      access: readonly
-      files:
-        deny: ['.env*', 'secrets/**', '*.pem', '*.key']
-
-  - name: logic-reviewer
-    cli: codex
-    role: 'Checks logic, edge cases, and regressions'
-    interactive: false
-    permissions:
-      access: readonly
-      files:
-        deny: ['.env*', 'secrets/**', '*.pem', '*.key']
-
-workflows:
-  - name: review
-    description: 'Capture current changes, review in parallel, and synthesize a verdict.'
-    onError: fail
-    steps:
-      - name: capture-diff
-        type: deterministic
-        command: git diff HEAD~1 2>/dev/null || git diff 2>/dev/null || echo "No changes"
-        captureOutput: true
-
-      - name: capture-files
-        type: deterministic
-        dependsOn: [capture-diff]
-        command: git diff --name-only HEAD~1 2>/dev/null || git diff --name-only 2>/dev/null || echo "No files"
-        captureOutput: true
-
-      - name: style
-        type: agent
-        agent: style-reviewer
-        dependsOn: [capture-diff, capture-files]
-        task: |
-          Review style and readability for these changes:
-          Files: {{steps.capture-files.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-        verification:
-          type: output_contains
-          value: REVIEW_COMPLETE
-
-      - name: logic
-        type: agent
-        agent: logic-reviewer
-        dependsOn: [capture-diff, capture-files]
-        task: |
-          Review correctness, regressions, and missing tests for these changes:
-          Files: {{steps.capture-files.output}}
-
-          Diff:
-          {{steps.capture-diff.output}}
-        verification:
-          type: output_contains
-          value: REVIEW_COMPLETE
-
-      - name: summarize
-        type: agent
-        agent: lead
-        dependsOn: [style, logic]
-        task: |
-          Combine the review findings into a single verdict.
-
-          Style review:
-          {{steps.style.output}}
-
-          Logic review:
-          {{steps.logic.output}}
-        verification:
-          type: output_contains
-          value: DONE
diff --git a/workflows/relayauth-integration/examples/security-audit.yaml b/workflows/relayauth-integration/examples/security-audit.yaml
deleted file mode 100644
index 1816a90ec..000000000
--- a/workflows/relayauth-integration/examples/security-audit.yaml
+++ /dev/null
@@ -1,93 +0,0 @@
-version: '1.0'
-name: security-audit
-description: 'Security review with readonly access, scoped network allowlists, and bounded exec.'
-swarm:
-  pattern: hub-spoke
-  maxConcurrency: 2
-  timeoutMs: 3600000
-  channel: swarm-security-audit-example
-agents:
-  - name: auditor
-    cli: claude
-    role: 'Scans for application and dependency vulnerabilities'
-    interactive: false
-    permissions:
-      access: readonly
-      network:
-        allow: ['registry.npmjs.org:443', 'github.com:443', 'nvd.nist.gov:443']
-        deny: ['*']
-      exec: ['npm audit', 'npx snyk test', 'git diff']
-
-  - name: dependency-checker
-    cli: codex
-    role: 'Inspects manifest files and dependency CVEs'
-    interactive: false
-    permissions:
-      access: readonly
-      files:
-        read: ['package.json', 'package-lock.json', 'pnpm-lock.yaml', 'Cargo.toml', 'Cargo.lock']
-        deny: ['.env*', 'secrets/**']
-      network:
-        allow: ['registry.npmjs.org:443']
-        deny: ['*']
-      exec: ['npm audit']
-
-  - name: reporter
-    cli: claude
-    role: 'Compiles findings into a single security report'
-    interactive: false
-    permissions:
-      access: readonly
-      network: false
-
-workflows:
-  - name: audit
-    description: 'Run deterministic dependency scan, parallel audits, and consolidate the report.'
-    onError: fail
-    steps:
-      - name: dep-scan
-        type: deterministic
-        command: npm audit --json 2>/dev/null || echo '{}'
-        captureOutput: true
-
-      - name: code-scan
-        type: agent
-        agent: auditor
-        dependsOn: [dep-scan]
-        task: |
-          Review the repository for OWASP-style risks, secret exposure, and insecure patterns.
-
-          Dependency scan:
-          {{steps.dep-scan.output}}
-        verification:
-          type: output_contains
-          value: SCAN_COMPLETE
-
-      - name: dep-review
-        type: agent
-        agent: dependency-checker
-        dependsOn: [dep-scan]
-        task: |
-          Review dependency vulnerabilities and recommend remediation priorities.
-
-          Dependency scan:
-          {{steps.dep-scan.output}}
-        verification:
-          type: output_contains
-          value: CHECK_COMPLETE
-
-      - name: report
-        type: agent
-        agent: reporter
-        dependsOn: [code-scan, dep-review]
-        task: |
-          Compile a final security report with severity, evidence, and next actions.
-
-          Code scan:
-          {{steps.code-scan.output}}
-
-          Dependency review:
-          {{steps.dep-review.output}}
-        verification:
-          type: output_contains
-          value: REPORT_COMPLETE
diff --git a/workflows/relayauth-integration/examples/test-scoped.yaml b/workflows/relayauth-integration/examples/test-scoped.yaml
deleted file mode 100644
index e36179c12..000000000
--- a/workflows/relayauth-integration/examples/test-scoped.yaml
+++ /dev/null
@@ -1,84 +0,0 @@
-version: '1.0'
-name: test-scoped
-description: 'Test-fix loop with scoped write access limited to test files.'
-swarm:
-  pattern: hub-spoke
-  maxConcurrency: 2
-  timeoutMs: 2700000
-  channel: swarm-test-scoped
-agents:
-  - name: runner
-    cli: codex
-    role: 'Analyzes test failures and execution output'
-    interactive: false
-    permissions:
-      access: readonly
-      exec: ['npm test', 'npx vitest', 'npx jest', 'pnpm test']
-      network: false
-
-  - name: fixer
-    cli: codex
-    role: 'Fixes test failures without touching production source files'
-    interactive: false
-    permissions:
-      access: restricted
-      files:
-        read: ['src/**', 'tests/**', 'package.json', 'pnpm-lock.yaml', 'package-lock.json', 'tsconfig.json']
-        write: ['tests/**', '**/*.test.ts', '**/*.test.tsx', '**/*.spec.ts', '**/*.spec.tsx']
-        deny: ['.env*', 'secrets/**', 'node_modules/**']
-
-workflows:
-  - name: test-fix
-    description: 'Run tests, analyze failures, and repair only test assets.'
-    onError: retry
-    steps:
-      - name: run-tests
-        type: deterministic
-        command: npm test 2>&1 || pnpm test 2>&1 || npx vitest run 2>&1 || true
-        captureOutput: true
-
-      - name: analyze
-        type: agent
-        agent: runner
-        dependsOn: [run-tests]
-        task: |
-          Analyze the failing test output and identify the minimal safe fix.
-
-          Test output:
-          {{steps.run-tests.output}}
-        verification:
-          type: output_contains
-          value: ANALYSIS_COMPLETE
-
-      - name: fix
-        type: agent
-        agent: fixer
-        dependsOn: [analyze]
-        task: |
-          Update only tests or test helpers to resolve the failures.
-
-          Failure analysis:
-          {{steps.analyze.output}}
-        retries: 2
-        verification:
-          type: output_contains
-          value: TESTS_PASSED
-
-      - name: rerun-tests
-        type: deterministic
-        dependsOn: [fix]
-        command: npm test 2>&1 || pnpm test 2>&1 || npx vitest run 2>&1 || true
-        captureOutput: true
-
-      - name: report
-        type: agent
-        agent: runner
-        dependsOn: [rerun-tests]
-        task: |
-          Summarize the final test status and any remaining failures.
-
-          Final test output:
-          {{steps.rerun-tests.output}}
-        verification:
-          type: output_contains
-          value: DONE