diff --git a/.archon/workflows/defaults/archon-workflow-builder.yaml b/.archon/workflows/defaults/archon-workflow-builder.yaml
index a12758b0ec..f0b321fd96 100644
--- a/.archon/workflows/defaults/archon-workflow-builder.yaml
+++ b/.archon/workflows/defaults/archon-workflow-builder.yaml
@@ -178,7 +178,7 @@ nodes:
       5. Use `bash` nodes for deterministic shell operations (file checks, git commands, installs)
       6. Use `script` nodes for typed data transforms (TypeScript JSON parsing, Python with deps)
          — stdout is captured as output, stderr is forwarded as a warning.
-         $nodeId.output is NOT shell-quoted in script bodies.
+         `$nodeId.output` is NOT shell-quoted in script bodies.
          - **TypeScript/bun**: assign directly — `const data = $nodeId.output;`
            (JSON is valid JS expression syntax; avoid String.raw — it breaks on backticks)
          - **Python/uv**: use json.loads — `import json; data = json.loads("""$nodeId.output""")`
diff --git a/packages/workflows/src/defaults/bundled-defaults.generated.ts b/packages/workflows/src/defaults/bundled-defaults.generated.ts
index 43ffbb6f9b..953bf94cf5 100644
--- a/packages/workflows/src/defaults/bundled-defaults.generated.ts
+++ b/packages/workflows/src/defaults/bundled-defaults.generated.ts
@@ -74,5 +74,5 @@ export const BUNDLED_WORKFLOWS: Record<string, string> = {
   "archon-smart-pr-review": "name: archon-smart-pr-review\ndescription: |\n  Use when: User wants a smart, efficient PR review that adapts to PR complexity.\n  Triggers: \"smart review\", \"review this PR\", \"review PR #123\", \"efficient review\",\n            \"smart PR review\", \"quick review\".\n  Does: Gathers PR scope -> classifies complexity -> routes to only relevant review agents ->\n        synthesizes findings -> auto-fixes CRITICAL/HIGH issues.\n  NOT for: When you explicitly want ALL review agents (use archon-comprehensive-pr-review instead).\n\n  Unlike the comprehensive review, this workflow classifies the PR first and only runs\n  the review agents that are relevant. A 3-line typo fix skips test-coverage and docs-impact.\n\nnodes:\n  - id: scope\n    command: archon-pr-review-scope\n\n  - id: sync\n    command: archon-sync-pr-with-main\n    depends_on: [scope]\n\n  - id: classify\n    prompt: |\n      You are a PR complexity classifier. Analyze the PR scope below and determine\n      which review agents should run.\n\n      ## PR Scope\n      $scope.output\n\n      ## Rules\n      - **Code review**: Always run unless the diff is empty or only touches non-code files\n        (e.g. README-only, config-only, or .yaml-only changes).\n      - **Error handling**: Run if the diff touches code with try/catch, error handling,\n        async/await, or adds new failure paths.\n      - **Test coverage**: Run if the diff touches source code (not just tests, docs, or config).\n      - **Comment quality**: Run if the diff adds or modifies comments, docstrings, JSDoc,\n        or significant documentation within code files.\n      - **Docs impact**: Run if the diff adds/removes/renames public APIs, commands, CLI flags,\n        environment variables, or user-facing features.\n\n      Classify the PR complexity:\n      - **trivial**: Typo fixes, formatting, single-line changes, version bumps\n      - **small**: 1-3 files, straightforward logic, no architectural changes\n      - **medium**: 4-10 files, moderate logic changes, some cross-cutting concerns\n      - **large**: 10+ files, architectural changes, new subsystems, complex refactors\n\n      Provide your reasoning for each decision.\n    depends_on: [scope]\n    model: haiku\n    allowed_tools: []\n    output_format:\n      type: object\n      properties:\n        run_code_review:\n          type: string\n          enum: [\"true\", \"false\"]\n        run_error_handling:\n          type: string\n          enum: [\"true\", \"false\"]\n        run_test_coverage:\n          type: string\n          enum: [\"true\", \"false\"]\n        run_comment_quality:\n          type: string\n          enum: [\"true\", \"false\"]\n        run_docs_impact:\n          type: string\n          enum: [\"true\", \"false\"]\n        complexity:\n          type: string\n          enum: [\"trivial\", \"small\", \"medium\", \"large\"]\n        reasoning:\n          type: string\n      required:\n        - run_code_review\n        - run_error_handling\n        - run_test_coverage\n        - run_comment_quality\n        - run_docs_impact\n        - complexity\n        - reasoning\n\n  - id: code-review\n    command: archon-code-review-agent\n    depends_on: [classify, sync]\n    when: \"$classify.output.run_code_review == 'true'\"\n\n  - id: error-handling\n    command: archon-error-handling-agent\n    depends_on: [classify, sync]\n    when: \"$classify.output.run_error_handling == 'true'\"\n\n  - id: test-coverage\n    command: archon-test-coverage-agent\n    depends_on: [classify, sync]\n    when: \"$classify.output.run_test_coverage == 'true'\"\n\n  - id: comment-quality\n    command: archon-comment-quality-agent\n    depends_on: [classify, sync]\n    when: \"$classify.output.run_comment_quality == 'true'\"\n\n  - id: docs-impact\n    command: archon-docs-impact-agent\n    depends_on: [classify, sync]\n    when: \"$classify.output.run_docs_impact == 'true'\"\n\n  - id: synthesize\n    command: archon-synthesize-review\n    depends_on: [code-review, error-handling, test-coverage, comment-quality, docs-impact]\n    trigger_rule: one_success\n\n  - id: implement-fixes\n    command: archon-implement-review-fixes\n    depends_on: [synthesize]\n\n  # Optional: push notification when review completes.\n  # To enable, create .archon/mcp/ntfy.json — see docs/mcp-servers.md\n  - id: check-ntfy\n    bash: \"test -f .archon/mcp/ntfy.json && echo 'true' || echo 'false'\"\n    depends_on: [implement-fixes]\n\n  - id: notify\n    depends_on: [check-ntfy, synthesize, implement-fixes]\n    when: \"$check-ntfy.output == 'true'\"\n    trigger_rule: all_success\n    mcp: .archon/mcp/ntfy.json\n    allowed_tools: []\n    prompt: |\n      Send a push notification summarizing the PR review results.\n\n      Review synthesis:\n      $synthesize.output\n\n      Fix results:\n      $implement-fixes.output\n\n      Send with:\n      - title: \"PR Review Complete\"\n      - message: 1-2 sentence summary — verdict and issue count. Short enough for a lock screen.\n      - priority: 3 if ready to merge, 4 if needs fixes, 5 if critical issues remain\n",
   "archon-test-loop-dag": "name: archon-test-loop-dag\ndescription: |\n  Use when: User explicitly says \"test-loop-dag\" or \"run test-loop-dag\".\n  IMPORTANT: This is a DAG workflow with a loop node that iterates until completion.\n  NOT for: General testing questions or debugging.\n  Does: Initializes a counter, iterates until it reaches 3, then reports completion.\n\nnodes:\n  - id: setup\n    bash: |\n      echo \"0\" > .archon/test-loop-dag-counter.txt\n      echo \"Counter initialized to 0\"\n\n  - id: loop-counter\n    depends_on: [setup]\n    loop:\n      prompt: |\n        You are testing the loop node functionality within a DAG workflow.\n\n        ## Your Task\n\n        1. Read the file `.archon/test-loop-dag-counter.txt`\n        2. Parse the current counter value\n        3. Increment it by 1\n        4. Write the new value back to the file\n        5. Report the current iteration\n\n        ## User Intent\n\n        $USER_MESSAGE\n\n        ## Completion Criteria\n\n        - If the counter reaches 3 or higher, output: <promise>COMPLETE</promise>\n        - Otherwise, just report your progress and end normally\n\n        ## Important\n\n        Be concise. Just do the task and report the counter value.\n      until: COMPLETE\n      max_iterations: 5\n      fresh_context: false\n\n  - id: report\n    depends_on: [loop-counter]\n    prompt: |\n      The loop counter test has completed. The loop node output was:\n\n      $loop-counter.output\n\n      Read `.archon/test-loop-dag-counter.txt` and confirm the final counter value.\n      Report: \"Test loop DAG completed successfully. Final counter: {value}\"\n",
   "archon-validate-pr": "name: archon-validate-pr\ndescription: |\n  Use when: User wants a thorough PR validation that tests both main (bug present) and feature branch (bug fixed).\n  Triggers: \"validate PR\", \"validate pr #123\", \"test this PR\", \"verify PR\", \"full PR validation\",\n            \"validate pull request\", \"test PR end-to-end\".\n  Does: Fetches PR info -> finds free ports -> parallel code review (main vs feature) ->\n        E2E test on main (reproduce bug) -> E2E test on feature (verify fix) -> final verdict report.\n  NOT for: Quick code-only reviews (use archon-smart-pr-review), fixing issues, general exploration.\n\n  This workflow is designed for running in parallel — each instance finds its own free ports\n  to avoid conflicts. Produces artifacts in $ARTIFACTS_DIR/ and posts a validation report.\n\nprovider: claude\nmodel: opus\n\nnodes:\n  # ═══════════════════════════════════════════════════════════════\n  # PHASE 1: SETUP — Fetch PR info and allocate ports\n  # ═══════════════════════════════════════════════════════════════\n\n  - id: fetch-pr\n    bash: |\n      # Extract PR number from arguments\n      PR_NUMBER=$(echo \"$ARGUMENTS\" | grep -oE '/pull/[0-9]+' | grep -oE '[0-9]+' | head -1)\n      # Fallback: extract first number if no URL path found (e.g., \"validate PR 42\")\n      if [ -z \"$PR_NUMBER\" ]; then\n        PR_NUMBER=$(echo \"$ARGUMENTS\" | grep -oE '[0-9]+' | head -1)\n      fi\n      if [ -z \"$PR_NUMBER\" ]; then\n        # Try getting PR from current branch\n        PR_NUMBER=$(gh pr view --json number -q '.number' 2>/dev/null)\n      fi\n\n      if [ -z \"$PR_NUMBER\" ]; then\n        echo \"ERROR: No PR number found in arguments: $ARGUMENTS\"\n        exit 1\n      fi\n\n      echo \"$PR_NUMBER\" > \"$ARTIFACTS_DIR/.pr-number\"\n\n      # Fetch full PR details\n      gh pr view \"$PR_NUMBER\" --json number,title,body,url,headRefName,baseRefName,files,additions,deletions,changedFiles,state,author,labels,isDraft\n\n  - id: find-ports\n    bash: |\n      # Use Bun to let the OS pick truly free ports (cross-platform: Linux, macOS, Windows)\n      BACKEND_PORT=$(bun -e \"const s = Bun.serve({port: 0, fetch: () => new Response('')}); console.log(s.port); s.stop()\")\n      FRONTEND_PORT=$(bun -e \"const s = Bun.serve({port: 0, fetch: () => new Response('')}); console.log(s.port); s.stop()\")\n\n      echo \"$BACKEND_PORT\" > \"$ARTIFACTS_DIR/.backend-port\"\n      echo \"$FRONTEND_PORT\" > \"$ARTIFACTS_DIR/.frontend-port\"\n\n      echo \"BACKEND_PORT=$BACKEND_PORT\"\n      echo \"FRONTEND_PORT=$FRONTEND_PORT\"\n\n  - id: resolve-paths\n    bash: |\n      # Resolve canonical repo path (main branch) vs worktree path (feature branch)\n      CANONICAL_REPO=$(git rev-parse --path-format=absolute --git-common-dir 2>/dev/null | sed 's|/\\.git$||')\n      WORKTREE_PATH=$(pwd)\n      FEATURE_BRANCH=$(git branch --show-current)\n\n      # Get PR branch info\n      PR_NUMBER=$(cat \"$ARTIFACTS_DIR/.pr-number\")\n      PR_HEAD=$(gh pr view \"$PR_NUMBER\" --json headRefName -q '.headRefName')\n      PR_BASE=$(gh pr view \"$PR_NUMBER\" --json baseRefName -q '.baseRefName')\n\n      echo \"$CANONICAL_REPO\" > \"$ARTIFACTS_DIR/.canonical-repo\"\n      echo \"$WORKTREE_PATH\" > \"$ARTIFACTS_DIR/.worktree-path\"\n      echo \"$FEATURE_BRANCH\" > \"$ARTIFACTS_DIR/.feature-branch\"\n      echo \"$PR_HEAD\" > \"$ARTIFACTS_DIR/.pr-head\"\n      echo \"$PR_BASE\" > \"$ARTIFACTS_DIR/.pr-base\"\n\n      echo \"CANONICAL_REPO=$CANONICAL_REPO\"\n      echo \"WORKTREE_PATH=$WORKTREE_PATH\"\n      echo \"FEATURE_BRANCH=$FEATURE_BRANCH\"\n      echo \"PR_HEAD=$PR_HEAD\"\n      echo \"PR_BASE=$PR_BASE\"\n    depends_on: [fetch-pr]\n\n  # ═══════════════════════════════════════════════════════════════\n  # PHASE 2: CODE REVIEW — Parallel analysis of main vs feature\n  # ═══════════════════════════════════════════════════════════════\n\n  - id: code-review-main\n    command: archon-validate-pr-code-review-main\n    depends_on: [fetch-pr, resolve-paths]\n    context: fresh\n\n  - id: code-review-feature\n    command: archon-validate-pr-code-review-feature\n    depends_on: [fetch-pr, resolve-paths, code-review-main]\n    context: fresh\n\n  # ═══════════════════════════════════════════════════════════════\n  # PHASE 3: E2E TESTING — Sequential (after code reviews finish)\n  # ═══════════════════════════════════════════════════════════════\n\n  - id: classify-testability\n    prompt: |\n      You are a PR testability classifier. Determine whether this PR's changes can be\n      validated via browser E2E testing, or if it requires code-review-only validation.\n\n      ## PR Details\n\n      $fetch-pr.output\n\n      ## Rules\n\n      - **e2e_testable**: Changes affect the Web UI (components, hooks, styles, API routes\n        that serve the frontend, SSE streaming, layout, user-visible behavior). These can be\n        validated by starting Archon and using agent-browser to interact with the UI.\n      - **code_review_only**: Changes are purely backend logic, CLI-only, workflow engine,\n        database schemas, git operations, build tooling, tests, documentation, or other\n        non-UI code. No visual validation possible.\n\n      Consider: even if a change is backend, if it affects what the frontend displays\n      (e.g., API response format changes, SSE event changes), it IS e2e_testable.\n    depends_on: [fetch-pr]\n    model: haiku\n    allowed_tools: []\n    output_format:\n      type: object\n      properties:\n        testable:\n          type: string\n          enum: [\"e2e_testable\", \"code_review_only\"]\n        reasoning:\n          type: string\n        test_plan:\n          type: string\n      required: [testable, reasoning, test_plan]\n\n  - id: e2e-test-main\n    command: archon-validate-pr-e2e-main\n    depends_on: [classify-testability, find-ports, resolve-paths, code-review-main, code-review-feature]\n    when: \"$classify-testability.output.testable == 'e2e_testable'\"\n    context: fresh\n    idle_timeout: 1800000\n\n  - id: e2e-test-feature\n    command: archon-validate-pr-e2e-feature\n    depends_on: [e2e-test-main, find-ports, resolve-paths]\n    when: \"$classify-testability.output.testable == 'e2e_testable'\"\n    context: fresh\n    idle_timeout: 1800000\n\n  # ═══════════════════════════════════════════════════════════════\n  # PHASE 4: FINAL REPORT — Synthesize all findings\n  # ═══════════════════════════════════════════════════════════════\n\n  - id: cleanup-processes\n    bash: |\n      # Safety net: kill any orphaned processes from E2E testing\n      # This runs after E2E nodes complete (or timeout/fail) to prevent process accumulation\n      BACKEND_PORT=$(cat \"$ARTIFACTS_DIR/.backend-port\" 2>/dev/null | tr -d '\\n')\n      FRONTEND_PORT=$(cat \"$ARTIFACTS_DIR/.frontend-port\" 2>/dev/null | tr -d '\\n')\n\n      if [ -z \"$BACKEND_PORT\" ] || [ -z \"$FRONTEND_PORT\" ]; then\n        echo \"No port files found — skipping cleanup\"\n        exit 0\n      fi\n\n      echo \"Cleaning up ports $BACKEND_PORT and $FRONTEND_PORT...\"\n\n      # Kill by all recorded PID files\n      for pidfile in \"$ARTIFACTS_DIR\"/.e2e-*-pid; do\n        if [ -f \"$pidfile\" ]; then\n          PID=$(cat \"$pidfile\" | tr -d '\\n')\n          echo \"Killing PID $PID from $pidfile\"\n          kill \"$PID\" 2>/dev/null || taskkill //F //T //PID \"$PID\" 2>/dev/null || true\n        fi\n      done\n\n      # Kill by port (cross-platform fallback)\n      for PORT in $BACKEND_PORT $FRONTEND_PORT; do\n        fuser -k \"$PORT/tcp\" 2>/dev/null || true\n        lsof -ti:\"$PORT\" 2>/dev/null | xargs kill -9 2>/dev/null || true\n        netstat -ano 2>/dev/null | grep \":$PORT \" | grep LISTENING | awk '{print $5}' | sort -u | while read pid; do\n          taskkill //F //T //PID \"$pid\" 2>/dev/null || true\n        done\n      done\n\n      # pkill fallback: catch processes that escaped PID/port cleanup\n      pkill -f \"PORT=$BACKEND_PORT.*bun\" 2>/dev/null || true\n      pkill -f \"vite.*port.*$FRONTEND_PORT\" 2>/dev/null || true\n\n      # Close this workflow's browser session only (scoped by session ID)\n      BROWSER_SESSION=$(cat \"$ARTIFACTS_DIR/.browser-session\" 2>/dev/null | tr -d '\\n')\n      if [ -n \"$BROWSER_SESSION\" ]; then\n        agent-browser --session \"$BROWSER_SESSION\" close 2>/dev/null || true\n      fi\n\n      # Remove main E2E worktree if it still exists (safety net)\n      CANONICAL_REPO=$(cat \"$ARTIFACTS_DIR/.canonical-repo\" 2>/dev/null | tr -d '\\n')\n      MAIN_E2E_PATH=$(cat \"$ARTIFACTS_DIR/.e2e-main-worktree\" 2>/dev/null | tr -d '\\n')\n      if [ -n \"$MAIN_E2E_PATH\" ] && [ -n \"$CANONICAL_REPO\" ] && [ -d \"$MAIN_E2E_PATH\" ]; then\n        echo \"Removing leftover main E2E worktree: $MAIN_E2E_PATH\"\n        git -C \"$CANONICAL_REPO\" worktree remove \"$MAIN_E2E_PATH\" --force 2>/dev/null || rm -rf \"$MAIN_E2E_PATH\"\n      fi\n\n      sleep 1\n      echo \"Process cleanup complete\"\n    depends_on: [e2e-test-main, e2e-test-feature]\n    trigger_rule: all_done\n\n  - id: final-report\n    command: archon-validate-pr-report\n    depends_on: [code-review-main, code-review-feature, e2e-test-main, e2e-test-feature, classify-testability, cleanup-processes]\n    trigger_rule: all_done\n    context: fresh\n",
-  "archon-workflow-builder": "name: archon-workflow-builder\ndescription: |\n  Use when: User wants to create a new custom workflow for their project.\n  Triggers: \"build me a workflow\", \"create a workflow\", \"generate a workflow\",\n            \"new workflow\", \"make a workflow for\", \"workflow builder\".\n  Does: Scans codebase -> extracts intent (JSON) -> generates YAML -> validates -> saves.\n  NOT for: Editing existing workflows or creating non-workflow files.\n\nnodes:\n  - id: scan-codebase\n    bash: |\n      echo \"=== Existing Commands ===\"\n      if [ -d \".archon/commands\" ]; then\n        find .archon/commands -type f -name \"*.md\" 2>/dev/null | head -30\n      else\n        echo \"(no .archon/commands/ directory)\"\n      fi\n\n      echo \"\"\n      echo \"=== Existing Workflows ===\"\n      if [ -d \".archon/workflows\" ]; then\n        find .archon/workflows -type f \\( -name \"*.yaml\" -o -name \"*.yml\" \\) 2>/dev/null | head -30\n      else\n        echo \"(no .archon/workflows/ directory)\"\n      fi\n\n      echo \"\"\n      echo \"=== Package Info ===\"\n      if [ -f \"package.json\" ]; then\n        grep -E '\"name\"|\"scripts\"' package.json | head -10\n      else\n        echo \"(no package.json)\"\n      fi\n\n      echo \"\"\n      echo \"=== Project Context (CLAUDE.md first 50 lines) ===\"\n      if [ -f \"CLAUDE.md\" ]; then\n        head -50 CLAUDE.md\n      else\n        echo \"(no CLAUDE.md)\"\n      fi\n\n  - id: extract-intent\n    prompt: |\n      You are a workflow design classifier. Given a user's description of what they want\n      a workflow to do, extract structured intent.\n\n      ## User's Request\n      $ARGUMENTS\n\n      ## Codebase Context\n      $scan-codebase.output\n\n      ## Instructions\n\n      Analyze the user's request and the existing codebase to determine:\n      1. A kebab-case workflow name (e.g., \"lint-and-test\", \"deploy-staging\")\n      2. A description following the Archon pattern (Use when / Triggers / Does / NOT for)\n      3. Trigger phrases the router should match\n      4. A list of proposed nodes with their types and purposes\n      5. Whether this should be a simple DAG or include a loop node\n\n      Be specific and concrete. Each proposed node should have a clear type\n      (bash, prompt, command, script, loop, or approval) and a one-line\n      description of what it does.\n    model: haiku\n    allowed_tools: []\n    output_format:\n      type: object\n      properties:\n        workflow_name:\n          type: string\n        description:\n          type: string\n        trigger_phrases:\n          type: string\n        proposed_nodes:\n          type: string\n        execution_mode:\n          type: string\n          enum: [\"dag\", \"loop\"]\n      required: [workflow_name, description, trigger_phrases, proposed_nodes, execution_mode]\n    depends_on: [scan-codebase]\n\n  - id: generate-yaml\n    prompt: |\n      You are an Archon workflow author. Generate a complete, valid workflow YAML file\n      based on the structured intent provided.\n\n      ## Intent\n      - **Name**: $extract-intent.output.workflow_name\n      - **Description**: $extract-intent.output.description\n      - **Trigger Phrases**: $extract-intent.output.trigger_phrases\n      - **Proposed Nodes**: $extract-intent.output.proposed_nodes\n      - **Execution Mode**: $extract-intent.output.execution_mode\n\n      ## Original User Request\n      $ARGUMENTS\n\n      ## Archon Workflow YAML Schema Reference\n\n      A workflow YAML file has this structure:\n\n      ```yaml\n      name: workflow-name\n      description: |\n        Use when: ...\n        Triggers: ...\n        Does: ...\n        NOT for: ...\n\n      # Optional top-level settings:\n      # provider: claude    (or codex)\n      # model: sonnet       (or haiku, opus, etc.)\n      # interactive: true   (forces foreground execution in web UI)\n\n      nodes:\n        - id: node-id-kebab-case\n          # Choose ONE of: prompt, bash, command, script, loop, approval\n\n          # --- prompt node (AI-executed) ---\n          prompt: |\n            Instructions for the AI...\n          # Optional: model, allowed_tools, denied_tools, output_format, context, idle_timeout\n\n          # --- bash node (shell script, no AI, stdout = $<nodeId>.output) ---\n          bash: |\n            #!/bin/bash\n            set -e\n            echo \"result\"\n\n          # --- command node (references a .archon/commands/ file) ---\n          command: command-name\n\n          # --- script node (TypeScript via bun, or Python via uv — no AI, stdout = $<nodeId>.output) ---\n          # Use for deterministic data transforms the shell would mangle (JSON parsing, etc.)\n          script: |\n            // JSON is valid JS expression syntax — assign directly (String.raw breaks on backticks)\n            const data = $other-node.output;\n            console.log(JSON.stringify({ count: data.items.length }));\n          runtime: bun                       # required: 'bun' (.ts/.js) or 'uv' (.py)\n          # deps: [requests]                 # uv only\n          # Or reference a named script in .archon/scripts/:\n          # script: extract-labels           # no extension; bun resolves .ts/.js, uv resolves .py\n\n          # --- loop node (iterative AI execution) ---\n          loop:\n            prompt: |\n              Instructions repeated each iteration...\n            until: COMPLETION_SIGNAL\n            max_iterations: 10\n            fresh_context: true  # optional: reset context each iteration\n\n          # --- approval node (human gate — pauses workflow) ---\n          approval:\n            message: \"Review the plan above. Approve to continue.\"\n            # capture_response: true         # store reviewer comment as $<nodeId>.output\n\n          # Common options for all node types:\n          depends_on: [other-node-id]       # DAG edges\n          when: \"$<other-node>.output == 'value'\"  # conditional execution\n          trigger_rule: all_success          # all_success | one_success | all_done\n          timeout: 120000                    # ms, for bash and script nodes\n      ```\n\n      ## Variable Reference\n      - `$ARGUMENTS` — user's input text\n      - `$ARTIFACTS_DIR` — pre-created directory for workflow artifacts\n      - `$<nodeId>.output` — stdout from a bash/script node or AI response from a prompt node\n      - `$<nodeId>.output.field` — JSON field from a node with output_format\n      - `$BASE_BRANCH` — base git branch\n\n      ## Rules\n      1. The `name:` field MUST match: $extract-intent.output.workflow_name\n      2. The `description:` MUST follow the \"Use when / Triggers / Does / NOT for\" pattern\n      3. Every node MUST have a unique kebab-case `id`\n      4. Use `depends_on` to define execution order\n      5. Use `bash` nodes for deterministic shell operations (file checks, git commands, installs)\n      6. Use `script` nodes for typed data transforms (TypeScript JSON parsing, Python with deps)\n         — stdout is captured as output, stderr is forwarded as a warning.\n         $nodeId.output is NOT shell-quoted in script bodies.\n         - **TypeScript/bun**: assign directly — `const data = $nodeId.output;`\n           (JSON is valid JS expression syntax; avoid String.raw — it breaks on backticks)\n         - **Python/uv**: use json.loads — `import json; data = json.loads(\"\"\"$nodeId.output\"\"\")`\n         Never interpolate into shell syntax.\n      7. Use `prompt` nodes for AI reasoning tasks\n      8. Use `approval` nodes to pause for human review at risky gates (plan→execute boundary, destructive actions)\n      9. Use `output_format` on prompt nodes when downstream nodes need structured data\n      10. Use `allowed_tools: []` on classification/analysis nodes that don't need tools\n      11. Use `denied_tools: [Edit, Bash]` when a node should only use Write (not edit existing files)\n      12. Prefer `model: haiku` for simple classification tasks to save cost\n\n      ## Output\n\n      Write the complete workflow YAML to: `$ARTIFACTS_DIR/generated-workflow.yaml`\n\n      Use the Write tool. Do NOT use Edit or Bash. The file must be valid YAML and follow\n      all the patterns above.\n    denied_tools: [Edit, Bash]\n    depends_on: [extract-intent]\n\n  - id: validate-yaml\n    bash: |\n      FILE=\"$ARTIFACTS_DIR/generated-workflow.yaml\"\n\n      if [ ! -f \"$FILE\" ]; then\n        echo \"ERROR: generated-workflow.yaml not found at $FILE\"\n        exit 1\n      fi\n\n      if [ ! -s \"$FILE\" ]; then\n        echo \"ERROR: generated-workflow.yaml is empty\"\n        exit 1\n      fi\n\n      if ! grep -q \"^name:\" \"$FILE\"; then\n        echo \"ERROR: missing 'name:' field\"\n        exit 1\n      fi\n\n      if ! grep -q \"^nodes:\" \"$FILE\"; then\n        echo \"ERROR: missing 'nodes:' field\"\n        exit 1\n      fi\n\n      echo \"VALID\"\n    depends_on: [generate-yaml]\n\n  - id: save-or-report\n    prompt: |\n      You are a workflow installer. Save the generated workflow and report to the user.\n\n      ## Workflow Details\n      - **Name**: $extract-intent.output.workflow_name\n      - **Trigger Phrases**: $extract-intent.output.trigger_phrases\n\n      ## Instructions\n\n      1. Read the generated workflow from `$ARTIFACTS_DIR/generated-workflow.yaml`\n      2. Create the directory `.archon/workflows/` if it doesn't exist (use Bash: `mkdir -p .archon/workflows/`)\n      3. Save the workflow to `.archon/workflows/$extract-intent.output.workflow_name.yaml`\n         Use the Write tool to write the file.\n      4. Report to the user:\n         - Workflow name and file location\n         - Trigger phrases that will invoke it\n         - How to run it: `bun run cli workflow run $extract-intent.output.workflow_name \"your input\"`\n         - How to test it: `bun run cli validate workflows $extract-intent.output.workflow_name`\n    depends_on: [validate-yaml]\n",
+  "archon-workflow-builder": "name: archon-workflow-builder\ndescription: |\n  Use when: User wants to create a new custom workflow for their project.\n  Triggers: \"build me a workflow\", \"create a workflow\", \"generate a workflow\",\n            \"new workflow\", \"make a workflow for\", \"workflow builder\".\n  Does: Scans codebase -> extracts intent (JSON) -> generates YAML -> validates -> saves.\n  NOT for: Editing existing workflows or creating non-workflow files.\n\nnodes:\n  - id: scan-codebase\n    bash: |\n      echo \"=== Existing Commands ===\"\n      if [ -d \".archon/commands\" ]; then\n        find .archon/commands -type f -name \"*.md\" 2>/dev/null | head -30\n      else\n        echo \"(no .archon/commands/ directory)\"\n      fi\n\n      echo \"\"\n      echo \"=== Existing Workflows ===\"\n      if [ -d \".archon/workflows\" ]; then\n        find .archon/workflows -type f \\( -name \"*.yaml\" -o -name \"*.yml\" \\) 2>/dev/null | head -30\n      else\n        echo \"(no .archon/workflows/ directory)\"\n      fi\n\n      echo \"\"\n      echo \"=== Package Info ===\"\n      if [ -f \"package.json\" ]; then\n        grep -E '\"name\"|\"scripts\"' package.json | head -10\n      else\n        echo \"(no package.json)\"\n      fi\n\n      echo \"\"\n      echo \"=== Project Context (CLAUDE.md first 50 lines) ===\"\n      if [ -f \"CLAUDE.md\" ]; then\n        head -50 CLAUDE.md\n      else\n        echo \"(no CLAUDE.md)\"\n      fi\n\n  - id: extract-intent\n    prompt: |\n      You are a workflow design classifier. Given a user's description of what they want\n      a workflow to do, extract structured intent.\n\n      ## User's Request\n      $ARGUMENTS\n\n      ## Codebase Context\n      $scan-codebase.output\n\n      ## Instructions\n\n      Analyze the user's request and the existing codebase to determine:\n      1. A kebab-case workflow name (e.g., \"lint-and-test\", \"deploy-staging\")\n      2. A description following the Archon pattern (Use when / Triggers / Does / NOT for)\n      3. Trigger phrases the router should match\n      4. A list of proposed nodes with their types and purposes\n      5. Whether this should be a simple DAG or include a loop node\n\n      Be specific and concrete. Each proposed node should have a clear type\n      (bash, prompt, command, script, loop, or approval) and a one-line\n      description of what it does.\n    model: haiku\n    allowed_tools: []\n    output_format:\n      type: object\n      properties:\n        workflow_name:\n          type: string\n        description:\n          type: string\n        trigger_phrases:\n          type: string\n        proposed_nodes:\n          type: string\n        execution_mode:\n          type: string\n          enum: [\"dag\", \"loop\"]\n      required: [workflow_name, description, trigger_phrases, proposed_nodes, execution_mode]\n    depends_on: [scan-codebase]\n\n  - id: generate-yaml\n    prompt: |\n      You are an Archon workflow author. Generate a complete, valid workflow YAML file\n      based on the structured intent provided.\n\n      ## Intent\n      - **Name**: $extract-intent.output.workflow_name\n      - **Description**: $extract-intent.output.description\n      - **Trigger Phrases**: $extract-intent.output.trigger_phrases\n      - **Proposed Nodes**: $extract-intent.output.proposed_nodes\n      - **Execution Mode**: $extract-intent.output.execution_mode\n\n      ## Original User Request\n      $ARGUMENTS\n\n      ## Archon Workflow YAML Schema Reference\n\n      A workflow YAML file has this structure:\n\n      ```yaml\n      name: workflow-name\n      description: |\n        Use when: ...\n        Triggers: ...\n        Does: ...\n        NOT for: ...\n\n      # Optional top-level settings:\n      # provider: claude    (or codex)\n      # model: sonnet       (or haiku, opus, etc.)\n      # interactive: true   (forces foreground execution in web UI)\n\n      nodes:\n        - id: node-id-kebab-case\n          # Choose ONE of: prompt, bash, command, script, loop, approval\n\n          # --- prompt node (AI-executed) ---\n          prompt: |\n            Instructions for the AI...\n          # Optional: model, allowed_tools, denied_tools, output_format, context, idle_timeout\n\n          # --- bash node (shell script, no AI, stdout = $<nodeId>.output) ---\n          bash: |\n            #!/bin/bash\n            set -e\n            echo \"result\"\n\n          # --- command node (references a .archon/commands/ file) ---\n          command: command-name\n\n          # --- script node (TypeScript via bun, or Python via uv — no AI, stdout = $<nodeId>.output) ---\n          # Use for deterministic data transforms the shell would mangle (JSON parsing, etc.)\n          script: |\n            // JSON is valid JS expression syntax — assign directly (String.raw breaks on backticks)\n            const data = $other-node.output;\n            console.log(JSON.stringify({ count: data.items.length }));\n          runtime: bun                       # required: 'bun' (.ts/.js) or 'uv' (.py)\n          # deps: [requests]                 # uv only\n          # Or reference a named script in .archon/scripts/:\n          # script: extract-labels           # no extension; bun resolves .ts/.js, uv resolves .py\n\n          # --- loop node (iterative AI execution) ---\n          loop:\n            prompt: |\n              Instructions repeated each iteration...\n            until: COMPLETION_SIGNAL\n            max_iterations: 10\n            fresh_context: true  # optional: reset context each iteration\n\n          # --- approval node (human gate — pauses workflow) ---\n          approval:\n            message: \"Review the plan above. Approve to continue.\"\n            # capture_response: true         # store reviewer comment as $<nodeId>.output\n\n          # Common options for all node types:\n          depends_on: [other-node-id]       # DAG edges\n          when: \"$<other-node>.output == 'value'\"  # conditional execution\n          trigger_rule: all_success          # all_success | one_success | all_done\n          timeout: 120000                    # ms, for bash and script nodes\n      ```\n\n      ## Variable Reference\n      - `$ARGUMENTS` — user's input text\n      - `$ARTIFACTS_DIR` — pre-created directory for workflow artifacts\n      - `$<nodeId>.output` — stdout from a bash/script node or AI response from a prompt node\n      - `$<nodeId>.output.field` — JSON field from a node with output_format\n      - `$BASE_BRANCH` — base git branch\n\n      ## Rules\n      1. The `name:` field MUST match: $extract-intent.output.workflow_name\n      2. The `description:` MUST follow the \"Use when / Triggers / Does / NOT for\" pattern\n      3. Every node MUST have a unique kebab-case `id`\n      4. Use `depends_on` to define execution order\n      5. Use `bash` nodes for deterministic shell operations (file checks, git commands, installs)\n      6. Use `script` nodes for typed data transforms (TypeScript JSON parsing, Python with deps)\n         — stdout is captured as output, stderr is forwarded as a warning.\n         `$nodeId.output` is NOT shell-quoted in script bodies.\n         - **TypeScript/bun**: assign directly — `const data = $nodeId.output;`\n           (JSON is valid JS expression syntax; avoid String.raw — it breaks on backticks)\n         - **Python/uv**: use json.loads — `import json; data = json.loads(\"\"\"$nodeId.output\"\"\")`\n         Never interpolate into shell syntax.\n      7. Use `prompt` nodes for AI reasoning tasks\n      8. Use `approval` nodes to pause for human review at risky gates (plan→execute boundary, destructive actions)\n      9. Use `output_format` on prompt nodes when downstream nodes need structured data\n      10. Use `allowed_tools: []` on classification/analysis nodes that don't need tools\n      11. Use `denied_tools: [Edit, Bash]` when a node should only use Write (not edit existing files)\n      12. Prefer `model: haiku` for simple classification tasks to save cost\n\n      ## Output\n\n      Write the complete workflow YAML to: `$ARTIFACTS_DIR/generated-workflow.yaml`\n\n      Use the Write tool. Do NOT use Edit or Bash. The file must be valid YAML and follow\n      all the patterns above.\n    denied_tools: [Edit, Bash]\n    depends_on: [extract-intent]\n\n  - id: validate-yaml\n    bash: |\n      FILE=\"$ARTIFACTS_DIR/generated-workflow.yaml\"\n\n      if [ ! -f \"$FILE\" ]; then\n        echo \"ERROR: generated-workflow.yaml not found at $FILE\"\n        exit 1\n      fi\n\n      if [ ! -s \"$FILE\" ]; then\n        echo \"ERROR: generated-workflow.yaml is empty\"\n        exit 1\n      fi\n\n      if ! grep -q \"^name:\" \"$FILE\"; then\n        echo \"ERROR: missing 'name:' field\"\n        exit 1\n      fi\n\n      if ! grep -q \"^nodes:\" \"$FILE\"; then\n        echo \"ERROR: missing 'nodes:' field\"\n        exit 1\n      fi\n\n      echo \"VALID\"\n    depends_on: [generate-yaml]\n\n  - id: save-or-report\n    prompt: |\n      You are a workflow installer. Save the generated workflow and report to the user.\n\n      ## Workflow Details\n      - **Name**: $extract-intent.output.workflow_name\n      - **Trigger Phrases**: $extract-intent.output.trigger_phrases\n\n      ## Instructions\n\n      1. Read the generated workflow from `$ARTIFACTS_DIR/generated-workflow.yaml`\n      2. Create the directory `.archon/workflows/` if it doesn't exist (use Bash: `mkdir -p .archon/workflows/`)\n      3. Save the workflow to `.archon/workflows/$extract-intent.output.workflow_name.yaml`\n         Use the Write tool to write the file.\n      4. Report to the user:\n         - Workflow name and file location\n         - Trigger phrases that will invoke it\n         - How to run it: `bun run cli workflow run $extract-intent.output.workflow_name \"your input\"`\n         - How to test it: `bun run cli validate workflows $extract-intent.output.workflow_name`\n    depends_on: [validate-yaml]\n",
 };
diff --git a/packages/workflows/src/loader.test.ts b/packages/workflows/src/loader.test.ts
index 219670f6bf..a6fa599766 100644
--- a/packages/workflows/src/loader.test.ts
+++ b/packages/workflows/src/loader.test.ts
@@ -1777,6 +1777,117 @@ nodes:
       expect(result.errors).toHaveLength(0);
       expect(result.workflows).toHaveLength(1);
     });
+
+    it('should ignore $nodeId.output inside fenced code blocks in prompt: bodies', async () => {
+      // Prompt bodies often embed fenced documentation examples for the LLM
+      // (e.g. workflow-builder shows how to author a script node). The literal
+      // $other-node.output in such a fence is documentation, not a real ref.
+      const workflowDir = join(testDir, '.archon', 'workflows');
+      await mkdir(workflowDir, { recursive: true });
+
+      await writeFile(
+        join(workflowDir, 'fenced-doc.yaml'),
+        `
+name: fenced-doc
+description: Prompt body with a fenced code example mentioning a literal output ref
+nodes:
+  - id: writer
+    prompt: |
+      Author a workflow that uses a script node:
+
+      \`\`\`yaml
+      script: |
+        const data = $other-node.output;
+        console.log(data);
+      \`\`\`
+`
+      );
+
+      const result = await discoverWorkflows(testDir, { loadDefaults: false });
+      expect(result.errors).toHaveLength(0);
+      expect(result.workflows).toHaveLength(1);
+    });
+
+    it('should ignore $nodeId.output inside inline backtick code in prompt: bodies', async () => {
+      // Inline `code` mentions like \`$nodeId.output\` are also documentation.
+      const workflowDir = join(testDir, '.archon', 'workflows');
+      await mkdir(workflowDir, { recursive: true });
+
+      await writeFile(
+        join(workflowDir, 'inline-doc.yaml'),
+        `
+name: inline-doc
+description: Prompt body that mentions a placeholder via inline backticks
+nodes:
+  - id: writer
+    prompt: |
+      Use \`$nodeId.output\` to reference a sibling node's output.
+      For Python, prefer \`json.loads("""$nodeId.output""")\`.
+`
+      );
+
+      const result = await discoverWorkflows(testDir, { loadDefaults: false });
+      expect(result.errors).toHaveLength(0);
+      expect(result.workflows).toHaveLength(1);
+    });
+
+    it('should still reject unknown $nodeId.output refs outside code', async () => {
+      // Stripping fenced/inline code must not weaken validation of real refs
+      // that appear in prose outside any code marker.
+      const workflowDir = join(testDir, '.archon', 'workflows');
+      await mkdir(workflowDir, { recursive: true });
+
+      await writeFile(
+        join(workflowDir, 'mixed-ref.yaml'),
+        `
+name: mixed-ref
+description: Real (unknown) ref in prose plus a fenced doc example
+nodes:
+  - id: step1
+    prompt: |
+      Build on $missing-node.output to do the work.
+
+      Example:
+
+      \`\`\`
+      const x = $other-node.output;
+      \`\`\`
+`
+      );
+
+      const result = await discoverWorkflows(testDir, { loadDefaults: false });
+      expect(result.errors).toHaveLength(1);
+      expect(result.errors[0].error).toContain('missing-node');
+    });
+
+    it('should ignore $nodeId.output inside fenced code in loop.prompt', async () => {
+      // Loop prompts get the same documentation-stripping treatment as node prompts.
+      const workflowDir = join(testDir, '.archon', 'workflows');
+      await mkdir(workflowDir, { recursive: true });
+
+      await writeFile(
+        join(workflowDir, 'loop-fenced.yaml'),
+        `
+name: loop-fenced
+description: Loop with a fenced doc example in its prompt
+nodes:
+  - id: my-loop
+    loop:
+      prompt: |
+        Iterate. Example syntax:
+
+        \`\`\`
+        $other-node.output
+        \`\`\`
+      until: DONE
+      max_iterations: 3
+`
+      );
+
+      const result = await discoverWorkflows(testDir, { loadDefaults: false });
+      expect(result.errors).toHaveLength(0);
+      expect(result.workflows).toHaveLength(1);
+    });
   });
 
   describe('retry config parsing', () => {
diff --git a/packages/workflows/src/loader.ts b/packages/workflows/src/loader.ts
index 3109c680d7..2988f3134f 100644
--- a/packages/workflows/src/loader.ts
+++ b/packages/workflows/src/loader.ts
@@ -143,14 +143,25 @@ function validateDagStructure(nodes: DagNode[]): string | null {
     return `Cycle detected among nodes: ${cycleNodes.join(', ')}`;
   }
 
-  // Check $nodeId.output references in when: and prompt: fields
+  // Check $nodeId.output references in when: and prompt: fields.
+  // Triple-backtick fenced blocks and single-backtick inline code inside a
+  // prompt body are documentation meant to render literally to the LLM
+  // (e.g. the workflow-builder shows authors how to write
+  // `$<other-node>.output` inside a script-node example); strip them before
+  // scanning so they don't false-match as real cross-node references. when:
+  // clauses are JS-like expressions and never carry markdown code, so they
+  // pass through unchanged.
   const outputRefPattern = /\$([a-zA-Z_][a-zA-Z0-9_-]*)\.output/g;
+  const stripMarkdownCode = (s: string): string =>
+    s.replace(/```[\s\S]*?```/g, '').replace(/`[^`\n]*`/g, '');
   for (const node of nodes) {
     const sources: string[] = [];
     if (node.when) sources.push(node.when);
-    if ('prompt' in node && typeof node.prompt === 'string') sources.push(node.prompt);
+    if ('prompt' in node && typeof node.prompt === 'string') {
+      sources.push(stripMarkdownCode(node.prompt));
+    }
     if (isLoopNode(node)) {
-      sources.push(node.loop.prompt);
+      sources.push(stripMarkdownCode(node.loop.prompt));
     }
     for (const source of sources) {
       let m: RegExpExecArray | null;